diff --git "a/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" --- "a/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" +++ "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.2499, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 122858, "_timestamp": 1647497135, "_step": 17851, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 14.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 5.0, 4.0, 9.0, 18.0, 29525.0, 875.0, 16.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-172.125, -168.603515625, -165.08203125, -161.560546875, -158.0390625, -154.517578125, -150.99609375, -147.474609375, -143.953125, -140.431640625, -136.91015625, -133.388671875, -129.8671875, -126.345703125, -122.82421875, -119.302734375, -115.78125, -112.259765625, -108.73828125, -105.216796875, -101.6953125, -98.173828125, -94.65234375, -91.130859375, -87.609375, -84.087890625, -80.56640625, -77.044921875, -73.5234375, -70.001953125, -66.48046875, -62.958984375, -59.4375, -55.916015625, -52.39453125, -48.873046875, -45.3515625, -41.830078125, -38.30859375, -34.787109375, -31.265625, -27.744140625, -24.22265625, -20.701171875, -17.1796875, -13.658203125, -10.13671875, -6.615234375, -3.09375, 0.427734375, 3.94921875, 7.470703125, 10.9921875, 14.513671875, 18.03515625, 21.556640625, 25.078125, 28.599609375, 32.12109375, 35.642578125, 39.1640625, 42.685546875, 46.20703125, 49.728515625, 53.25]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 3.0, 3.0, 6.0, 8.0, 6.0, 5.0, 13.0, 13.0, 17.0, 19.0, 24.0, 24.0, 22.0, 21.0, 35.0, 37.0, 47.0, 27.0, 39.0, 42.0, 41.0, 58.0, 41.0, 38.0, 43.0, 42.0, 39.0, 39.0, 38.0, 29.0, 20.0, 24.0, 26.0, 15.0, 15.0, 13.0, 6.0, 10.0, 10.0, 4.0, 7.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-37.44131088256836, -36.594993591308594, -35.74867630004883, -34.90236282348633, -34.05604553222656, -33.2097282409668, -32.36341094970703, -31.5170955657959, -30.670780181884766, -29.824462890625, -28.978147506713867, -28.1318302154541, -27.28551483154297, -26.439197540283203, -25.592880249023438, -24.746564865112305, -23.90024757385254, -23.053930282592773, -22.20761489868164, -21.361297607421875, -20.514982223510742, -19.668664932250977, -18.822349548339844, -17.976032257080078, -17.129714965820312, -16.283397674560547, -15.437082290649414, -14.590764999389648, -13.744449615478516, -12.89813232421875, -12.0518159866333, -11.205499649047852, -10.359186172485352, -9.512869834899902, -8.666553497314453, -7.820236682891846, -6.9739203453063965, -6.127604007720947, -5.28128719329834, -4.434970855712891, -3.5886545181274414, -2.742338180541992, -1.8960216045379639, -1.0497050285339355, -0.20338869094848633, 0.6429276466369629, 1.4892444610595703, 2.3355607986450195, 3.1818771362304688, 4.028193473815918, 4.874509811401367, 5.720826625823975, 6.567142963409424, 7.413459300994873, 8.25977611541748, 9.10609245300293, 9.952408790588379, 10.798725128173828, 11.645041465759277, 12.491357803344727, 13.337675094604492, 14.183990478515625, 15.03030776977539, 15.87662410736084, 16.72294044494629]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 8.0, 6.0, 9.0, 6.0, 11.0, 9.0, 17.0, 14.0, 31.0, 26.0, 29.0, 23.0, 36.0, 51.0, 43.0, 34.0, 44.0, 50.0, 42.0, 32.0, 52.0, 35.0, 40.0, 48.0, 33.0, 29.0, 20.0, 31.0, 30.0, 16.0, 24.0, 27.0, 13.0, 17.0, 17.0, 10.0, 9.0, 4.0, 4.0, 8.0, 8.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.865875244140625, -26.000263214111328, -25.13465118408203, -24.269039154052734, -23.403425216674805, -22.537813186645508, -21.67220115661621, -20.806589126586914, -19.940975189208984, -19.075363159179688, -18.20975112915039, -17.344139099121094, -16.478525161743164, -15.612913131713867, -14.74730110168457, -13.881689071655273, -13.016077041625977, -12.15046501159668, -11.284852027893066, -10.41923999786377, -9.553627014160156, -8.68801498413086, -7.8224029541015625, -6.956790447235107, -6.091177940368652, -5.225565433502197, -4.359952926635742, -3.4943408966064453, -2.6287283897399902, -1.7631158828735352, -0.8975038528442383, -0.0318913459777832, 0.8337230682373047, 1.6993354558944702, 2.5649478435516357, 3.4305601119995117, 4.296172618865967, 5.161785125732422, 6.027397155761719, 6.893009662628174, 7.758622169494629, 8.624234199523926, 9.489847183227539, 10.355459213256836, 11.221071243286133, 12.086684226989746, 12.952296257019043, 13.817909240722656, 14.683521270751953, 15.54913330078125, 16.414745330810547, 17.280357360839844, 18.145971298217773, 19.01158332824707, 19.877195358276367, 20.742807388305664, 21.608421325683594, 22.47403335571289, 23.339645385742188, 24.205257415771484, 25.070871353149414, 25.93648338317871, 26.802095413208008, 27.667707443237305, 28.5333194732666]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 13.0, 11.0, 18.0, 35.0, 61.0, 87.0, 144.0, 236.0, 381.0, 558.0, 930.0, 1512.0, 2314.0, 3589.0, 5697.0, 8750.0, 12940.0, 19432.0, 27520.0, 38987.0, 51489.0, 67133.0, 81702.0, 94353.0, 120262.0, 107531.0, 91995.0, 79255.0, 64688.0, 50098.0, 37011.0, 26422.0, 18287.0, 12305.0, 8119.0, 5403.0, 3480.0, 2149.0, 1360.0, 858.0, 533.0, 316.0, 200.0, 140.0, 90.0, 56.0, 41.0, 28.0, 18.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.25, -85.396484375, -82.54296875, -79.689453125, -76.8359375, -73.982421875, -71.12890625, -68.275390625, -65.421875, -62.568359375, -59.71484375, -56.861328125, -54.0078125, -51.154296875, -48.30078125, -45.447265625, -42.59375, -39.740234375, -36.88671875, -34.033203125, -31.1796875, -28.326171875, -25.47265625, -22.619140625, -19.765625, -16.912109375, -14.05859375, -11.205078125, -8.3515625, -5.498046875, -2.64453125, 0.208984375, 3.0625, 5.916015625, 8.76953125, 11.623046875, 14.4765625, 17.330078125, 20.18359375, 23.037109375, 25.890625, 28.744140625, 31.59765625, 34.451171875, 37.3046875, 40.158203125, 43.01171875, 45.865234375, 48.71875, 51.572265625, 54.42578125, 57.279296875, 60.1328125, 62.986328125, 65.83984375, 68.693359375, 71.546875, 74.400390625, 77.25390625, 80.107421875, 82.9609375, 85.814453125, 88.66796875, 91.521484375, 94.375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 11.0, 6.0, 13.0, 20.0, 24.0, 14.0, 25.0, 33.0, 35.0, 52.0, 42.0, 43.0, 50.0, 43.0, 73.0, 84.0, 53.0, 57.0, 36.0, 45.0, 46.0, 32.0, 39.0, 16.0, 15.0, 17.0, 18.0, 13.0, 9.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5, -52.84619140625, -51.1923828125, -49.53857421875, -47.884765625, -46.23095703125, -44.5771484375, -42.92333984375, -41.26953125, -39.61572265625, -37.9619140625, -36.30810546875, -34.654296875, -33.00048828125, -31.3466796875, -29.69287109375, -28.0390625, -26.38525390625, -24.7314453125, -23.07763671875, -21.423828125, -19.77001953125, -18.1162109375, -16.46240234375, -14.80859375, -13.15478515625, -11.5009765625, -9.84716796875, -8.193359375, -6.53955078125, -4.8857421875, -3.23193359375, -1.578125, 0.07568359375, 1.7294921875, 3.38330078125, 5.037109375, 6.69091796875, 8.3447265625, 9.99853515625, 11.65234375, 13.30615234375, 14.9599609375, 16.61376953125, 18.267578125, 19.92138671875, 21.5751953125, 23.22900390625, 24.8828125, 26.53662109375, 28.1904296875, 29.84423828125, 31.498046875, 33.15185546875, 34.8056640625, 36.45947265625, 38.11328125, 39.76708984375, 41.4208984375, 43.07470703125, 44.728515625, 46.38232421875, 48.0361328125, 49.68994140625, 51.34375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 12.0, 5.0, 7.0, 4.0, 18.0, 19.0, 24.0, 31.0, 37.0, 40.0, 42.0, 53.0, 33.0, 37.0, 45.0, 41.0, 56.0, 48.0, 60.0, 46.0, 43.0, 32.0, 37.0, 29.0, 25.0, 29.0, 25.0, 17.0, 12.0, 21.0, 17.0, 12.0, 5.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.385425567626953, -25.43740463256836, -24.489383697509766, -23.541362762451172, -22.59334373474121, -21.645322799682617, -20.697301864624023, -19.74928092956543, -18.80126190185547, -17.853240966796875, -16.90522003173828, -15.957200050354004, -15.009180068969727, -14.061159133911133, -13.113138198852539, -12.165117263793945, -11.217096328735352, -10.269075393676758, -9.32105541229248, -8.373034477233887, -7.425014019012451, -6.476993560791016, -5.528972625732422, -4.580952167510986, -3.632931709289551, -2.6849112510681152, -1.7368905544281006, -0.7888698577880859, 0.1591506004333496, 1.1071710586547852, 2.055191993713379, 3.0032124519348145, 3.95123291015625, 4.8992533683776855, 5.847273826599121, 6.795294761657715, 7.74331521987915, 8.691335678100586, 9.63935661315918, 10.587377548217773, 11.53539752960205, 12.483418464660645, 13.431438446044922, 14.379459381103516, 15.32748031616211, 16.275501251220703, 17.223522186279297, 18.171541213989258, 19.11956214904785, 20.067583084106445, 21.01560401916504, 21.963623046875, 22.911643981933594, 23.859664916992188, 24.80768585205078, 25.755706787109375, 26.70372772216797, 27.651748657226562, 28.599769592285156, 29.54779052734375, 30.49580955505371, 31.443830490112305, 32.39185333251953, 33.33987045288086, 34.28789138793945]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 8.0, 10.0, 13.0, 15.0, 18.0, 18.0, 13.0, 19.0, 24.0, 17.0, 28.0, 28.0, 27.0, 33.0, 37.0, 38.0, 38.0, 34.0, 37.0, 29.0, 32.0, 34.0, 50.0, 35.0, 29.0, 39.0, 29.0, 23.0, 26.0, 23.0, 22.0, 25.0, 22.0, 16.0, 13.0, 16.0, 13.0, 13.0, 7.0, 3.0, 11.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.41060447692871, -23.645917892456055, -22.881229400634766, -22.11654281616211, -21.351856231689453, -20.587169647216797, -19.822481155395508, -19.05779457092285, -18.293106079101562, -17.528419494628906, -16.763731002807617, -15.999044418334961, -15.234357833862305, -14.469670295715332, -13.70498275756836, -12.940296173095703, -12.175609588623047, -11.410922050476074, -10.646235466003418, -9.881547927856445, -9.116861343383789, -8.352173805236816, -7.587486267089844, -6.822799205780029, -6.058112144470215, -5.2934250831604, -4.528738021850586, -3.7640504837036133, -2.999363422393799, -2.2346763610839844, -1.4699888229370117, -0.7053017616271973, 0.059383392333984375, 0.8240705728530884, 1.5887577533721924, 2.353445053100586, 3.1181321144104004, 3.882819175720215, 4.6475067138671875, 5.412193775177002, 6.176880836486816, 6.941567897796631, 7.706254959106445, 8.470942497253418, 9.23563003540039, 10.000316619873047, 10.76500415802002, 11.529691696166992, 12.294378280639648, 13.059065818786621, 13.823752403259277, 14.58843994140625, 15.353126525878906, 16.117813110351562, 16.88250160217285, 17.647188186645508, 18.411876678466797, 19.176563262939453, 19.941251754760742, 20.7059383392334, 21.470624923706055, 22.235313415527344, 23.0, 23.764686584472656, 24.529373168945312]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 3.0, 8.0, 18.0, 32.0, 34.0, 52.0, 100.0, 157.0, 221.0, 375.0, 630.0, 1037.0, 1504.0, 2432.0, 3798.0, 5961.0, 9766.0, 15600.0, 24875.0, 39892.0, 65460.0, 105003.0, 171497.0, 273961.0, 430752.0, 634959.0, 751476.0, 601193.0, 398115.0, 250380.0, 154641.0, 95080.0, 58549.0, 35874.0, 22552.0, 13783.0, 8724.0, 5604.0, 3651.0, 2317.0, 1469.0, 901.0, 638.0, 386.0, 280.0, 207.0, 125.0, 71.0, 59.0, 37.0, 16.0, 16.0, 6.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-41.5, -40.1357421875, -38.771484375, -37.4072265625, -36.04296875, -34.6787109375, -33.314453125, -31.9501953125, -30.5859375, -29.2216796875, -27.857421875, -26.4931640625, -25.12890625, -23.7646484375, -22.400390625, -21.0361328125, -19.671875, -18.3076171875, -16.943359375, -15.5791015625, -14.21484375, -12.8505859375, -11.486328125, -10.1220703125, -8.7578125, -7.3935546875, -6.029296875, -4.6650390625, -3.30078125, -1.9365234375, -0.572265625, 0.7919921875, 2.15625, 3.5205078125, 4.884765625, 6.2490234375, 7.61328125, 8.9775390625, 10.341796875, 11.7060546875, 13.0703125, 14.4345703125, 15.798828125, 17.1630859375, 18.52734375, 19.8916015625, 21.255859375, 22.6201171875, 23.984375, 25.3486328125, 26.712890625, 28.0771484375, 29.44140625, 30.8056640625, 32.169921875, 33.5341796875, 34.8984375, 36.2626953125, 37.626953125, 38.9912109375, 40.35546875, 41.7197265625, 43.083984375, 44.4482421875, 45.8125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 12.0, 10.0, 22.0, 13.0, 16.0, 19.0, 23.0, 22.0, 19.0, 30.0, 23.0, 24.0, 40.0, 30.0, 45.0, 34.0, 31.0, 31.0, 27.0, 42.0, 40.0, 39.0, 26.0, 39.0, 27.0, 32.0, 27.0, 14.0, 31.0, 22.0, 26.0, 12.0, 21.0, 16.0, 16.0, 12.0, 18.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.96875, -20.309326171875, -19.64990234375, -18.990478515625, -18.3310546875, -17.671630859375, -17.01220703125, -16.352783203125, -15.693359375, -15.033935546875, -14.37451171875, -13.715087890625, -13.0556640625, -12.396240234375, -11.73681640625, -11.077392578125, -10.41796875, -9.758544921875, -9.09912109375, -8.439697265625, -7.7802734375, -7.120849609375, -6.46142578125, -5.802001953125, -5.142578125, -4.483154296875, -3.82373046875, -3.164306640625, -2.5048828125, -1.845458984375, -1.18603515625, -0.526611328125, 0.1328125, 0.792236328125, 1.45166015625, 2.111083984375, 2.7705078125, 3.429931640625, 4.08935546875, 4.748779296875, 5.408203125, 6.067626953125, 6.72705078125, 7.386474609375, 8.0458984375, 8.705322265625, 9.36474609375, 10.024169921875, 10.68359375, 11.343017578125, 12.00244140625, 12.661865234375, 13.3212890625, 13.980712890625, 14.64013671875, 15.299560546875, 15.958984375, 16.618408203125, 17.27783203125, 17.937255859375, 18.5966796875, 19.256103515625, 19.91552734375, 20.574951171875, 21.234375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 11.0, 13.0, 5.0, 29.0, 44.0, 67.0, 103.0, 168.0, 251.0, 365.0, 604.0, 976.0, 1532.0, 2343.0, 3750.0, 5927.0, 9563.0, 14926.0, 23821.0, 37469.0, 59351.0, 92981.0, 144844.0, 219601.0, 324507.0, 455309.0, 581203.0, 610101.0, 505410.0, 370667.0, 255806.0, 169993.0, 110137.0, 70691.0, 45003.0, 28529.0, 17916.0, 11100.0, 7026.0, 4359.0, 2848.0, 1764.0, 1187.0, 706.0, 465.0, 323.0, 183.0, 115.0, 74.0, 50.0, 25.0, 18.0, 14.0, 14.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-27.90625, -27.039306640625, -26.17236328125, -25.305419921875, -24.4384765625, -23.571533203125, -22.70458984375, -21.837646484375, -20.970703125, -20.103759765625, -19.23681640625, -18.369873046875, -17.5029296875, -16.635986328125, -15.76904296875, -14.902099609375, -14.03515625, -13.168212890625, -12.30126953125, -11.434326171875, -10.5673828125, -9.700439453125, -8.83349609375, -7.966552734375, -7.099609375, -6.232666015625, -5.36572265625, -4.498779296875, -3.6318359375, -2.764892578125, -1.89794921875, -1.031005859375, -0.1640625, 0.702880859375, 1.56982421875, 2.436767578125, 3.3037109375, 4.170654296875, 5.03759765625, 5.904541015625, 6.771484375, 7.638427734375, 8.50537109375, 9.372314453125, 10.2392578125, 11.106201171875, 11.97314453125, 12.840087890625, 13.70703125, 14.573974609375, 15.44091796875, 16.307861328125, 17.1748046875, 18.041748046875, 18.90869140625, 19.775634765625, 20.642578125, 21.509521484375, 22.37646484375, 23.243408203125, 24.1103515625, 24.977294921875, 25.84423828125, 26.711181640625, 27.578125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 9.0, 10.0, 17.0, 17.0, 27.0, 30.0, 41.0, 40.0, 49.0, 75.0, 94.0, 122.0, 135.0, 163.0, 175.0, 177.0, 235.0, 248.0, 258.0, 237.0, 241.0, 216.0, 218.0, 181.0, 191.0, 135.0, 127.0, 99.0, 92.0, 64.0, 71.0, 49.0, 40.0, 40.0, 27.0, 22.0, 16.0, 26.0, 15.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.9765625, -11.58203125, -11.1875, -10.79296875, -10.3984375, -10.00390625, -9.609375, -9.21484375, -8.8203125, -8.42578125, -8.03125, -7.63671875, -7.2421875, -6.84765625, -6.453125, -6.05859375, -5.6640625, -5.26953125, -4.875, -4.48046875, -4.0859375, -3.69140625, -3.296875, -2.90234375, -2.5078125, -2.11328125, -1.71875, -1.32421875, -0.9296875, -0.53515625, -0.140625, 0.25390625, 0.6484375, 1.04296875, 1.4375, 1.83203125, 2.2265625, 2.62109375, 3.015625, 3.41015625, 3.8046875, 4.19921875, 4.59375, 4.98828125, 5.3828125, 5.77734375, 6.171875, 6.56640625, 6.9609375, 7.35546875, 7.75, 8.14453125, 8.5390625, 8.93359375, 9.328125, 9.72265625, 10.1171875, 10.51171875, 10.90625, 11.30078125, 11.6953125, 12.08984375, 12.484375, 12.87890625, 13.2734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 18.0, 21.0, 17.0, 31.0, 19.0, 31.0, 17.0, 35.0, 53.0, 36.0, 50.0, 47.0, 61.0, 61.0, 54.0, 60.0, 58.0, 47.0, 56.0, 32.0, 30.0, 31.0, 27.0, 18.0, 13.0, 15.0, 16.0, 11.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.50990104675293, -29.452804565429688, -28.395709991455078, -27.338613510131836, -26.281517028808594, -25.224422454833984, -24.167325973510742, -23.1102294921875, -22.05313491821289, -20.99603843688965, -19.93894386291504, -18.881847381591797, -17.824750900268555, -16.767654418945312, -15.710559844970703, -14.653463363647461, -13.596366882324219, -12.539271354675293, -11.48217487335205, -10.425079345703125, -9.367982864379883, -8.310887336730957, -7.253791809082031, -6.196695804595947, -5.139599800109863, -4.082503795623779, -3.0254080295562744, -1.9683122634887695, -0.9112162590026855, 0.14587974548339844, 1.2029752731323242, 2.260071277618408, 3.317169189453125, 4.374265193939209, 5.431361198425293, 6.488456726074219, 7.545552730560303, 8.602648735046387, 9.659744262695312, 10.716840744018555, 11.77393627166748, 12.831031799316406, 13.888128280639648, 14.945223808288574, 16.0023193359375, 17.059415817260742, 18.116512298583984, 19.173606872558594, 20.230703353881836, 21.287799835205078, 22.344894409179688, 23.40199089050293, 24.459087371826172, 25.51618194580078, 26.573278427124023, 27.630374908447266, 28.687469482421875, 29.744565963745117, 30.801660537719727, 31.85875701904297, 32.91585159301758, 33.97294998168945, 35.03004455566406, 36.08713912963867, 37.14423751831055]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 13.0, 7.0, 18.0, 20.0, 21.0, 21.0, 28.0, 26.0, 34.0, 36.0, 38.0, 40.0, 37.0, 38.0, 36.0, 39.0, 50.0, 46.0, 43.0, 31.0, 37.0, 35.0, 25.0, 25.0, 32.0, 29.0, 25.0, 31.0, 19.0, 22.0, 8.0, 17.0, 11.0, 7.0, 11.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.82933235168457, -25.998638153076172, -25.16794204711914, -24.337247848510742, -23.50655174255371, -22.675857543945312, -21.84516143798828, -21.014467239379883, -20.183773040771484, -19.353078842163086, -18.522382736206055, -17.691688537597656, -16.860992431640625, -16.030298233032227, -15.199603080749512, -14.368907928466797, -13.538211822509766, -12.70751667022705, -11.876821517944336, -11.046127319335938, -10.215431213378906, -9.384737014770508, -8.554041862487793, -7.723346710205078, -6.892651557922363, -6.061956405639648, -5.231261253356934, -4.400566577911377, -3.569871425628662, -2.7391762733459473, -1.9084815979003906, -1.0777864456176758, -0.24708938598632812, 0.5836056470870972, 1.4143006801605225, 2.244995594024658, 3.075690746307373, 3.906385898590088, 4.7370805740356445, 5.567775726318359, 6.398470878601074, 7.229166030883789, 8.059861183166504, 8.890556335449219, 9.721250534057617, 10.551946640014648, 11.382640838623047, 12.213335990905762, 13.044031143188477, 13.874726295471191, 14.705421447753906, 15.536115646362305, 16.366811752319336, 17.197505950927734, 18.028202056884766, 18.858896255493164, 19.689590454101562, 20.52028465270996, 21.350980758666992, 22.18167495727539, 23.012371063232422, 23.84306526184082, 24.67375946044922, 25.50445556640625, 26.33515167236328]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 17.0, 19.0, 31.0, 43.0, 77.0, 87.0, 147.0, 224.0, 339.0, 516.0, 854.0, 1359.0, 1890.0, 3049.0, 4505.0, 6896.0, 10347.0, 15084.0, 22622.0, 33123.0, 47921.0, 67835.0, 91363.0, 115509.0, 131494.0, 125950.0, 105654.0, 79613.0, 57718.0, 40394.0, 27504.0, 18776.0, 12876.0, 8414.0, 5651.0, 3673.0, 2466.0, 1545.0, 1020.0, 697.0, 445.0, 323.0, 165.0, 103.0, 83.0, 52.0, 31.0, 23.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-14.734375, -14.28466796875, -13.8349609375, -13.38525390625, -12.935546875, -12.48583984375, -12.0361328125, -11.58642578125, -11.13671875, -10.68701171875, -10.2373046875, -9.78759765625, -9.337890625, -8.88818359375, -8.4384765625, -7.98876953125, -7.5390625, -7.08935546875, -6.6396484375, -6.18994140625, -5.740234375, -5.29052734375, -4.8408203125, -4.39111328125, -3.94140625, -3.49169921875, -3.0419921875, -2.59228515625, -2.142578125, -1.69287109375, -1.2431640625, -0.79345703125, -0.34375, 0.10595703125, 0.5556640625, 1.00537109375, 1.455078125, 1.90478515625, 2.3544921875, 2.80419921875, 3.25390625, 3.70361328125, 4.1533203125, 4.60302734375, 5.052734375, 5.50244140625, 5.9521484375, 6.40185546875, 6.8515625, 7.30126953125, 7.7509765625, 8.20068359375, 8.650390625, 9.10009765625, 9.5498046875, 9.99951171875, 10.44921875, 10.89892578125, 11.3486328125, 11.79833984375, 12.248046875, 12.69775390625, 13.1474609375, 13.59716796875, 14.046875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 6.0, 6.0, 8.0, 10.0, 17.0, 17.0, 16.0, 17.0, 16.0, 29.0, 34.0, 41.0, 37.0, 37.0, 45.0, 36.0, 46.0, 47.0, 38.0, 53.0, 43.0, 36.0, 27.0, 32.0, 38.0, 27.0, 34.0, 34.0, 25.0, 23.0, 20.0, 27.0, 19.0, 12.0, 13.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.796875, -23.990478515625, -23.18408203125, -22.377685546875, -21.5712890625, -20.764892578125, -19.95849609375, -19.152099609375, -18.345703125, -17.539306640625, -16.73291015625, -15.926513671875, -15.1201171875, -14.313720703125, -13.50732421875, -12.700927734375, -11.89453125, -11.088134765625, -10.28173828125, -9.475341796875, -8.6689453125, -7.862548828125, -7.05615234375, -6.249755859375, -5.443359375, -4.636962890625, -3.83056640625, -3.024169921875, -2.2177734375, -1.411376953125, -0.60498046875, 0.201416015625, 1.0078125, 1.814208984375, 2.62060546875, 3.427001953125, 4.2333984375, 5.039794921875, 5.84619140625, 6.652587890625, 7.458984375, 8.265380859375, 9.07177734375, 9.878173828125, 10.6845703125, 11.490966796875, 12.29736328125, 13.103759765625, 13.91015625, 14.716552734375, 15.52294921875, 16.329345703125, 17.1357421875, 17.942138671875, 18.74853515625, 19.554931640625, 20.361328125, 21.167724609375, 21.97412109375, 22.780517578125, 23.5869140625, 24.393310546875, 25.19970703125, 26.006103515625, 26.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 9.0, 13.0, 11.0, 25.0, 23.0, 42.0, 65.0, 63.0, 132.0, 151.0, 209.0, 301.0, 444.0, 662.0, 951.0, 1321.0, 2091.0, 3223.0, 5351.0, 8662.0, 15274.0, 32503.0, 724323.0, 193773.0, 24985.0, 13108.0, 7510.0, 4683.0, 2910.0, 1873.0, 1240.0, 817.0, 555.0, 355.0, 261.0, 191.0, 125.0, 89.0, 66.0, 57.0, 39.0, 18.0, 19.0, 7.0, 8.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.0, -33.86572265625, -32.7314453125, -31.59716796875, -30.462890625, -29.32861328125, -28.1943359375, -27.06005859375, -25.92578125, -24.79150390625, -23.6572265625, -22.52294921875, -21.388671875, -20.25439453125, -19.1201171875, -17.98583984375, -16.8515625, -15.71728515625, -14.5830078125, -13.44873046875, -12.314453125, -11.18017578125, -10.0458984375, -8.91162109375, -7.77734375, -6.64306640625, -5.5087890625, -4.37451171875, -3.240234375, -2.10595703125, -0.9716796875, 0.16259765625, 1.296875, 2.43115234375, 3.5654296875, 4.69970703125, 5.833984375, 6.96826171875, 8.1025390625, 9.23681640625, 10.37109375, 11.50537109375, 12.6396484375, 13.77392578125, 14.908203125, 16.04248046875, 17.1767578125, 18.31103515625, 19.4453125, 20.57958984375, 21.7138671875, 22.84814453125, 23.982421875, 25.11669921875, 26.2509765625, 27.38525390625, 28.51953125, 29.65380859375, 30.7880859375, 31.92236328125, 33.056640625, 34.19091796875, 35.3251953125, 36.45947265625, 37.59375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 11.0, 8.0, 8.0, 12.0, 8.0, 18.0, 14.0, 27.0, 20.0, 30.0, 29.0, 36.0, 42.0, 52.0, 47.0, 54.0, 56.0, 60.0, 59.0, 48.0, 49.0, 39.0, 47.0, 37.0, 35.0, 26.0, 20.0, 24.0, 19.0, 14.0, 11.0, 7.0, 9.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.546630859375, -22.68701171875, -21.827392578125, -20.9677734375, -20.108154296875, -19.24853515625, -18.388916015625, -17.529296875, -16.669677734375, -15.81005859375, -14.950439453125, -14.0908203125, -13.231201171875, -12.37158203125, -11.511962890625, -10.65234375, -9.792724609375, -8.93310546875, -8.073486328125, -7.2138671875, -6.354248046875, -5.49462890625, -4.635009765625, -3.775390625, -2.915771484375, -2.05615234375, -1.196533203125, -0.3369140625, 0.522705078125, 1.38232421875, 2.241943359375, 3.1015625, 3.961181640625, 4.82080078125, 5.680419921875, 6.5400390625, 7.399658203125, 8.25927734375, 9.118896484375, 9.978515625, 10.838134765625, 11.69775390625, 12.557373046875, 13.4169921875, 14.276611328125, 15.13623046875, 15.995849609375, 16.85546875, 17.715087890625, 18.57470703125, 19.434326171875, 20.2939453125, 21.153564453125, 22.01318359375, 22.872802734375, 23.732421875, 24.592041015625, 25.45166015625, 26.311279296875, 27.1708984375, 28.030517578125, 28.89013671875, 29.749755859375, 30.609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 11.0, 4.0, 8.0, 6.0, 15.0, 19.0, 27.0, 33.0, 33.0, 78.0, 105.0, 175.0, 242.0, 429.0, 600.0, 998.0, 1839.0, 3163.0, 5787.0, 10821.0, 23013.0, 101112.0, 823349.0, 40568.0, 16720.0, 8463.0, 4579.0, 2451.0, 1461.0, 892.0, 486.0, 365.0, 230.0, 138.0, 95.0, 68.0, 54.0, 36.0, 29.0, 16.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4921875, -7.26019287109375, -7.0281982421875, -6.79620361328125, -6.564208984375, -6.33221435546875, -6.1002197265625, -5.86822509765625, -5.63623046875, -5.40423583984375, -5.1722412109375, -4.94024658203125, -4.708251953125, -4.47625732421875, -4.2442626953125, -4.01226806640625, -3.7802734375, -3.54827880859375, -3.3162841796875, -3.08428955078125, -2.852294921875, -2.62030029296875, -2.3883056640625, -2.15631103515625, -1.92431640625, -1.69232177734375, -1.4603271484375, -1.22833251953125, -0.996337890625, -0.76434326171875, -0.5323486328125, -0.30035400390625, -0.068359375, 0.16363525390625, 0.3956298828125, 0.62762451171875, 0.859619140625, 1.09161376953125, 1.3236083984375, 1.55560302734375, 1.78759765625, 2.01959228515625, 2.2515869140625, 2.48358154296875, 2.715576171875, 2.94757080078125, 3.1795654296875, 3.41156005859375, 3.6435546875, 3.87554931640625, 4.1075439453125, 4.33953857421875, 4.571533203125, 4.80352783203125, 5.0355224609375, 5.26751708984375, 5.49951171875, 5.73150634765625, 5.9635009765625, 6.19549560546875, 6.427490234375, 6.65948486328125, 6.8914794921875, 7.12347412109375, 7.35546875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 9.0, 9.0, 21.0, 21.0, 28.0, 38.0, 41.0, 59.0, 64.0, 75.0, 77.0, 91.0, 79.0, 68.0, 51.0, 39.0, 25.0, 30.0, 19.0, 18.0, 13.0, 17.0, 16.0, 9.0, 8.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009946823120117188, -0.0009636133909225464, -0.000932544469833374, -0.0009014755487442017, -0.0008704066276550293, -0.0008393377065658569, -0.0008082687854766846, -0.0007771998643875122, -0.0007461309432983398, -0.0007150620222091675, -0.0006839931011199951, -0.0006529241800308228, -0.0006218552589416504, -0.000590786337852478, -0.0005597174167633057, -0.0005286484956741333, -0.0004975795745849609, -0.0004665106534957886, -0.0004354417324066162, -0.00040437281131744385, -0.0003733038902282715, -0.0003422349691390991, -0.00031116604804992676, -0.0002800971269607544, -0.00024902820587158203, -0.00021795928478240967, -0.0001868903636932373, -0.00015582144260406494, -0.00012475252151489258, -9.368360042572021e-05, -6.261467933654785e-05, -3.154575824737549e-05, -4.76837158203125e-07, 3.059208393096924e-05, 6.16610050201416e-05, 9.272992610931396e-05, 0.00012379884719848633, 0.0001548677682876587, 0.00018593668937683105, 0.00021700561046600342, 0.0002480745315551758, 0.00027914345264434814, 0.0003102123737335205, 0.00034128129482269287, 0.00037235021591186523, 0.0004034191370010376, 0.00043448805809020996, 0.0004655569791793823, 0.0004966259002685547, 0.000527694821357727, 0.0005587637424468994, 0.0005898326635360718, 0.0006209015846252441, 0.0006519705057144165, 0.0006830394268035889, 0.0007141083478927612, 0.0007451772689819336, 0.000776246190071106, 0.0008073151111602783, 0.0008383840322494507, 0.000869452953338623, 0.0009005218744277954, 0.0009315907955169678, 0.0009626597166061401, 0.0009937286376953125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 15.0, 12.0, 25.0, 33.0, 47.0, 65.0, 79.0, 154.0, 198.0, 290.0, 414.0, 638.0, 1054.0, 1535.0, 2600.0, 4377.0, 7614.0, 13250.0, 24151.0, 43480.0, 76554.0, 126405.0, 180612.0, 194406.0, 149415.0, 94911.0, 55291.0, 30497.0, 16927.0, 9409.0, 5391.0, 3200.0, 1925.0, 1267.0, 785.0, 463.0, 332.0, 212.0, 143.0, 103.0, 76.0, 58.0, 33.0, 46.0, 26.0, 10.0, 5.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.77734375, -3.666900634765625, -3.55645751953125, -3.446014404296875, -3.3355712890625, -3.225128173828125, -3.11468505859375, -3.004241943359375, -2.893798828125, -2.783355712890625, -2.67291259765625, -2.562469482421875, -2.4520263671875, -2.341583251953125, -2.23114013671875, -2.120697021484375, -2.01025390625, -1.899810791015625, -1.78936767578125, -1.678924560546875, -1.5684814453125, -1.458038330078125, -1.34759521484375, -1.237152099609375, -1.126708984375, -1.016265869140625, -0.90582275390625, -0.795379638671875, -0.6849365234375, -0.574493408203125, -0.46405029296875, -0.353607177734375, -0.2431640625, -0.132720947265625, -0.02227783203125, 0.088165283203125, 0.1986083984375, 0.309051513671875, 0.41949462890625, 0.529937744140625, 0.640380859375, 0.750823974609375, 0.86126708984375, 0.971710205078125, 1.0821533203125, 1.192596435546875, 1.30303955078125, 1.413482666015625, 1.52392578125, 1.634368896484375, 1.74481201171875, 1.855255126953125, 1.9656982421875, 2.076141357421875, 2.18658447265625, 2.297027587890625, 2.407470703125, 2.517913818359375, 2.62835693359375, 2.738800048828125, 2.8492431640625, 2.959686279296875, 3.07012939453125, 3.180572509765625, 3.291015625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 7.0, 11.0, 12.0, 11.0, 9.0, 15.0, 25.0, 22.0, 25.0, 45.0, 58.0, 43.0, 64.0, 60.0, 53.0, 80.0, 55.0, 57.0, 61.0, 42.0, 40.0, 37.0, 35.0, 28.0, 24.0, 13.0, 10.0, 6.0, 6.0, 8.0, 13.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.41015625, -1.371368408203125, -1.33258056640625, -1.293792724609375, -1.2550048828125, -1.216217041015625, -1.17742919921875, -1.138641357421875, -1.099853515625, -1.061065673828125, -1.02227783203125, -0.983489990234375, -0.9447021484375, -0.905914306640625, -0.86712646484375, -0.828338623046875, -0.78955078125, -0.750762939453125, -0.71197509765625, -0.673187255859375, -0.6343994140625, -0.595611572265625, -0.55682373046875, -0.518035888671875, -0.479248046875, -0.440460205078125, -0.40167236328125, -0.362884521484375, -0.3240966796875, -0.285308837890625, -0.24652099609375, -0.207733154296875, -0.1689453125, -0.130157470703125, -0.09136962890625, -0.052581787109375, -0.0137939453125, 0.024993896484375, 0.06378173828125, 0.102569580078125, 0.141357421875, 0.180145263671875, 0.21893310546875, 0.257720947265625, 0.2965087890625, 0.335296630859375, 0.37408447265625, 0.412872314453125, 0.45166015625, 0.490447998046875, 0.52923583984375, 0.568023681640625, 0.6068115234375, 0.645599365234375, 0.68438720703125, 0.723175048828125, 0.761962890625, 0.800750732421875, 0.83953857421875, 0.878326416015625, 0.9171142578125, 0.955902099609375, 0.99468994140625, 1.033477783203125, 1.072265625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 13.0, 12.0, 23.0, 22.0, 21.0, 23.0, 31.0, 33.0, 35.0, 47.0, 45.0, 41.0, 44.0, 55.0, 58.0, 58.0, 50.0, 57.0, 52.0, 48.0, 33.0, 35.0, 25.0, 28.0, 28.0, 14.0, 11.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.869583129882812, -23.966888427734375, -23.064193725585938, -22.1614990234375, -21.258804321289062, -20.356109619140625, -19.453414916992188, -18.55072021484375, -17.648025512695312, -16.745330810546875, -15.842636108398438, -14.93994140625, -14.037246704101562, -13.134552001953125, -12.231856346130371, -11.329161643981934, -10.42646598815918, -9.523771286010742, -8.621076583862305, -7.718381404876709, -6.8156867027282715, -5.912992000579834, -5.010296821594238, -4.107602119445801, -3.2049074172973633, -2.302212715148926, -1.3995177745819092, -0.4968228340148926, 0.4058718681335449, 1.3085665702819824, 2.211261749267578, 3.1139564514160156, 4.016651153564453, 4.919345855712891, 5.822040557861328, 6.724735736846924, 7.627430438995361, 8.53012466430664, 9.432820320129395, 10.335515022277832, 11.23820972442627, 12.140904426574707, 13.043599128723145, 13.946294784545898, 14.848989486694336, 15.751684188842773, 16.65437889099121, 17.55707359313965, 18.459768295288086, 19.362462997436523, 20.26515769958496, 21.1678524017334, 22.070547103881836, 22.973241806030273, 23.875938415527344, 24.77863311767578, 25.68132781982422, 26.584022521972656, 27.486717224121094, 28.38941192626953, 29.29210662841797, 30.194801330566406, 31.097496032714844, 32.00019073486328, 32.90288543701172]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 16.0, 9.0, 16.0, 19.0, 20.0, 17.0, 25.0, 26.0, 28.0, 37.0, 38.0, 37.0, 38.0, 51.0, 28.0, 45.0, 54.0, 42.0, 35.0, 42.0, 28.0, 34.0, 30.0, 32.0, 30.0, 27.0, 28.0, 31.0, 20.0, 13.0, 15.0, 27.0, 9.0, 6.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.204423904418945, -22.469974517822266, -21.735523223876953, -21.001073837280273, -20.26662254333496, -19.53217315673828, -18.79772186279297, -18.06327247619629, -17.32882308959961, -16.59437370300293, -15.859922409057617, -15.125473022460938, -14.391021728515625, -13.656572341918945, -12.92212200164795, -12.187671661376953, -11.45322036743164, -10.718770027160645, -9.984319686889648, -9.249870300292969, -8.515419006347656, -7.780969142913818, -7.0465192794799805, -6.312068939208984, -5.577618598937988, -4.843168258666992, -4.108717918395996, -3.374268054962158, -2.639817714691162, -1.905367374420166, -1.1709175109863281, -0.43646717071533203, 0.29798126220703125, 1.0324314832687378, 1.7668817043304443, 2.5013318061828613, 3.2357821464538574, 3.9702324867248535, 4.704682350158691, 5.4391326904296875, 6.173583030700684, 6.90803337097168, 7.642483711242676, 8.376934051513672, 9.111383438110352, 9.845834732055664, 10.580284118652344, 11.31473445892334, 12.049184799194336, 12.783635139465332, 13.518085479736328, 14.252534866333008, 14.98698616027832, 15.721435546875, 16.455886840820312, 17.190336227416992, 17.924785614013672, 18.65923500061035, 19.393686294555664, 20.128135681152344, 20.862586975097656, 21.597036361694336, 22.331485748291016, 23.065937042236328, 23.80038833618164]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 29.0, 37.0, 55.0, 95.0, 143.0, 237.0, 337.0, 530.0, 878.0, 1337.0, 1948.0, 3210.0, 4837.0, 7632.0, 11890.0, 18504.0, 27989.0, 41775.0, 59828.0, 82951.0, 106070.0, 122432.0, 126501.0, 115354.0, 94807.0, 70614.0, 50169.0, 33781.0, 22892.0, 14855.0, 9762.0, 5968.0, 3870.0, 2534.0, 1672.0, 1084.0, 669.0, 425.0, 291.0, 188.0, 118.0, 74.0, 49.0, 37.0, 29.0, 10.0, 9.0, 4.0, 8.0, 4.0, 1.0, 3.0, 3.0], "bins": [-28.765625, -27.900390625, -27.03515625, -26.169921875, -25.3046875, -24.439453125, -23.57421875, -22.708984375, -21.84375, -20.978515625, -20.11328125, -19.248046875, -18.3828125, -17.517578125, -16.65234375, -15.787109375, -14.921875, -14.056640625, -13.19140625, -12.326171875, -11.4609375, -10.595703125, -9.73046875, -8.865234375, -8.0, -7.134765625, -6.26953125, -5.404296875, -4.5390625, -3.673828125, -2.80859375, -1.943359375, -1.078125, -0.212890625, 0.65234375, 1.517578125, 2.3828125, 3.248046875, 4.11328125, 4.978515625, 5.84375, 6.708984375, 7.57421875, 8.439453125, 9.3046875, 10.169921875, 11.03515625, 11.900390625, 12.765625, 13.630859375, 14.49609375, 15.361328125, 16.2265625, 17.091796875, 17.95703125, 18.822265625, 19.6875, 20.552734375, 21.41796875, 22.283203125, 23.1484375, 24.013671875, 24.87890625, 25.744140625, 26.609375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 8.0, 10.0, 18.0, 7.0, 14.0, 19.0, 24.0, 20.0, 20.0, 38.0, 31.0, 33.0, 28.0, 38.0, 33.0, 46.0, 50.0, 28.0, 47.0, 31.0, 32.0, 43.0, 42.0, 43.0, 36.0, 27.0, 32.0, 19.0, 23.0, 27.0, 21.0, 15.0, 20.0, 17.0, 9.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.098876953125, -20.40087890625, -19.702880859375, -19.0048828125, -18.306884765625, -17.60888671875, -16.910888671875, -16.212890625, -15.514892578125, -14.81689453125, -14.118896484375, -13.4208984375, -12.722900390625, -12.02490234375, -11.326904296875, -10.62890625, -9.930908203125, -9.23291015625, -8.534912109375, -7.8369140625, -7.138916015625, -6.44091796875, -5.742919921875, -5.044921875, -4.346923828125, -3.64892578125, -2.950927734375, -2.2529296875, -1.554931640625, -0.85693359375, -0.158935546875, 0.5390625, 1.237060546875, 1.93505859375, 2.633056640625, 3.3310546875, 4.029052734375, 4.72705078125, 5.425048828125, 6.123046875, 6.821044921875, 7.51904296875, 8.217041015625, 8.9150390625, 9.613037109375, 10.31103515625, 11.009033203125, 11.70703125, 12.405029296875, 13.10302734375, 13.801025390625, 14.4990234375, 15.197021484375, 15.89501953125, 16.593017578125, 17.291015625, 17.989013671875, 18.68701171875, 19.385009765625, 20.0830078125, 20.781005859375, 21.47900390625, 22.177001953125, 22.875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 20.0, 14.0, 23.0, 28.0, 53.0, 82.0, 136.0, 217.0, 325.0, 487.0, 781.0, 1177.0, 1777.0, 2847.0, 4137.0, 6166.0, 9528.0, 13520.0, 19323.0, 27671.0, 38352.0, 50891.0, 65814.0, 80844.0, 93688.0, 101429.0, 102982.0, 94082.0, 82344.0, 66949.0, 52426.0, 39184.0, 28400.0, 20232.0, 14013.0, 9541.0, 6513.0, 4295.0, 2852.0, 1847.0, 1222.0, 848.0, 544.0, 329.0, 211.0, 149.0, 81.0, 76.0, 42.0, 29.0, 17.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-22.859375, -22.14599609375, -21.4326171875, -20.71923828125, -20.005859375, -19.29248046875, -18.5791015625, -17.86572265625, -17.15234375, -16.43896484375, -15.7255859375, -15.01220703125, -14.298828125, -13.58544921875, -12.8720703125, -12.15869140625, -11.4453125, -10.73193359375, -10.0185546875, -9.30517578125, -8.591796875, -7.87841796875, -7.1650390625, -6.45166015625, -5.73828125, -5.02490234375, -4.3115234375, -3.59814453125, -2.884765625, -2.17138671875, -1.4580078125, -0.74462890625, -0.03125, 0.68212890625, 1.3955078125, 2.10888671875, 2.822265625, 3.53564453125, 4.2490234375, 4.96240234375, 5.67578125, 6.38916015625, 7.1025390625, 7.81591796875, 8.529296875, 9.24267578125, 9.9560546875, 10.66943359375, 11.3828125, 12.09619140625, 12.8095703125, 13.52294921875, 14.236328125, 14.94970703125, 15.6630859375, 16.37646484375, 17.08984375, 17.80322265625, 18.5166015625, 19.22998046875, 19.943359375, 20.65673828125, 21.3701171875, 22.08349609375, 22.796875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 16.0, 13.0, 17.0, 19.0, 25.0, 26.0, 22.0, 32.0, 31.0, 30.0, 33.0, 31.0, 35.0, 37.0, 47.0, 47.0, 30.0, 43.0, 41.0, 31.0, 35.0, 45.0, 32.0, 32.0, 34.0, 37.0, 32.0, 30.0, 16.0, 9.0, 16.0, 15.0, 9.0, 7.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.593505859375, -16.12451171875, -15.655517578125, -15.1865234375, -14.717529296875, -14.24853515625, -13.779541015625, -13.310546875, -12.841552734375, -12.37255859375, -11.903564453125, -11.4345703125, -10.965576171875, -10.49658203125, -10.027587890625, -9.55859375, -9.089599609375, -8.62060546875, -8.151611328125, -7.6826171875, -7.213623046875, -6.74462890625, -6.275634765625, -5.806640625, -5.337646484375, -4.86865234375, -4.399658203125, -3.9306640625, -3.461669921875, -2.99267578125, -2.523681640625, -2.0546875, -1.585693359375, -1.11669921875, -0.647705078125, -0.1787109375, 0.290283203125, 0.75927734375, 1.228271484375, 1.697265625, 2.166259765625, 2.63525390625, 3.104248046875, 3.5732421875, 4.042236328125, 4.51123046875, 4.980224609375, 5.44921875, 5.918212890625, 6.38720703125, 6.856201171875, 7.3251953125, 7.794189453125, 8.26318359375, 8.732177734375, 9.201171875, 9.670166015625, 10.13916015625, 10.608154296875, 11.0771484375, 11.546142578125, 12.01513671875, 12.484130859375, 12.953125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 18.0, 20.0, 35.0, 53.0, 81.0, 109.0, 199.0, 256.0, 436.0, 651.0, 1161.0, 2046.0, 3313.0, 5582.0, 9923.0, 17664.0, 31659.0, 56208.0, 95968.0, 149091.0, 189343.0, 176799.0, 127086.0, 77757.0, 44498.0, 25192.0, 14065.0, 7982.0, 4674.0, 2666.0, 1576.0, 896.0, 547.0, 373.0, 204.0, 133.0, 87.0, 56.0, 35.0, 35.0, 19.0, 17.0, 11.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.640625, -13.2247314453125, -12.808837890625, -12.3929443359375, -11.97705078125, -11.5611572265625, -11.145263671875, -10.7293701171875, -10.3134765625, -9.8975830078125, -9.481689453125, -9.0657958984375, -8.64990234375, -8.2340087890625, -7.818115234375, -7.4022216796875, -6.986328125, -6.5704345703125, -6.154541015625, -5.7386474609375, -5.32275390625, -4.9068603515625, -4.490966796875, -4.0750732421875, -3.6591796875, -3.2432861328125, -2.827392578125, -2.4114990234375, -1.99560546875, -1.5797119140625, -1.163818359375, -0.7479248046875, -0.33203125, 0.0838623046875, 0.499755859375, 0.9156494140625, 1.33154296875, 1.7474365234375, 2.163330078125, 2.5792236328125, 2.9951171875, 3.4110107421875, 3.826904296875, 4.2427978515625, 4.65869140625, 5.0745849609375, 5.490478515625, 5.9063720703125, 6.322265625, 6.7381591796875, 7.154052734375, 7.5699462890625, 7.98583984375, 8.4017333984375, 8.817626953125, 9.2335205078125, 9.6494140625, 10.0653076171875, 10.481201171875, 10.8970947265625, 11.31298828125, 11.7288818359375, 12.144775390625, 12.5606689453125, 12.9765625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 8.0, 12.0, 10.0, 22.0, 25.0, 18.0, 43.0, 42.0, 48.0, 58.0, 71.0, 82.0, 87.0, 63.0, 80.0, 60.0, 62.0, 34.0, 39.0, 21.0, 31.0, 15.0, 10.0, 9.0, 7.0, 8.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00180816650390625, -0.0017583668231964111, -0.0017085671424865723, -0.0016587674617767334, -0.0016089677810668945, -0.0015591681003570557, -0.0015093684196472168, -0.001459568738937378, -0.001409769058227539, -0.0013599693775177002, -0.0013101696968078613, -0.0012603700160980225, -0.0012105703353881836, -0.0011607706546783447, -0.0011109709739685059, -0.001061171293258667, -0.0010113716125488281, -0.0009615719318389893, -0.0009117722511291504, -0.0008619725704193115, -0.0008121728897094727, -0.0007623732089996338, -0.0007125735282897949, -0.0006627738475799561, -0.0006129741668701172, -0.0005631744861602783, -0.0005133748054504395, -0.0004635751247406006, -0.0004137754440307617, -0.00036397576332092285, -0.000314176082611084, -0.0002643764019012451, -0.00021457672119140625, -0.00016477704048156738, -0.00011497735977172852, -6.517767906188965e-05, -1.537799835205078e-05, 3.4421682357788086e-05, 8.422136306762695e-05, 0.00013402104377746582, 0.0001838207244873047, 0.00023362040519714355, 0.0002834200859069824, 0.0003332197666168213, 0.00038301944732666016, 0.000432819128036499, 0.0004826188087463379, 0.0005324184894561768, 0.0005822181701660156, 0.0006320178508758545, 0.0006818175315856934, 0.0007316172122955322, 0.0007814168930053711, 0.00083121657371521, 0.0008810162544250488, 0.0009308159351348877, 0.0009806156158447266, 0.0010304152965545654, 0.0010802149772644043, 0.0011300146579742432, 0.001179814338684082, 0.001229614019393921, 0.0012794137001037598, 0.0013292133808135986, 0.0013790130615234375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 11.0, 22.0, 19.0, 38.0, 54.0, 88.0, 121.0, 197.0, 305.0, 521.0, 856.0, 1473.0, 2468.0, 4160.0, 7301.0, 12294.0, 21399.0, 36063.0, 59802.0, 94490.0, 133180.0, 161283.0, 158612.0, 127981.0, 88716.0, 56004.0, 33810.0, 19544.0, 11599.0, 6604.0, 3877.0, 2228.0, 1337.0, 824.0, 477.0, 269.0, 183.0, 125.0, 60.0, 39.0, 32.0, 26.0, 13.0, 17.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.2578125, -9.9365234375, -9.615234375, -9.2939453125, -8.97265625, -8.6513671875, -8.330078125, -8.0087890625, -7.6875, -7.3662109375, -7.044921875, -6.7236328125, -6.40234375, -6.0810546875, -5.759765625, -5.4384765625, -5.1171875, -4.7958984375, -4.474609375, -4.1533203125, -3.83203125, -3.5107421875, -3.189453125, -2.8681640625, -2.546875, -2.2255859375, -1.904296875, -1.5830078125, -1.26171875, -0.9404296875, -0.619140625, -0.2978515625, 0.0234375, 0.3447265625, 0.666015625, 0.9873046875, 1.30859375, 1.6298828125, 1.951171875, 2.2724609375, 2.59375, 2.9150390625, 3.236328125, 3.5576171875, 3.87890625, 4.2001953125, 4.521484375, 4.8427734375, 5.1640625, 5.4853515625, 5.806640625, 6.1279296875, 6.44921875, 6.7705078125, 7.091796875, 7.4130859375, 7.734375, 8.0556640625, 8.376953125, 8.6982421875, 9.01953125, 9.3408203125, 9.662109375, 9.9833984375, 10.3046875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 12.0, 9.0, 11.0, 17.0, 18.0, 26.0, 18.0, 41.0, 45.0, 52.0, 66.0, 63.0, 75.0, 57.0, 65.0, 56.0, 74.0, 63.0, 44.0, 32.0, 35.0, 22.0, 24.0, 13.0, 16.0, 14.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8828125, -3.74700927734375, -3.6112060546875, -3.47540283203125, -3.339599609375, -3.20379638671875, -3.0679931640625, -2.93218994140625, -2.79638671875, -2.66058349609375, -2.5247802734375, -2.38897705078125, -2.253173828125, -2.11737060546875, -1.9815673828125, -1.84576416015625, -1.7099609375, -1.57415771484375, -1.4383544921875, -1.30255126953125, -1.166748046875, -1.03094482421875, -0.8951416015625, -0.75933837890625, -0.62353515625, -0.48773193359375, -0.3519287109375, -0.21612548828125, -0.080322265625, 0.05548095703125, 0.1912841796875, 0.32708740234375, 0.462890625, 0.59869384765625, 0.7344970703125, 0.87030029296875, 1.006103515625, 1.14190673828125, 1.2777099609375, 1.41351318359375, 1.54931640625, 1.68511962890625, 1.8209228515625, 1.95672607421875, 2.092529296875, 2.22833251953125, 2.3641357421875, 2.49993896484375, 2.6357421875, 2.77154541015625, 2.9073486328125, 3.04315185546875, 3.178955078125, 3.31475830078125, 3.4505615234375, 3.58636474609375, 3.72216796875, 3.85797119140625, 3.9937744140625, 4.12957763671875, 4.265380859375, 4.40118408203125, 4.5369873046875, 4.67279052734375, 4.80859375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 7.0, 13.0, 3.0, 12.0, 16.0, 29.0, 30.0, 30.0, 37.0, 56.0, 44.0, 39.0, 63.0, 57.0, 67.0, 43.0, 37.0, 50.0, 53.0, 44.0, 45.0, 40.0, 38.0, 39.0, 23.0, 12.0, 16.0, 14.0, 5.0, 4.0, 8.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.73617935180664, -25.854040145874023, -24.971899032592773, -24.089759826660156, -23.20762062072754, -22.325481414794922, -21.443340301513672, -20.561201095581055, -19.679061889648438, -18.79692268371582, -17.91478157043457, -17.032642364501953, -16.150503158569336, -15.268362998962402, -14.386222839355469, -13.504083633422852, -12.621942520141602, -11.739802360534668, -10.85766315460205, -9.975522994995117, -9.0933837890625, -8.211243629455566, -7.329103469848633, -6.446963787078857, -5.564824104309082, -4.682684421539307, -3.800544500350952, -2.9184045791625977, -2.0362648963928223, -1.1541252136230469, -0.2719850540161133, 0.6101546287536621, 1.4922924041748047, 2.37443208694458, 3.2565720081329346, 4.138711929321289, 5.0208516120910645, 5.90299129486084, 6.785131454467773, 7.667271137237549, 8.549410820007324, 9.431550979614258, 10.313690185546875, 11.195830345153809, 12.077970504760742, 12.96010971069336, 13.842249870300293, 14.724390029907227, 15.606529235839844, 16.48866844177246, 17.37080955505371, 18.252948760986328, 19.135087966918945, 20.017227172851562, 20.899368286132812, 21.78150749206543, 22.663646697998047, 23.545785903930664, 24.427927017211914, 25.31006622314453, 26.19220542907715, 27.074344635009766, 27.956485748291016, 28.838624954223633, 29.720766067504883]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 2.0, 11.0, 8.0, 8.0, 11.0, 10.0, 14.0, 7.0, 17.0, 18.0, 25.0, 19.0, 31.0, 22.0, 38.0, 36.0, 40.0, 38.0, 32.0, 51.0, 37.0, 34.0, 38.0, 48.0, 42.0, 32.0, 35.0, 33.0, 21.0, 32.0, 29.0, 23.0, 16.0, 23.0, 14.0, 15.0, 12.0, 13.0, 8.0, 15.0, 11.0, 5.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-24.233980178833008, -23.551773071289062, -22.869565963745117, -22.187358856201172, -21.505151748657227, -20.82294464111328, -20.14073944091797, -19.45853042602539, -18.776325225830078, -18.094118118286133, -17.411911010742188, -16.729703903198242, -16.047496795654297, -15.365289688110352, -14.683083534240723, -14.000876426696777, -13.318668365478516, -12.63646125793457, -11.954254150390625, -11.27204704284668, -10.589839935302734, -9.907632827758789, -9.22542667388916, -8.543219566345215, -7.8610124588012695, -7.178805351257324, -6.496598243713379, -5.814391613006592, -5.1321845054626465, -4.449977397918701, -3.767770767211914, -3.0855636596679688, -2.4033584594726562, -1.7211514711380005, -1.0389444828033447, -0.3567376136779785, 0.3254694938659668, 1.007676601409912, 1.6898832321166992, 2.3720903396606445, 3.05429744720459, 3.736504554748535, 4.4187116622924805, 5.100918292999268, 5.783125400543213, 6.465332508087158, 7.147539138793945, 7.829746246337891, 8.511953353881836, 9.194160461425781, 9.876367568969727, 10.558574676513672, 11.240781784057617, 11.922988891601562, 12.605195045471191, 13.287402153015137, 13.969609260559082, 14.651816368103027, 15.334023475646973, 16.0162296295166, 16.698436737060547, 17.380643844604492, 18.062850952148438, 18.745058059692383, 19.427265167236328]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 16.0, 20.0, 39.0, 60.0, 95.0, 133.0, 200.0, 294.0, 509.0, 811.0, 1348.0, 2261.0, 3855.0, 6811.0, 11720.0, 21053.0, 39053.0, 73023.0, 141012.0, 273685.0, 518285.0, 843565.0, 919731.0, 625401.0, 338054.0, 174321.0, 91071.0, 47567.0, 25884.0, 14245.0, 8200.0, 4815.0, 2782.0, 1713.0, 1011.0, 617.0, 371.0, 243.0, 140.0, 107.0, 58.0, 35.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.390625, -26.482421875, -25.57421875, -24.666015625, -23.7578125, -22.849609375, -21.94140625, -21.033203125, -20.125, -19.216796875, -18.30859375, -17.400390625, -16.4921875, -15.583984375, -14.67578125, -13.767578125, -12.859375, -11.951171875, -11.04296875, -10.134765625, -9.2265625, -8.318359375, -7.41015625, -6.501953125, -5.59375, -4.685546875, -3.77734375, -2.869140625, -1.9609375, -1.052734375, -0.14453125, 0.763671875, 1.671875, 2.580078125, 3.48828125, 4.396484375, 5.3046875, 6.212890625, 7.12109375, 8.029296875, 8.9375, 9.845703125, 10.75390625, 11.662109375, 12.5703125, 13.478515625, 14.38671875, 15.294921875, 16.203125, 17.111328125, 18.01953125, 18.927734375, 19.8359375, 20.744140625, 21.65234375, 22.560546875, 23.46875, 24.376953125, 25.28515625, 26.193359375, 27.1015625, 28.009765625, 28.91796875, 29.826171875, 30.734375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 9.0, 7.0, 9.0, 10.0, 9.0, 13.0, 11.0, 14.0, 17.0, 21.0, 21.0, 28.0, 37.0, 42.0, 32.0, 21.0, 35.0, 46.0, 41.0, 42.0, 35.0, 44.0, 39.0, 38.0, 36.0, 42.0, 31.0, 26.0, 26.0, 32.0, 24.0, 23.0, 12.0, 13.0, 15.0, 21.0, 11.0, 11.0, 10.0, 6.0, 6.0, 12.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.984375, -16.462158203125, -15.93994140625, -15.417724609375, -14.8955078125, -14.373291015625, -13.85107421875, -13.328857421875, -12.806640625, -12.284423828125, -11.76220703125, -11.239990234375, -10.7177734375, -10.195556640625, -9.67333984375, -9.151123046875, -8.62890625, -8.106689453125, -7.58447265625, -7.062255859375, -6.5400390625, -6.017822265625, -5.49560546875, -4.973388671875, -4.451171875, -3.928955078125, -3.40673828125, -2.884521484375, -2.3623046875, -1.840087890625, -1.31787109375, -0.795654296875, -0.2734375, 0.248779296875, 0.77099609375, 1.293212890625, 1.8154296875, 2.337646484375, 2.85986328125, 3.382080078125, 3.904296875, 4.426513671875, 4.94873046875, 5.470947265625, 5.9931640625, 6.515380859375, 7.03759765625, 7.559814453125, 8.08203125, 8.604248046875, 9.12646484375, 9.648681640625, 10.1708984375, 10.693115234375, 11.21533203125, 11.737548828125, 12.259765625, 12.781982421875, 13.30419921875, 13.826416015625, 14.3486328125, 14.870849609375, 15.39306640625, 15.915283203125, 16.4375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 9.0, 22.0, 35.0, 63.0, 99.0, 146.0, 227.0, 345.0, 562.0, 889.0, 1380.0, 2238.0, 3472.0, 5520.0, 8517.0, 13684.0, 21011.0, 33408.0, 52339.0, 82529.0, 127678.0, 196691.0, 295586.0, 423378.0, 556947.0, 618748.0, 542010.0, 405500.0, 280182.0, 186211.0, 121175.0, 78030.0, 49481.0, 31531.0, 20051.0, 12467.0, 7966.0, 4983.0, 3329.0, 2165.0, 1281.0, 878.0, 566.0, 349.0, 225.0, 137.0, 88.0, 62.0, 29.0, 30.0, 16.0, 11.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-18.046875, -17.490478515625, -16.93408203125, -16.377685546875, -15.8212890625, -15.264892578125, -14.70849609375, -14.152099609375, -13.595703125, -13.039306640625, -12.48291015625, -11.926513671875, -11.3701171875, -10.813720703125, -10.25732421875, -9.700927734375, -9.14453125, -8.588134765625, -8.03173828125, -7.475341796875, -6.9189453125, -6.362548828125, -5.80615234375, -5.249755859375, -4.693359375, -4.136962890625, -3.58056640625, -3.024169921875, -2.4677734375, -1.911376953125, -1.35498046875, -0.798583984375, -0.2421875, 0.314208984375, 0.87060546875, 1.427001953125, 1.9833984375, 2.539794921875, 3.09619140625, 3.652587890625, 4.208984375, 4.765380859375, 5.32177734375, 5.878173828125, 6.4345703125, 6.990966796875, 7.54736328125, 8.103759765625, 8.66015625, 9.216552734375, 9.77294921875, 10.329345703125, 10.8857421875, 11.442138671875, 11.99853515625, 12.554931640625, 13.111328125, 13.667724609375, 14.22412109375, 14.780517578125, 15.3369140625, 15.893310546875, 16.44970703125, 17.006103515625, 17.5625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 11.0, 5.0, 13.0, 5.0, 18.0, 19.0, 22.0, 33.0, 39.0, 34.0, 55.0, 69.0, 69.0, 110.0, 133.0, 157.0, 158.0, 207.0, 238.0, 240.0, 277.0, 263.0, 258.0, 241.0, 224.0, 222.0, 150.0, 138.0, 114.0, 93.0, 89.0, 86.0, 65.0, 58.0, 40.0, 31.0, 25.0, 17.0, 8.0, 16.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.078125, -8.80615234375, -8.5341796875, -8.26220703125, -7.990234375, -7.71826171875, -7.4462890625, -7.17431640625, -6.90234375, -6.63037109375, -6.3583984375, -6.08642578125, -5.814453125, -5.54248046875, -5.2705078125, -4.99853515625, -4.7265625, -4.45458984375, -4.1826171875, -3.91064453125, -3.638671875, -3.36669921875, -3.0947265625, -2.82275390625, -2.55078125, -2.27880859375, -2.0068359375, -1.73486328125, -1.462890625, -1.19091796875, -0.9189453125, -0.64697265625, -0.375, -0.10302734375, 0.1689453125, 0.44091796875, 0.712890625, 0.98486328125, 1.2568359375, 1.52880859375, 1.80078125, 2.07275390625, 2.3447265625, 2.61669921875, 2.888671875, 3.16064453125, 3.4326171875, 3.70458984375, 3.9765625, 4.24853515625, 4.5205078125, 4.79248046875, 5.064453125, 5.33642578125, 5.6083984375, 5.88037109375, 6.15234375, 6.42431640625, 6.6962890625, 6.96826171875, 7.240234375, 7.51220703125, 7.7841796875, 8.05615234375, 8.328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 10.0, 9.0, 17.0, 10.0, 13.0, 17.0, 24.0, 32.0, 38.0, 36.0, 46.0, 36.0, 50.0, 44.0, 63.0, 46.0, 45.0, 55.0, 54.0, 59.0, 42.0, 26.0, 40.0, 29.0, 35.0, 19.0, 14.0, 16.0, 15.0, 13.0, 7.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.473526000976562, -24.72777557373047, -23.982027053833008, -23.236276626586914, -22.490528106689453, -21.74477767944336, -20.999027252197266, -20.253278732299805, -19.50752830505371, -18.761777877807617, -18.016029357910156, -17.270278930664062, -16.5245304107666, -15.778779983520508, -15.03303050994873, -14.287281036376953, -13.541531562805176, -12.795782089233398, -12.050032615661621, -11.304283142089844, -10.55853271484375, -9.812783241271973, -9.067033767700195, -8.321283340454102, -7.575534343719482, -6.829784870147705, -6.0840349197387695, -5.338285446166992, -4.592535972595215, -3.8467860221862793, -3.101036548614502, -2.3552865982055664, -1.609537124633789, -0.8637874722480774, -0.11803781986236572, 0.6277117729187012, 1.3734614849090576, 2.119211196899414, 2.8649606704711914, 3.610710620880127, 4.356460094451904, 5.102209568023682, 5.847959518432617, 6.5937089920043945, 7.339458465576172, 8.085208892822266, 8.830957412719727, 9.57670783996582, 10.322457313537598, 11.068206787109375, 11.813956260681152, 12.55970573425293, 13.305456161499023, 14.0512056350708, 14.796955108642578, 15.542705535888672, 16.288454055786133, 17.034204483032227, 17.779953002929688, 18.52570343017578, 19.271451950073242, 20.017202377319336, 20.762950897216797, 21.50870132446289, 22.254451751708984]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 7.0, 3.0, 10.0, 4.0, 6.0, 9.0, 8.0, 10.0, 13.0, 20.0, 18.0, 20.0, 28.0, 30.0, 41.0, 25.0, 39.0, 31.0, 37.0, 48.0, 46.0, 34.0, 37.0, 43.0, 35.0, 35.0, 48.0, 20.0, 42.0, 31.0, 29.0, 32.0, 20.0, 21.0, 25.0, 18.0, 19.0, 18.0, 13.0, 5.0, 4.0, 5.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.582006454467773, -20.952877044677734, -20.323745727539062, -19.694616317749023, -19.065486907958984, -18.436357498168945, -17.807228088378906, -17.178096771240234, -16.548967361450195, -15.919837951660156, -15.2907075881958, -14.661577224731445, -14.032447814941406, -13.403318405151367, -12.774188041687012, -12.145057678222656, -11.515928268432617, -10.886798858642578, -10.257668495178223, -9.628538131713867, -8.999408721923828, -8.370279312133789, -7.741148948669434, -7.112019062042236, -6.482889175415039, -5.853759288787842, -5.2246294021606445, -4.595499515533447, -3.96636962890625, -3.3372397422790527, -2.7081098556518555, -2.078979969024658, -1.449850082397461, -0.8207201957702637, -0.1915903091430664, 0.43753957748413086, 1.0666694641113281, 1.6957993507385254, 2.3249292373657227, 2.95405912399292, 3.583189010620117, 4.2123188972473145, 4.841448783874512, 5.470578670501709, 6.099708557128906, 6.7288384437561035, 7.357968330383301, 7.987098217010498, 8.616228103637695, 9.245357513427734, 9.87448787689209, 10.503618240356445, 11.132747650146484, 11.761877059936523, 12.391007423400879, 13.020137786865234, 13.649267196655273, 14.278396606445312, 14.907526969909668, 15.536657333374023, 16.165786743164062, 16.7949161529541, 17.42404556274414, 18.053176879882812, 18.68230628967285]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 11.0, 15.0, 21.0, 37.0, 55.0, 88.0, 157.0, 234.0, 379.0, 650.0, 999.0, 1725.0, 2692.0, 4180.0, 6711.0, 10472.0, 15782.0, 23705.0, 34523.0, 48728.0, 65560.0, 84325.0, 101317.0, 112252.0, 112471.0, 103065.0, 87416.0, 69400.0, 51491.0, 36936.0, 25459.0, 17051.0, 11179.0, 7119.0, 4619.0, 2935.0, 1861.0, 1104.0, 682.0, 405.0, 265.0, 180.0, 131.0, 64.0, 47.0, 25.0, 12.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-13.0546875, -12.6717529296875, -12.288818359375, -11.9058837890625, -11.52294921875, -11.1400146484375, -10.757080078125, -10.3741455078125, -9.9912109375, -9.6082763671875, -9.225341796875, -8.8424072265625, -8.45947265625, -8.0765380859375, -7.693603515625, -7.3106689453125, -6.927734375, -6.5447998046875, -6.161865234375, -5.7789306640625, -5.39599609375, -5.0130615234375, -4.630126953125, -4.2471923828125, -3.8642578125, -3.4813232421875, -3.098388671875, -2.7154541015625, -2.33251953125, -1.9495849609375, -1.566650390625, -1.1837158203125, -0.80078125, -0.4178466796875, -0.034912109375, 0.3480224609375, 0.73095703125, 1.1138916015625, 1.496826171875, 1.8797607421875, 2.2626953125, 2.6456298828125, 3.028564453125, 3.4114990234375, 3.79443359375, 4.1773681640625, 4.560302734375, 4.9432373046875, 5.326171875, 5.7091064453125, 6.092041015625, 6.4749755859375, 6.85791015625, 7.2408447265625, 7.623779296875, 8.0067138671875, 8.3896484375, 8.7725830078125, 9.155517578125, 9.5384521484375, 9.92138671875, 10.3043212890625, 10.687255859375, 11.0701904296875, 11.453125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 5.0, 3.0, 11.0, 10.0, 14.0, 15.0, 11.0, 24.0, 24.0, 35.0, 18.0, 32.0, 37.0, 32.0, 60.0, 41.0, 37.0, 41.0, 41.0, 44.0, 42.0, 41.0, 32.0, 36.0, 38.0, 30.0, 27.0, 27.0, 28.0, 33.0, 27.0, 16.0, 13.0, 17.0, 11.0, 10.0, 7.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.09375, -17.55517578125, -17.0166015625, -16.47802734375, -15.939453125, -15.40087890625, -14.8623046875, -14.32373046875, -13.78515625, -13.24658203125, -12.7080078125, -12.16943359375, -11.630859375, -11.09228515625, -10.5537109375, -10.01513671875, -9.4765625, -8.93798828125, -8.3994140625, -7.86083984375, -7.322265625, -6.78369140625, -6.2451171875, -5.70654296875, -5.16796875, -4.62939453125, -4.0908203125, -3.55224609375, -3.013671875, -2.47509765625, -1.9365234375, -1.39794921875, -0.859375, -0.32080078125, 0.2177734375, 0.75634765625, 1.294921875, 1.83349609375, 2.3720703125, 2.91064453125, 3.44921875, 3.98779296875, 4.5263671875, 5.06494140625, 5.603515625, 6.14208984375, 6.6806640625, 7.21923828125, 7.7578125, 8.29638671875, 8.8349609375, 9.37353515625, 9.912109375, 10.45068359375, 10.9892578125, 11.52783203125, 12.06640625, 12.60498046875, 13.1435546875, 13.68212890625, 14.220703125, 14.75927734375, 15.2978515625, 15.83642578125, 16.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 6.0, 9.0, 17.0, 15.0, 22.0, 41.0, 47.0, 50.0, 81.0, 120.0, 178.0, 205.0, 302.0, 413.0, 627.0, 833.0, 1233.0, 1712.0, 2520.0, 3452.0, 5218.0, 7937.0, 12790.0, 21520.0, 63395.0, 808992.0, 58145.0, 20983.0, 12579.0, 7964.0, 5200.0, 3692.0, 2421.0, 1728.0, 1133.0, 819.0, 619.0, 440.0, 287.0, 211.0, 161.0, 115.0, 81.0, 61.0, 46.0, 37.0, 27.0, 14.0, 17.0, 12.0, 5.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0], "bins": [-36.75, -35.61865234375, -34.4873046875, -33.35595703125, -32.224609375, -31.09326171875, -29.9619140625, -28.83056640625, -27.69921875, -26.56787109375, -25.4365234375, -24.30517578125, -23.173828125, -22.04248046875, -20.9111328125, -19.77978515625, -18.6484375, -17.51708984375, -16.3857421875, -15.25439453125, -14.123046875, -12.99169921875, -11.8603515625, -10.72900390625, -9.59765625, -8.46630859375, -7.3349609375, -6.20361328125, -5.072265625, -3.94091796875, -2.8095703125, -1.67822265625, -0.546875, 0.58447265625, 1.7158203125, 2.84716796875, 3.978515625, 5.10986328125, 6.2412109375, 7.37255859375, 8.50390625, 9.63525390625, 10.7666015625, 11.89794921875, 13.029296875, 14.16064453125, 15.2919921875, 16.42333984375, 17.5546875, 18.68603515625, 19.8173828125, 20.94873046875, 22.080078125, 23.21142578125, 24.3427734375, 25.47412109375, 26.60546875, 27.73681640625, 28.8681640625, 29.99951171875, 31.130859375, 32.26220703125, 33.3935546875, 34.52490234375, 35.65625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 10.0, 7.0, 8.0, 15.0, 17.0, 14.0, 20.0, 30.0, 29.0, 35.0, 37.0, 30.0, 39.0, 48.0, 40.0, 66.0, 42.0, 51.0, 46.0, 36.0, 39.0, 41.0, 30.0, 30.0, 30.0, 39.0, 15.0, 19.0, 13.0, 17.0, 15.0, 16.0, 11.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-26.359375, -25.589599609375, -24.81982421875, -24.050048828125, -23.2802734375, -22.510498046875, -21.74072265625, -20.970947265625, -20.201171875, -19.431396484375, -18.66162109375, -17.891845703125, -17.1220703125, -16.352294921875, -15.58251953125, -14.812744140625, -14.04296875, -13.273193359375, -12.50341796875, -11.733642578125, -10.9638671875, -10.194091796875, -9.42431640625, -8.654541015625, -7.884765625, -7.114990234375, -6.34521484375, -5.575439453125, -4.8056640625, -4.035888671875, -3.26611328125, -2.496337890625, -1.7265625, -0.956787109375, -0.18701171875, 0.582763671875, 1.3525390625, 2.122314453125, 2.89208984375, 3.661865234375, 4.431640625, 5.201416015625, 5.97119140625, 6.740966796875, 7.5107421875, 8.280517578125, 9.05029296875, 9.820068359375, 10.58984375, 11.359619140625, 12.12939453125, 12.899169921875, 13.6689453125, 14.438720703125, 15.20849609375, 15.978271484375, 16.748046875, 17.517822265625, 18.28759765625, 19.057373046875, 19.8271484375, 20.596923828125, 21.36669921875, 22.136474609375, 22.90625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 8.0, 15.0, 13.0, 20.0, 34.0, 51.0, 64.0, 92.0, 129.0, 190.0, 324.0, 454.0, 732.0, 1098.0, 1798.0, 2981.0, 5001.0, 8918.0, 17335.0, 48044.0, 801814.0, 110534.0, 22512.0, 11001.0, 5982.0, 3533.0, 2141.0, 1307.0, 831.0, 540.0, 314.0, 220.0, 140.0, 119.0, 83.0, 37.0, 31.0, 35.0, 15.0, 19.0, 12.0, 10.0, 5.0, 4.0, 7.0, 3.0, 3.0, 4.0], "bins": [-14.96875, -14.560546875, -14.15234375, -13.744140625, -13.3359375, -12.927734375, -12.51953125, -12.111328125, -11.703125, -11.294921875, -10.88671875, -10.478515625, -10.0703125, -9.662109375, -9.25390625, -8.845703125, -8.4375, -8.029296875, -7.62109375, -7.212890625, -6.8046875, -6.396484375, -5.98828125, -5.580078125, -5.171875, -4.763671875, -4.35546875, -3.947265625, -3.5390625, -3.130859375, -2.72265625, -2.314453125, -1.90625, -1.498046875, -1.08984375, -0.681640625, -0.2734375, 0.134765625, 0.54296875, 0.951171875, 1.359375, 1.767578125, 2.17578125, 2.583984375, 2.9921875, 3.400390625, 3.80859375, 4.216796875, 4.625, 5.033203125, 5.44140625, 5.849609375, 6.2578125, 6.666015625, 7.07421875, 7.482421875, 7.890625, 8.298828125, 8.70703125, 9.115234375, 9.5234375, 9.931640625, 10.33984375, 10.748046875, 11.15625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 6.0, 7.0, 21.0, 18.0, 19.0, 28.0, 38.0, 49.0, 58.0, 79.0, 91.0, 126.0, 95.0, 88.0, 63.0, 43.0, 28.0, 30.0, 15.0, 19.0, 17.0, 14.0, 9.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039005279541015625, -0.0037538111209869385, -0.0036070942878723145, -0.0034603774547576904, -0.0033136606216430664, -0.0031669437885284424, -0.0030202269554138184, -0.0028735101222991943, -0.0027267932891845703, -0.0025800764560699463, -0.0024333596229553223, -0.0022866427898406982, -0.0021399259567260742, -0.00199320912361145, -0.0018464922904968262, -0.0016997754573822021, -0.0015530586242675781, -0.001406341791152954, -0.00125962495803833, -0.001112908124923706, -0.000966191291809082, -0.000819474458694458, -0.000672757625579834, -0.00052604079246521, -0.00037932395935058594, -0.00023260712623596191, -8.589029312133789e-05, 6.082653999328613e-05, 0.00020754337310791016, 0.0003542602062225342, 0.0005009770393371582, 0.0006476938724517822, 0.0007944107055664062, 0.0009411275386810303, 0.0010878443717956543, 0.0012345612049102783, 0.0013812780380249023, 0.0015279948711395264, 0.0016747117042541504, 0.0018214285373687744, 0.0019681453704833984, 0.0021148622035980225, 0.0022615790367126465, 0.0024082958698272705, 0.0025550127029418945, 0.0027017295360565186, 0.0028484463691711426, 0.0029951632022857666, 0.0031418800354003906, 0.0032885968685150146, 0.0034353137016296387, 0.0035820305347442627, 0.0037287473678588867, 0.0038754642009735107, 0.004022181034088135, 0.004168897867202759, 0.004315614700317383, 0.004462331533432007, 0.004609048366546631, 0.004755765199661255, 0.004902482032775879, 0.005049198865890503, 0.005195915699005127, 0.005342632532119751, 0.005489349365234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 8.0, 6.0, 22.0, 27.0, 36.0, 49.0, 67.0, 101.0, 126.0, 189.0, 300.0, 416.0, 616.0, 863.0, 1360.0, 2110.0, 3421.0, 5813.0, 10800.0, 21068.0, 42745.0, 89204.0, 181858.0, 274714.0, 205526.0, 104385.0, 49360.0, 23876.0, 12290.0, 6516.0, 3879.0, 2318.0, 1422.0, 873.0, 640.0, 477.0, 311.0, 239.0, 170.0, 101.0, 82.0, 53.0, 36.0, 30.0, 18.0, 12.0, 5.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.8203125, -3.70989990234375, -3.5994873046875, -3.48907470703125, -3.378662109375, -3.26824951171875, -3.1578369140625, -3.04742431640625, -2.93701171875, -2.82659912109375, -2.7161865234375, -2.60577392578125, -2.495361328125, -2.38494873046875, -2.2745361328125, -2.16412353515625, -2.0537109375, -1.94329833984375, -1.8328857421875, -1.72247314453125, -1.612060546875, -1.50164794921875, -1.3912353515625, -1.28082275390625, -1.17041015625, -1.05999755859375, -0.9495849609375, -0.83917236328125, -0.728759765625, -0.61834716796875, -0.5079345703125, -0.39752197265625, -0.287109375, -0.17669677734375, -0.0662841796875, 0.04412841796875, 0.154541015625, 0.26495361328125, 0.3753662109375, 0.48577880859375, 0.59619140625, 0.70660400390625, 0.8170166015625, 0.92742919921875, 1.037841796875, 1.14825439453125, 1.2586669921875, 1.36907958984375, 1.4794921875, 1.58990478515625, 1.7003173828125, 1.81072998046875, 1.921142578125, 2.03155517578125, 2.1419677734375, 2.25238037109375, 2.36279296875, 2.47320556640625, 2.5836181640625, 2.69403076171875, 2.804443359375, 2.91485595703125, 3.0252685546875, 3.13568115234375, 3.24609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 6.0, 12.0, 8.0, 13.0, 17.0, 25.0, 27.0, 27.0, 45.0, 50.0, 59.0, 61.0, 72.0, 79.0, 69.0, 72.0, 73.0, 55.0, 46.0, 36.0, 23.0, 20.0, 22.0, 8.0, 10.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.079315185546875, -1.04534912109375, -1.011383056640625, -0.9774169921875, -0.943450927734375, -0.90948486328125, -0.875518798828125, -0.841552734375, -0.807586669921875, -0.77362060546875, -0.739654541015625, -0.7056884765625, -0.671722412109375, -0.63775634765625, -0.603790283203125, -0.56982421875, -0.535858154296875, -0.50189208984375, -0.467926025390625, -0.4339599609375, -0.399993896484375, -0.36602783203125, -0.332061767578125, -0.298095703125, -0.264129638671875, -0.23016357421875, -0.196197509765625, -0.1622314453125, -0.128265380859375, -0.09429931640625, -0.060333251953125, -0.0263671875, 0.007598876953125, 0.04156494140625, 0.075531005859375, 0.1094970703125, 0.143463134765625, 0.17742919921875, 0.211395263671875, 0.245361328125, 0.279327392578125, 0.31329345703125, 0.347259521484375, 0.3812255859375, 0.415191650390625, 0.44915771484375, 0.483123779296875, 0.51708984375, 0.551055908203125, 0.58502197265625, 0.618988037109375, 0.6529541015625, 0.686920166015625, 0.72088623046875, 0.754852294921875, 0.788818359375, 0.822784423828125, 0.85675048828125, 0.890716552734375, 0.9246826171875, 0.958648681640625, 0.99261474609375, 1.026580810546875, 1.060546875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 2.0, 5.0, 6.0, 16.0, 9.0, 16.0, 19.0, 29.0, 24.0, 32.0, 33.0, 39.0, 32.0, 52.0, 51.0, 50.0, 41.0, 45.0, 55.0, 54.0, 46.0, 48.0, 33.0, 43.0, 33.0, 12.0, 21.0, 31.0, 19.0, 17.0, 19.0, 16.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.877809524536133, -16.325790405273438, -15.773771286010742, -15.221752166748047, -14.669733047485352, -14.117713928222656, -13.565695762634277, -13.013676643371582, -12.461657524108887, -11.909638404846191, -11.357619285583496, -10.8056001663208, -10.253582000732422, -9.701562881469727, -9.149543762207031, -8.597524642944336, -8.04550552368164, -7.493486404418945, -6.94146728515625, -6.389448642730713, -5.837429523468018, -5.285410404205322, -4.733391761779785, -4.18137264251709, -3.6293535232543945, -3.077334403991699, -2.525315523147583, -1.9732965230941772, -1.4212775230407715, -0.8692584037780762, -0.31723952293395996, 0.23477935791015625, 0.7867965698242188, 1.3388155698776245, 1.8908345699310303, 2.4428534507751465, 2.994872570037842, 3.546891689300537, 4.098910331726074, 4.6509294509887695, 5.202948570251465, 5.75496768951416, 6.3069868087768555, 6.859005451202393, 7.411024570465088, 7.963043689727783, 8.51506233215332, 9.067081451416016, 9.619100570678711, 10.171119689941406, 10.723138809204102, 11.275157928466797, 11.827177047729492, 12.379196166992188, 12.931214332580566, 13.483233451843262, 14.035252571105957, 14.587271690368652, 15.139290809631348, 15.691309928894043, 16.243328094482422, 16.795347213745117, 17.347366333007812, 17.899385452270508, 18.451404571533203]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 5.0, 7.0, 12.0, 12.0, 10.0, 22.0, 11.0, 30.0, 24.0, 34.0, 34.0, 34.0, 28.0, 32.0, 49.0, 43.0, 37.0, 39.0, 38.0, 42.0, 33.0, 31.0, 41.0, 42.0, 26.0, 32.0, 26.0, 32.0, 25.0, 26.0, 21.0, 22.0, 17.0, 17.0, 15.0, 3.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.759028434753418, -15.257232666015625, -14.755436897277832, -14.253641128540039, -13.751845359802246, -13.250049591064453, -12.748252868652344, -12.246458053588867, -11.744661331176758, -11.242865562438965, -10.741069793701172, -10.239274024963379, -9.737478256225586, -9.235682487487793, -8.73388671875, -8.23208999633789, -7.730295181274414, -7.228499412536621, -6.726703643798828, -6.224907875061035, -5.723112106323242, -5.221316337585449, -4.719520092010498, -4.217724323272705, -3.715928554534912, -3.214132785797119, -2.712337017059326, -2.210541009902954, -1.7087452411651611, -1.2069494724273682, -0.7051534652709961, -0.20335769653320312, 0.29843711853027344, 0.8002329468727112, 1.302028775215149, 1.8038246631622314, 2.3056204319000244, 2.8074162006378174, 3.3092122077941895, 3.8110079765319824, 4.312803745269775, 4.814599514007568, 5.316395282745361, 5.8181915283203125, 6.3199872970581055, 6.821783065795898, 7.323578834533691, 7.825374603271484, 8.327170372009277, 8.82896614074707, 9.330761909484863, 9.832557678222656, 10.33435344696045, 10.836149215698242, 11.337945938110352, 11.839740753173828, 12.341537475585938, 12.84333324432373, 13.345129013061523, 13.846924781799316, 14.34872055053711, 14.850516319274902, 15.352312088012695, 15.854108810424805, 16.35590362548828]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 17.0, 27.0, 26.0, 42.0, 59.0, 86.0, 119.0, 146.0, 223.0, 364.0, 520.0, 770.0, 1149.0, 1731.0, 2532.0, 3850.0, 5555.0, 8478.0, 12935.0, 19579.0, 29929.0, 44356.0, 64463.0, 89643.0, 114716.0, 131570.0, 129702.0, 111891.0, 86845.0, 61476.0, 42058.0, 28344.0, 18646.0, 12229.0, 8184.0, 5334.0, 3569.0, 2355.0, 1603.0, 1098.0, 743.0, 516.0, 315.0, 229.0, 145.0, 113.0, 74.0, 53.0, 45.0, 32.0, 21.0, 15.0, 11.0, 7.0, 4.0, 2.0, 4.0, 3.0], "bins": [-13.7890625, -13.3572998046875, -12.925537109375, -12.4937744140625, -12.06201171875, -11.6302490234375, -11.198486328125, -10.7667236328125, -10.3349609375, -9.9031982421875, -9.471435546875, -9.0396728515625, -8.60791015625, -8.1761474609375, -7.744384765625, -7.3126220703125, -6.880859375, -6.4490966796875, -6.017333984375, -5.5855712890625, -5.15380859375, -4.7220458984375, -4.290283203125, -3.8585205078125, -3.4267578125, -2.9949951171875, -2.563232421875, -2.1314697265625, -1.69970703125, -1.2679443359375, -0.836181640625, -0.4044189453125, 0.02734375, 0.4591064453125, 0.890869140625, 1.3226318359375, 1.75439453125, 2.1861572265625, 2.617919921875, 3.0496826171875, 3.4814453125, 3.9132080078125, 4.344970703125, 4.7767333984375, 5.20849609375, 5.6402587890625, 6.072021484375, 6.5037841796875, 6.935546875, 7.3673095703125, 7.799072265625, 8.2308349609375, 8.66259765625, 9.0943603515625, 9.526123046875, 9.9578857421875, 10.3896484375, 10.8214111328125, 11.253173828125, 11.6849365234375, 12.11669921875, 12.5484619140625, 12.980224609375, 13.4119873046875, 13.84375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 4.0, 2.0, 6.0, 11.0, 9.0, 8.0, 15.0, 14.0, 28.0, 19.0, 20.0, 28.0, 27.0, 31.0, 40.0, 32.0, 36.0, 45.0, 41.0, 34.0, 38.0, 31.0, 44.0, 30.0, 36.0, 30.0, 35.0, 23.0, 24.0, 26.0, 41.0, 28.0, 25.0, 19.0, 22.0, 21.0, 6.0, 11.0, 14.0, 7.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.203125, -12.791259765625, -12.37939453125, -11.967529296875, -11.5556640625, -11.143798828125, -10.73193359375, -10.320068359375, -9.908203125, -9.496337890625, -9.08447265625, -8.672607421875, -8.2607421875, -7.848876953125, -7.43701171875, -7.025146484375, -6.61328125, -6.201416015625, -5.78955078125, -5.377685546875, -4.9658203125, -4.553955078125, -4.14208984375, -3.730224609375, -3.318359375, -2.906494140625, -2.49462890625, -2.082763671875, -1.6708984375, -1.259033203125, -0.84716796875, -0.435302734375, -0.0234375, 0.388427734375, 0.80029296875, 1.212158203125, 1.6240234375, 2.035888671875, 2.44775390625, 2.859619140625, 3.271484375, 3.683349609375, 4.09521484375, 4.507080078125, 4.9189453125, 5.330810546875, 5.74267578125, 6.154541015625, 6.56640625, 6.978271484375, 7.39013671875, 7.802001953125, 8.2138671875, 8.625732421875, 9.03759765625, 9.449462890625, 9.861328125, 10.273193359375, 10.68505859375, 11.096923828125, 11.5087890625, 11.920654296875, 12.33251953125, 12.744384765625, 13.15625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 14.0, 24.0, 34.0, 60.0, 65.0, 118.0, 151.0, 235.0, 353.0, 520.0, 880.0, 1317.0, 1979.0, 2983.0, 4770.0, 7389.0, 11925.0, 19533.0, 30922.0, 48142.0, 74336.0, 105223.0, 134385.0, 147656.0, 135934.0, 108035.0, 75723.0, 49742.0, 32398.0, 19807.0, 12305.0, 7850.0, 4939.0, 3029.0, 2016.0, 1275.0, 824.0, 559.0, 380.0, 234.0, 138.0, 98.0, 73.0, 56.0, 45.0, 32.0, 17.0, 8.0, 7.0, 1.0, 7.0, 3.0, 0.0, 1.0], "bins": [-15.8046875, -15.3333740234375, -14.862060546875, -14.3907470703125, -13.91943359375, -13.4481201171875, -12.976806640625, -12.5054931640625, -12.0341796875, -11.5628662109375, -11.091552734375, -10.6202392578125, -10.14892578125, -9.6776123046875, -9.206298828125, -8.7349853515625, -8.263671875, -7.7923583984375, -7.321044921875, -6.8497314453125, -6.37841796875, -5.9071044921875, -5.435791015625, -4.9644775390625, -4.4931640625, -4.0218505859375, -3.550537109375, -3.0792236328125, -2.60791015625, -2.1365966796875, -1.665283203125, -1.1939697265625, -0.72265625, -0.2513427734375, 0.219970703125, 0.6912841796875, 1.16259765625, 1.6339111328125, 2.105224609375, 2.5765380859375, 3.0478515625, 3.5191650390625, 3.990478515625, 4.4617919921875, 4.93310546875, 5.4044189453125, 5.875732421875, 6.3470458984375, 6.818359375, 7.2896728515625, 7.760986328125, 8.2322998046875, 8.70361328125, 9.1749267578125, 9.646240234375, 10.1175537109375, 10.5888671875, 11.0601806640625, 11.531494140625, 12.0028076171875, 12.47412109375, 12.9454345703125, 13.416748046875, 13.8880615234375, 14.359375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 15.0, 18.0, 16.0, 27.0, 28.0, 42.0, 32.0, 37.0, 37.0, 43.0, 33.0, 43.0, 35.0, 31.0, 40.0, 42.0, 45.0, 27.0, 44.0, 27.0, 44.0, 30.0, 27.0, 27.0, 14.0, 20.0, 12.0, 18.0, 12.0, 6.0, 11.0, 7.0, 11.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.59539794921875, -7.3275146484375, -7.05963134765625, -6.791748046875, -6.52386474609375, -6.2559814453125, -5.98809814453125, -5.72021484375, -5.45233154296875, -5.1844482421875, -4.91656494140625, -4.648681640625, -4.38079833984375, -4.1129150390625, -3.84503173828125, -3.5771484375, -3.30926513671875, -3.0413818359375, -2.77349853515625, -2.505615234375, -2.23773193359375, -1.9698486328125, -1.70196533203125, -1.43408203125, -1.16619873046875, -0.8983154296875, -0.63043212890625, -0.362548828125, -0.09466552734375, 0.1732177734375, 0.44110107421875, 0.708984375, 0.97686767578125, 1.2447509765625, 1.51263427734375, 1.780517578125, 2.04840087890625, 2.3162841796875, 2.58416748046875, 2.85205078125, 3.11993408203125, 3.3878173828125, 3.65570068359375, 3.923583984375, 4.19146728515625, 4.4593505859375, 4.72723388671875, 4.9951171875, 5.26300048828125, 5.5308837890625, 5.79876708984375, 6.066650390625, 6.33453369140625, 6.6024169921875, 6.87030029296875, 7.13818359375, 7.40606689453125, 7.6739501953125, 7.94183349609375, 8.209716796875, 8.47760009765625, 8.7454833984375, 9.01336669921875, 9.28125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 9.0, 4.0, 18.0, 24.0, 42.0, 60.0, 83.0, 111.0, 160.0, 233.0, 370.0, 561.0, 812.0, 1238.0, 1915.0, 3074.0, 4732.0, 7811.0, 12400.0, 20174.0, 33030.0, 53879.0, 84073.0, 124766.0, 158954.0, 163212.0, 131269.0, 91133.0, 58864.0, 36226.0, 22419.0, 13711.0, 8408.0, 5330.0, 3386.0, 2091.0, 1362.0, 826.0, 592.0, 394.0, 259.0, 184.0, 110.0, 83.0, 54.0, 39.0, 25.0, 19.0, 5.0, 6.0, 11.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.953125, -7.705322265625, -7.45751953125, -7.209716796875, -6.9619140625, -6.714111328125, -6.46630859375, -6.218505859375, -5.970703125, -5.722900390625, -5.47509765625, -5.227294921875, -4.9794921875, -4.731689453125, -4.48388671875, -4.236083984375, -3.98828125, -3.740478515625, -3.49267578125, -3.244873046875, -2.9970703125, -2.749267578125, -2.50146484375, -2.253662109375, -2.005859375, -1.758056640625, -1.51025390625, -1.262451171875, -1.0146484375, -0.766845703125, -0.51904296875, -0.271240234375, -0.0234375, 0.224365234375, 0.47216796875, 0.719970703125, 0.9677734375, 1.215576171875, 1.46337890625, 1.711181640625, 1.958984375, 2.206787109375, 2.45458984375, 2.702392578125, 2.9501953125, 3.197998046875, 3.44580078125, 3.693603515625, 3.94140625, 4.189208984375, 4.43701171875, 4.684814453125, 4.9326171875, 5.180419921875, 5.42822265625, 5.676025390625, 5.923828125, 6.171630859375, 6.41943359375, 6.667236328125, 6.9150390625, 7.162841796875, 7.41064453125, 7.658447265625, 7.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 9.0, 10.0, 14.0, 20.0, 29.0, 39.0, 55.0, 74.0, 94.0, 98.0, 101.0, 108.0, 103.0, 58.0, 51.0, 36.0, 27.0, 23.0, 17.0, 10.0, 6.0, 6.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00140380859375, -0.0013559907674789429, -0.0013081729412078857, -0.0012603551149368286, -0.0012125372886657715, -0.0011647194623947144, -0.0011169016361236572, -0.0010690838098526, -0.001021265983581543, -0.0009734481573104858, -0.0009256303310394287, -0.0008778125047683716, -0.0008299946784973145, -0.0007821768522262573, -0.0007343590259552002, -0.0006865411996841431, -0.0006387233734130859, -0.0005909055471420288, -0.0005430877208709717, -0.0004952698945999146, -0.0004474520683288574, -0.0003996342420578003, -0.00035181641578674316, -0.00030399858951568604, -0.0002561807632446289, -0.00020836293697357178, -0.00016054511070251465, -0.00011272728443145752, -6.490945816040039e-05, -1.7091631889343262e-05, 3.072619438171387e-05, 7.8544020652771e-05, 0.00012636184692382812, 0.00017417967319488525, 0.00022199749946594238, 0.0002698153257369995, 0.00031763315200805664, 0.00036545097827911377, 0.0004132688045501709, 0.00046108663082122803, 0.0005089044570922852, 0.0005567222833633423, 0.0006045401096343994, 0.0006523579359054565, 0.0007001757621765137, 0.0007479935884475708, 0.0007958114147186279, 0.0008436292409896851, 0.0008914470672607422, 0.0009392648935317993, 0.0009870827198028564, 0.0010349005460739136, 0.0010827183723449707, 0.0011305361986160278, 0.001178354024887085, 0.001226171851158142, 0.0012739896774291992, 0.0013218075037002563, 0.0013696253299713135, 0.0014174431562423706, 0.0014652609825134277, 0.0015130788087844849, 0.001560896635055542, 0.0016087144613265991, 0.0016565322875976562]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 11.0, 17.0, 36.0, 32.0, 69.0, 86.0, 153.0, 210.0, 297.0, 442.0, 694.0, 1053.0, 1673.0, 2687.0, 4275.0, 6731.0, 10606.0, 17240.0, 27443.0, 44538.0, 68329.0, 101748.0, 137975.0, 156612.0, 144188.0, 111441.0, 76816.0, 49277.0, 31262.0, 19679.0, 12131.0, 7588.0, 4834.0, 2981.0, 1903.0, 1170.0, 776.0, 525.0, 339.0, 214.0, 155.0, 127.0, 64.0, 45.0, 28.0, 17.0, 10.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.0234375, -7.791748046875, -7.56005859375, -7.328369140625, -7.0966796875, -6.864990234375, -6.63330078125, -6.401611328125, -6.169921875, -5.938232421875, -5.70654296875, -5.474853515625, -5.2431640625, -5.011474609375, -4.77978515625, -4.548095703125, -4.31640625, -4.084716796875, -3.85302734375, -3.621337890625, -3.3896484375, -3.157958984375, -2.92626953125, -2.694580078125, -2.462890625, -2.231201171875, -1.99951171875, -1.767822265625, -1.5361328125, -1.304443359375, -1.07275390625, -0.841064453125, -0.609375, -0.377685546875, -0.14599609375, 0.085693359375, 0.3173828125, 0.549072265625, 0.78076171875, 1.012451171875, 1.244140625, 1.475830078125, 1.70751953125, 1.939208984375, 2.1708984375, 2.402587890625, 2.63427734375, 2.865966796875, 3.09765625, 3.329345703125, 3.56103515625, 3.792724609375, 4.0244140625, 4.256103515625, 4.48779296875, 4.719482421875, 4.951171875, 5.182861328125, 5.41455078125, 5.646240234375, 5.8779296875, 6.109619140625, 6.34130859375, 6.572998046875, 6.8046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 14.0, 13.0, 20.0, 19.0, 32.0, 42.0, 40.0, 48.0, 60.0, 61.0, 54.0, 64.0, 58.0, 61.0, 48.0, 53.0, 50.0, 33.0, 39.0, 26.0, 28.0, 21.0, 17.0, 13.0, 20.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1484375, -3.058135986328125, -2.96783447265625, -2.877532958984375, -2.7872314453125, -2.696929931640625, -2.60662841796875, -2.516326904296875, -2.426025390625, -2.335723876953125, -2.24542236328125, -2.155120849609375, -2.0648193359375, -1.974517822265625, -1.88421630859375, -1.793914794921875, -1.70361328125, -1.613311767578125, -1.52301025390625, -1.432708740234375, -1.3424072265625, -1.252105712890625, -1.16180419921875, -1.071502685546875, -0.981201171875, -0.890899658203125, -0.80059814453125, -0.710296630859375, -0.6199951171875, -0.529693603515625, -0.43939208984375, -0.349090576171875, -0.2587890625, -0.168487548828125, -0.07818603515625, 0.012115478515625, 0.1024169921875, 0.192718505859375, 0.28302001953125, 0.373321533203125, 0.463623046875, 0.553924560546875, 0.64422607421875, 0.734527587890625, 0.8248291015625, 0.915130615234375, 1.00543212890625, 1.095733642578125, 1.18603515625, 1.276336669921875, 1.36663818359375, 1.456939697265625, 1.5472412109375, 1.637542724609375, 1.72784423828125, 1.818145751953125, 1.908447265625, 1.998748779296875, 2.08905029296875, 2.179351806640625, 2.2696533203125, 2.359954833984375, 2.45025634765625, 2.540557861328125, 2.630859375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 8.0, 16.0, 7.0, 19.0, 24.0, 26.0, 27.0, 36.0, 36.0, 29.0, 47.0, 46.0, 42.0, 51.0, 49.0, 47.0, 49.0, 45.0, 50.0, 39.0, 41.0, 44.0, 21.0, 22.0, 33.0, 24.0, 18.0, 18.0, 8.0, 12.0, 7.0, 14.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.070353507995605, -12.58980941772461, -12.10926628112793, -11.62872314453125, -11.148179054260254, -10.667634963989258, -10.187091827392578, -9.706548690795898, -9.226004600524902, -8.745460510253906, -8.264917373657227, -7.784373760223389, -7.303830146789551, -6.823286533355713, -6.342742919921875, -5.862199306488037, -5.381655693054199, -4.901112079620361, -4.420568466186523, -3.9400248527526855, -3.4594812393188477, -2.9789376258850098, -2.498394012451172, -2.017850399017334, -1.537306785583496, -1.0567631721496582, -0.5762195587158203, -0.09567594528198242, 0.38486766815185547, 0.8654112815856934, 1.3459548950195312, 1.8264985084533691, 2.3070430755615234, 2.7875866889953613, 3.268130302429199, 3.748673915863037, 4.229217529296875, 4.709761142730713, 5.190304756164551, 5.670848369598389, 6.151391983032227, 6.6319355964660645, 7.112479209899902, 7.59302282333374, 8.073566436767578, 8.554109573364258, 9.034653663635254, 9.51519775390625, 9.99574089050293, 10.47628402709961, 10.956828117370605, 11.437372207641602, 11.917915344238281, 12.398458480834961, 12.879002571105957, 13.359546661376953, 13.840089797973633, 14.320632934570312, 14.801177024841309, 15.281721115112305, 15.762264251708984, 16.242807388305664, 16.723350524902344, 17.203895568847656, 17.684438705444336]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 3.0, 8.0, 10.0, 7.0, 11.0, 15.0, 12.0, 14.0, 15.0, 24.0, 20.0, 23.0, 30.0, 34.0, 37.0, 33.0, 38.0, 41.0, 30.0, 46.0, 42.0, 35.0, 36.0, 39.0, 35.0, 41.0, 22.0, 38.0, 25.0, 33.0, 25.0, 30.0, 21.0, 20.0, 13.0, 15.0, 17.0, 9.0, 4.0, 13.0, 4.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.401455879211426, -12.971198081970215, -12.54094123840332, -12.11068344116211, -11.680426597595215, -11.250168800354004, -10.81991195678711, -10.389654159545898, -9.959396362304688, -9.529138565063477, -9.098881721496582, -8.668623924255371, -8.238367080688477, -7.808109283447266, -7.377851963043213, -6.94759464263916, -6.517337799072266, -6.087080478668213, -5.65682315826416, -5.226565361022949, -4.796308517456055, -4.366050720214844, -3.935793399810791, -3.5055360794067383, -3.0752787590026855, -2.645021438598633, -2.21476411819458, -1.7845065593719482, -1.3542492389678955, -0.9239919185638428, -0.49373435974121094, -0.0634770393371582, 0.3667793273925781, 0.7970367074012756, 1.2272940874099731, 1.6575515270233154, 2.087808847427368, 2.518066167831421, 2.9483237266540527, 3.3785810470581055, 3.808838367462158, 4.239095687866211, 4.669353008270264, 5.099610328674316, 5.529868125915527, 5.960124969482422, 6.390382766723633, 6.8206400871276855, 7.250897407531738, 7.681154727935791, 8.111412048339844, 8.541669845581055, 8.97192668914795, 9.40218448638916, 9.832441329956055, 10.262699127197266, 10.692956924438477, 11.123214721679688, 11.553471565246582, 11.983729362487793, 12.413986206054688, 12.844244003295898, 13.27450180053711, 13.704758644104004, 14.135015487670898]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 12.0, 30.0, 21.0, 36.0, 69.0, 87.0, 151.0, 228.0, 365.0, 568.0, 823.0, 1370.0, 2249.0, 3897.0, 6593.0, 11070.0, 19241.0, 33479.0, 58808.0, 106326.0, 195172.0, 353077.0, 578851.0, 763508.0, 754805.0, 555891.0, 332187.0, 182270.0, 99563.0, 55394.0, 31746.0, 18627.0, 10909.0, 6605.0, 3929.0, 2335.0, 1459.0, 903.0, 542.0, 378.0, 239.0, 142.0, 103.0, 69.0, 45.0, 34.0, 24.0, 15.0, 12.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.3515625, -10.0059814453125, -9.660400390625, -9.3148193359375, -8.96923828125, -8.6236572265625, -8.278076171875, -7.9324951171875, -7.5869140625, -7.2413330078125, -6.895751953125, -6.5501708984375, -6.20458984375, -5.8590087890625, -5.513427734375, -5.1678466796875, -4.822265625, -4.4766845703125, -4.131103515625, -3.7855224609375, -3.43994140625, -3.0943603515625, -2.748779296875, -2.4031982421875, -2.0576171875, -1.7120361328125, -1.366455078125, -1.0208740234375, -0.67529296875, -0.3297119140625, 0.015869140625, 0.3614501953125, 0.70703125, 1.0526123046875, 1.398193359375, 1.7437744140625, 2.08935546875, 2.4349365234375, 2.780517578125, 3.1260986328125, 3.4716796875, 3.8172607421875, 4.162841796875, 4.5084228515625, 4.85400390625, 5.1995849609375, 5.545166015625, 5.8907470703125, 6.236328125, 6.5819091796875, 6.927490234375, 7.2730712890625, 7.61865234375, 7.9642333984375, 8.309814453125, 8.6553955078125, 9.0009765625, 9.3465576171875, 9.692138671875, 10.0377197265625, 10.38330078125, 10.7288818359375, 11.074462890625, 11.4200439453125, 11.765625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 14.0, 14.0, 9.0, 9.0, 24.0, 18.0, 26.0, 16.0, 16.0, 29.0, 29.0, 29.0, 25.0, 29.0, 33.0, 49.0, 35.0, 43.0, 37.0, 36.0, 36.0, 26.0, 31.0, 36.0, 31.0, 25.0, 33.0, 24.0, 31.0, 19.0, 18.0, 28.0, 24.0, 11.0, 16.0, 14.0, 9.0, 7.0, 10.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-9.484375, -9.186279296875, -8.88818359375, -8.590087890625, -8.2919921875, -7.993896484375, -7.69580078125, -7.397705078125, -7.099609375, -6.801513671875, -6.50341796875, -6.205322265625, -5.9072265625, -5.609130859375, -5.31103515625, -5.012939453125, -4.71484375, -4.416748046875, -4.11865234375, -3.820556640625, -3.5224609375, -3.224365234375, -2.92626953125, -2.628173828125, -2.330078125, -2.031982421875, -1.73388671875, -1.435791015625, -1.1376953125, -0.839599609375, -0.54150390625, -0.243408203125, 0.0546875, 0.352783203125, 0.65087890625, 0.948974609375, 1.2470703125, 1.545166015625, 1.84326171875, 2.141357421875, 2.439453125, 2.737548828125, 3.03564453125, 3.333740234375, 3.6318359375, 3.929931640625, 4.22802734375, 4.526123046875, 4.82421875, 5.122314453125, 5.42041015625, 5.718505859375, 6.0166015625, 6.314697265625, 6.61279296875, 6.910888671875, 7.208984375, 7.507080078125, 7.80517578125, 8.103271484375, 8.4013671875, 8.699462890625, 8.99755859375, 9.295654296875, 9.59375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 15.0, 25.0, 42.0, 72.0, 95.0, 156.0, 228.0, 366.0, 586.0, 988.0, 1595.0, 2553.0, 3923.0, 6484.0, 10316.0, 17017.0, 27505.0, 45216.0, 72991.0, 117722.0, 187316.0, 290765.0, 427893.0, 573515.0, 640538.0, 568463.0, 422230.0, 287066.0, 184353.0, 115971.0, 72278.0, 44714.0, 27241.0, 16885.0, 10286.0, 6394.0, 3946.0, 2416.0, 1538.0, 941.0, 623.0, 360.0, 231.0, 159.0, 96.0, 54.0, 42.0, 23.0, 20.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0], "bins": [-10.8359375, -10.5123291015625, -10.188720703125, -9.8651123046875, -9.54150390625, -9.2178955078125, -8.894287109375, -8.5706787109375, -8.2470703125, -7.9234619140625, -7.599853515625, -7.2762451171875, -6.95263671875, -6.6290283203125, -6.305419921875, -5.9818115234375, -5.658203125, -5.3345947265625, -5.010986328125, -4.6873779296875, -4.36376953125, -4.0401611328125, -3.716552734375, -3.3929443359375, -3.0693359375, -2.7457275390625, -2.422119140625, -2.0985107421875, -1.77490234375, -1.4512939453125, -1.127685546875, -0.8040771484375, -0.48046875, -0.1568603515625, 0.166748046875, 0.4903564453125, 0.81396484375, 1.1375732421875, 1.461181640625, 1.7847900390625, 2.1083984375, 2.4320068359375, 2.755615234375, 3.0792236328125, 3.40283203125, 3.7264404296875, 4.050048828125, 4.3736572265625, 4.697265625, 5.0208740234375, 5.344482421875, 5.6680908203125, 5.99169921875, 6.3153076171875, 6.638916015625, 6.9625244140625, 7.2861328125, 7.6097412109375, 7.933349609375, 8.2569580078125, 8.58056640625, 8.9041748046875, 9.227783203125, 9.5513916015625, 9.875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 12.0, 18.0, 17.0, 25.0, 44.0, 43.0, 65.0, 71.0, 95.0, 98.0, 123.0, 135.0, 165.0, 193.0, 227.0, 223.0, 244.0, 265.0, 262.0, 257.0, 221.0, 221.0, 197.0, 150.0, 149.0, 109.0, 96.0, 88.0, 44.0, 46.0, 39.0, 23.0, 25.0, 21.0, 15.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-5.76953125, -5.6160888671875, -5.462646484375, -5.3092041015625, -5.15576171875, -5.0023193359375, -4.848876953125, -4.6954345703125, -4.5419921875, -4.3885498046875, -4.235107421875, -4.0816650390625, -3.92822265625, -3.7747802734375, -3.621337890625, -3.4678955078125, -3.314453125, -3.1610107421875, -3.007568359375, -2.8541259765625, -2.70068359375, -2.5472412109375, -2.393798828125, -2.2403564453125, -2.0869140625, -1.9334716796875, -1.780029296875, -1.6265869140625, -1.47314453125, -1.3197021484375, -1.166259765625, -1.0128173828125, -0.859375, -0.7059326171875, -0.552490234375, -0.3990478515625, -0.24560546875, -0.0921630859375, 0.061279296875, 0.2147216796875, 0.3681640625, 0.5216064453125, 0.675048828125, 0.8284912109375, 0.98193359375, 1.1353759765625, 1.288818359375, 1.4422607421875, 1.595703125, 1.7491455078125, 1.902587890625, 2.0560302734375, 2.20947265625, 2.3629150390625, 2.516357421875, 2.6697998046875, 2.8232421875, 2.9766845703125, 3.130126953125, 3.2835693359375, 3.43701171875, 3.5904541015625, 3.743896484375, 3.8973388671875, 4.05078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 4.0, 4.0, 8.0, 14.0, 17.0, 19.0, 25.0, 34.0, 41.0, 41.0, 45.0, 37.0, 48.0, 57.0, 57.0, 66.0, 46.0, 55.0, 53.0, 52.0, 52.0, 40.0, 32.0, 22.0, 22.0, 15.0, 14.0, 11.0, 8.0, 9.0, 14.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.228116989135742, -13.775860786437988, -13.323604583740234, -12.871347427368164, -12.41909122467041, -11.966835021972656, -11.514578819274902, -11.062322616577148, -10.610065460205078, -10.157809257507324, -9.70555305480957, -9.2532958984375, -8.801039695739746, -8.348783493041992, -7.896527290344238, -7.444271087646484, -6.9920148849487305, -6.539758682250977, -6.0875020027160645, -5.6352458000183105, -5.182989120483398, -4.7307329177856445, -4.278476715087891, -3.8262202739715576, -3.3739638328552246, -2.9217073917388916, -2.4694509506225586, -2.0171947479248047, -1.5649383068084717, -1.1126818656921387, -0.6604256629943848, -0.20816922187805176, 0.24408817291259766, 0.6963445544242859, 1.1486009359359741, 1.6008572578430176, 2.0531136989593506, 2.5053701400756836, 2.9576263427734375, 3.4098827838897705, 3.8621392250061035, 4.314395427703857, 4.7666521072387695, 5.218908309936523, 5.671164512634277, 6.1234211921691895, 6.575677394866943, 7.0279340744018555, 7.480190277099609, 7.932446479797363, 8.384702682495117, 8.836959838867188, 9.289216041564941, 9.741472244262695, 10.19372844696045, 10.645984649658203, 11.098241806030273, 11.550498008728027, 12.002754211425781, 12.455011367797852, 12.907267570495605, 13.35952377319336, 13.811779975891113, 14.264036178588867, 14.716292381286621]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 5.0, 13.0, 11.0, 12.0, 10.0, 14.0, 16.0, 22.0, 19.0, 20.0, 27.0, 26.0, 24.0, 33.0, 52.0, 40.0, 35.0, 41.0, 30.0, 44.0, 35.0, 41.0, 35.0, 40.0, 34.0, 30.0, 38.0, 28.0, 27.0, 28.0, 19.0, 21.0, 19.0, 18.0, 22.0, 13.0, 11.0, 10.0, 4.0, 4.0, 7.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.525537490844727, -10.185063362121582, -9.844590187072754, -9.50411605834961, -9.163642883300781, -8.823168754577637, -8.482694625854492, -8.142221450805664, -7.801747798919678, -7.461274147033691, -7.120800495147705, -6.780326843261719, -6.439852714538574, -6.099379539489746, -5.758905410766602, -5.418431758880615, -5.077958106994629, -4.737484455108643, -4.397010803222656, -4.056536674499512, -3.7160632610321045, -3.375589609146118, -3.0351157188415527, -2.6946420669555664, -2.35416841506958, -2.0136947631835938, -1.6732209920883179, -1.332747220993042, -0.9922735691070557, -0.6517999172210693, -0.3113260269165039, 0.029147624969482422, 0.36962223052978516, 0.7100959420204163, 1.0505696535110474, 1.3910434246063232, 1.7315170764923096, 2.071990728378296, 2.4124646186828613, 2.7529382705688477, 3.093411922454834, 3.4338855743408203, 3.7743592262268066, 4.114832878112793, 4.4553070068359375, 4.795780181884766, 5.13625431060791, 5.4767279624938965, 5.817201614379883, 6.157675266265869, 6.4981489181518555, 6.838623046875, 7.179096221923828, 7.519570350646973, 7.860044002532959, 8.200517654418945, 8.540990829467773, 8.881464958190918, 9.221938133239746, 9.56241226196289, 9.902885437011719, 10.243359565734863, 10.583833694458008, 10.924306869506836, 11.26478099822998]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 15.0, 25.0, 40.0, 53.0, 76.0, 129.0, 167.0, 269.0, 410.0, 627.0, 962.0, 1504.0, 2238.0, 3293.0, 4812.0, 7283.0, 10814.0, 15949.0, 23721.0, 35060.0, 51081.0, 74672.0, 104481.0, 135839.0, 147348.0, 127751.0, 94001.0, 66203.0, 44949.0, 30923.0, 20660.0, 14231.0, 9551.0, 6479.0, 4356.0, 2888.0, 1980.0, 1249.0, 829.0, 556.0, 355.0, 245.0, 148.0, 108.0, 66.0, 50.0, 37.0, 16.0, 15.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0], "bins": [-9.0390625, -8.7679443359375, -8.496826171875, -8.2257080078125, -7.95458984375, -7.6834716796875, -7.412353515625, -7.1412353515625, -6.8701171875, -6.5989990234375, -6.327880859375, -6.0567626953125, -5.78564453125, -5.5145263671875, -5.243408203125, -4.9722900390625, -4.701171875, -4.4300537109375, -4.158935546875, -3.8878173828125, -3.61669921875, -3.3455810546875, -3.074462890625, -2.8033447265625, -2.5322265625, -2.2611083984375, -1.989990234375, -1.7188720703125, -1.44775390625, -1.1766357421875, -0.905517578125, -0.6343994140625, -0.36328125, -0.0921630859375, 0.178955078125, 0.4500732421875, 0.72119140625, 0.9923095703125, 1.263427734375, 1.5345458984375, 1.8056640625, 2.0767822265625, 2.347900390625, 2.6190185546875, 2.89013671875, 3.1612548828125, 3.432373046875, 3.7034912109375, 3.974609375, 4.2457275390625, 4.516845703125, 4.7879638671875, 5.05908203125, 5.3302001953125, 5.601318359375, 5.8724365234375, 6.1435546875, 6.4146728515625, 6.685791015625, 6.9569091796875, 7.22802734375, 7.4991455078125, 7.770263671875, 8.0413818359375, 8.3125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 9.0, 8.0, 8.0, 18.0, 11.0, 17.0, 14.0, 25.0, 20.0, 21.0, 25.0, 28.0, 31.0, 20.0, 36.0, 29.0, 40.0, 43.0, 36.0, 42.0, 33.0, 37.0, 32.0, 41.0, 38.0, 29.0, 27.0, 30.0, 24.0, 31.0, 21.0, 23.0, 20.0, 15.0, 11.0, 10.0, 13.0, 16.0, 14.0, 7.0, 8.0, 7.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3333740234375, -9.026123046875, -8.7188720703125, -8.41162109375, -8.1043701171875, -7.797119140625, -7.4898681640625, -7.1826171875, -6.8753662109375, -6.568115234375, -6.2608642578125, -5.95361328125, -5.6463623046875, -5.339111328125, -5.0318603515625, -4.724609375, -4.4173583984375, -4.110107421875, -3.8028564453125, -3.49560546875, -3.1883544921875, -2.881103515625, -2.5738525390625, -2.2666015625, -1.9593505859375, -1.652099609375, -1.3448486328125, -1.03759765625, -0.7303466796875, -0.423095703125, -0.1158447265625, 0.19140625, 0.4986572265625, 0.805908203125, 1.1131591796875, 1.42041015625, 1.7276611328125, 2.034912109375, 2.3421630859375, 2.6494140625, 2.9566650390625, 3.263916015625, 3.5711669921875, 3.87841796875, 4.1856689453125, 4.492919921875, 4.8001708984375, 5.107421875, 5.4146728515625, 5.721923828125, 6.0291748046875, 6.33642578125, 6.6436767578125, 6.950927734375, 7.2581787109375, 7.5654296875, 7.8726806640625, 8.179931640625, 8.4871826171875, 8.79443359375, 9.1016845703125, 9.408935546875, 9.7161865234375, 10.0234375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 12.0, 18.0, 25.0, 29.0, 57.0, 55.0, 84.0, 145.0, 157.0, 205.0, 294.0, 452.0, 609.0, 851.0, 1287.0, 1793.0, 2717.0, 3863.0, 5919.0, 9275.0, 15152.0, 28784.0, 396290.0, 506438.0, 30269.0, 15679.0, 9420.0, 5863.0, 3813.0, 2723.0, 1873.0, 1226.0, 936.0, 609.0, 435.0, 352.0, 231.0, 175.0, 127.0, 84.0, 59.0, 43.0, 25.0, 26.0, 21.0, 12.0, 8.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-14.9765625, -14.5089111328125, -14.041259765625, -13.5736083984375, -13.10595703125, -12.6383056640625, -12.170654296875, -11.7030029296875, -11.2353515625, -10.7677001953125, -10.300048828125, -9.8323974609375, -9.36474609375, -8.8970947265625, -8.429443359375, -7.9617919921875, -7.494140625, -7.0264892578125, -6.558837890625, -6.0911865234375, -5.62353515625, -5.1558837890625, -4.688232421875, -4.2205810546875, -3.7529296875, -3.2852783203125, -2.817626953125, -2.3499755859375, -1.88232421875, -1.4146728515625, -0.947021484375, -0.4793701171875, -0.01171875, 0.4559326171875, 0.923583984375, 1.3912353515625, 1.85888671875, 2.3265380859375, 2.794189453125, 3.2618408203125, 3.7294921875, 4.1971435546875, 4.664794921875, 5.1324462890625, 5.60009765625, 6.0677490234375, 6.535400390625, 7.0030517578125, 7.470703125, 7.9383544921875, 8.406005859375, 8.8736572265625, 9.34130859375, 9.8089599609375, 10.276611328125, 10.7442626953125, 11.2119140625, 11.6795654296875, 12.147216796875, 12.6148681640625, 13.08251953125, 13.5501708984375, 14.017822265625, 14.4854736328125, 14.953125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 11.0, 10.0, 16.0, 13.0, 14.0, 16.0, 25.0, 30.0, 34.0, 38.0, 38.0, 36.0, 47.0, 46.0, 41.0, 40.0, 57.0, 36.0, 46.0, 56.0, 39.0, 38.0, 31.0, 33.0, 25.0, 31.0, 25.0, 28.0, 19.0, 10.0, 10.0, 10.0, 8.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.5859375, -10.2733154296875, -9.960693359375, -9.6480712890625, -9.33544921875, -9.0228271484375, -8.710205078125, -8.3975830078125, -8.0849609375, -7.7723388671875, -7.459716796875, -7.1470947265625, -6.83447265625, -6.5218505859375, -6.209228515625, -5.8966064453125, -5.583984375, -5.2713623046875, -4.958740234375, -4.6461181640625, -4.33349609375, -4.0208740234375, -3.708251953125, -3.3956298828125, -3.0830078125, -2.7703857421875, -2.457763671875, -2.1451416015625, -1.83251953125, -1.5198974609375, -1.207275390625, -0.8946533203125, -0.58203125, -0.2694091796875, 0.043212890625, 0.3558349609375, 0.66845703125, 0.9810791015625, 1.293701171875, 1.6063232421875, 1.9189453125, 2.2315673828125, 2.544189453125, 2.8568115234375, 3.16943359375, 3.4820556640625, 3.794677734375, 4.1072998046875, 4.419921875, 4.7325439453125, 5.045166015625, 5.3577880859375, 5.67041015625, 5.9830322265625, 6.295654296875, 6.6082763671875, 6.9208984375, 7.2335205078125, 7.546142578125, 7.8587646484375, 8.17138671875, 8.4840087890625, 8.796630859375, 9.1092529296875, 9.421875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 8.0, 5.0, 8.0, 12.0, 19.0, 21.0, 25.0, 18.0, 41.0, 62.0, 91.0, 120.0, 134.0, 225.0, 284.0, 440.0, 697.0, 1014.0, 1618.0, 2767.0, 4744.0, 8478.0, 17236.0, 49938.0, 843003.0, 73936.0, 20300.0, 9616.0, 5299.0, 3085.0, 1802.0, 1135.0, 698.0, 497.0, 314.0, 223.0, 161.0, 122.0, 84.0, 80.0, 47.0, 37.0, 35.0, 19.0, 18.0, 13.0, 5.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0], "bins": [-8.3515625, -8.116943359375, -7.88232421875, -7.647705078125, -7.4130859375, -7.178466796875, -6.94384765625, -6.709228515625, -6.474609375, -6.239990234375, -6.00537109375, -5.770751953125, -5.5361328125, -5.301513671875, -5.06689453125, -4.832275390625, -4.59765625, -4.363037109375, -4.12841796875, -3.893798828125, -3.6591796875, -3.424560546875, -3.18994140625, -2.955322265625, -2.720703125, -2.486083984375, -2.25146484375, -2.016845703125, -1.7822265625, -1.547607421875, -1.31298828125, -1.078369140625, -0.84375, -0.609130859375, -0.37451171875, -0.139892578125, 0.0947265625, 0.329345703125, 0.56396484375, 0.798583984375, 1.033203125, 1.267822265625, 1.50244140625, 1.737060546875, 1.9716796875, 2.206298828125, 2.44091796875, 2.675537109375, 2.91015625, 3.144775390625, 3.37939453125, 3.614013671875, 3.8486328125, 4.083251953125, 4.31787109375, 4.552490234375, 4.787109375, 5.021728515625, 5.25634765625, 5.490966796875, 5.7255859375, 5.960205078125, 6.19482421875, 6.429443359375, 6.6640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 7.0, 5.0, 7.0, 7.0, 13.0, 8.0, 9.0, 17.0, 22.0, 29.0, 35.0, 67.0, 88.0, 151.0, 156.0, 119.0, 62.0, 46.0, 31.0, 27.0, 20.0, 15.0, 10.0, 8.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010576248168945312, -0.0010138154029846191, -0.000970005989074707, -0.0009261965751647949, -0.0008823871612548828, -0.0008385777473449707, -0.0007947683334350586, -0.0007509589195251465, -0.0007071495056152344, -0.0006633400917053223, -0.0006195306777954102, -0.000575721263885498, -0.0005319118499755859, -0.00048810243606567383, -0.0004442930221557617, -0.0004004836082458496, -0.0003566741943359375, -0.0003128647804260254, -0.0002690553665161133, -0.00022524595260620117, -0.00018143653869628906, -0.00013762712478637695, -9.381771087646484e-05, -5.0008296966552734e-05, -6.198883056640625e-06, 3.7610530853271484e-05, 8.14199447631836e-05, 0.0001252293586730957, 0.0001690387725830078, 0.00021284818649291992, 0.00025665760040283203, 0.00030046701431274414, 0.00034427642822265625, 0.00038808584213256836, 0.00043189525604248047, 0.0004757046699523926, 0.0005195140838623047, 0.0005633234977722168, 0.0006071329116821289, 0.000650942325592041, 0.0006947517395019531, 0.0007385611534118652, 0.0007823705673217773, 0.0008261799812316895, 0.0008699893951416016, 0.0009137988090515137, 0.0009576082229614258, 0.0010014176368713379, 0.00104522705078125, 0.0010890364646911621, 0.0011328458786010742, 0.0011766552925109863, 0.0012204647064208984, 0.0012642741203308105, 0.0013080835342407227, 0.0013518929481506348, 0.0013957023620605469, 0.001439511775970459, 0.001483321189880371, 0.0015271306037902832, 0.0015709400177001953, 0.0016147494316101074, 0.0016585588455200195, 0.0017023682594299316, 0.0017461776733398438]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 7.0, 10.0, 17.0, 12.0, 17.0, 25.0, 33.0, 48.0, 68.0, 81.0, 134.0, 158.0, 257.0, 392.0, 614.0, 981.0, 1658.0, 2742.0, 4794.0, 8730.0, 17221.0, 38524.0, 94946.0, 230141.0, 326906.0, 184924.0, 72890.0, 30321.0, 14060.0, 7190.0, 4092.0, 2389.0, 1513.0, 905.0, 551.0, 382.0, 256.0, 171.0, 125.0, 79.0, 41.0, 46.0, 29.0, 24.0, 11.0, 13.0, 7.0, 11.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.232421875, -3.132537841796875, -3.03265380859375, -2.932769775390625, -2.8328857421875, -2.733001708984375, -2.63311767578125, -2.533233642578125, -2.433349609375, -2.333465576171875, -2.23358154296875, -2.133697509765625, -2.0338134765625, -1.933929443359375, -1.83404541015625, -1.734161376953125, -1.63427734375, -1.534393310546875, -1.43450927734375, -1.334625244140625, -1.2347412109375, -1.134857177734375, -1.03497314453125, -0.935089111328125, -0.835205078125, -0.735321044921875, -0.63543701171875, -0.535552978515625, -0.4356689453125, -0.335784912109375, -0.23590087890625, -0.136016845703125, -0.0361328125, 0.063751220703125, 0.16363525390625, 0.263519287109375, 0.3634033203125, 0.463287353515625, 0.56317138671875, 0.663055419921875, 0.762939453125, 0.862823486328125, 0.96270751953125, 1.062591552734375, 1.1624755859375, 1.262359619140625, 1.36224365234375, 1.462127685546875, 1.56201171875, 1.661895751953125, 1.76177978515625, 1.861663818359375, 1.9615478515625, 2.061431884765625, 2.16131591796875, 2.261199951171875, 2.361083984375, 2.460968017578125, 2.56085205078125, 2.660736083984375, 2.7606201171875, 2.860504150390625, 2.96038818359375, 3.060272216796875, 3.16015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 5.0, 8.0, 10.0, 12.0, 14.0, 22.0, 21.0, 21.0, 30.0, 36.0, 40.0, 65.0, 53.0, 78.0, 65.0, 67.0, 80.0, 53.0, 60.0, 46.0, 41.0, 26.0, 21.0, 25.0, 8.0, 6.0, 13.0, 9.0, 6.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5145263671875, -0.495361328125, -0.4761962890625, -0.45703125, -0.4378662109375, -0.418701171875, -0.3995361328125, -0.38037109375, -0.3612060546875, -0.342041015625, -0.3228759765625, -0.3037109375, -0.2845458984375, -0.265380859375, -0.2462158203125, -0.22705078125, -0.2078857421875, -0.188720703125, -0.1695556640625, -0.150390625, -0.1312255859375, -0.112060546875, -0.0928955078125, -0.07373046875, -0.0545654296875, -0.035400390625, -0.0162353515625, 0.0029296875, 0.0220947265625, 0.041259765625, 0.0604248046875, 0.07958984375, 0.0987548828125, 0.117919921875, 0.1370849609375, 0.15625, 0.1754150390625, 0.194580078125, 0.2137451171875, 0.23291015625, 0.2520751953125, 0.271240234375, 0.2904052734375, 0.3095703125, 0.3287353515625, 0.347900390625, 0.3670654296875, 0.38623046875, 0.4053955078125, 0.424560546875, 0.4437255859375, 0.462890625, 0.4820556640625, 0.501220703125, 0.5203857421875, 0.53955078125, 0.5587158203125, 0.577880859375, 0.5970458984375, 0.6162109375, 0.6353759765625, 0.654541015625, 0.6737060546875, 0.69287109375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 15.0, 6.0, 14.0, 11.0, 10.0, 18.0, 18.0, 30.0, 34.0, 42.0, 55.0, 49.0, 53.0, 48.0, 55.0, 45.0, 66.0, 50.0, 51.0, 56.0, 52.0, 37.0, 39.0, 19.0, 28.0, 10.0, 15.0, 16.0, 14.0, 5.0, 6.0, 11.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.213982582092285, -13.781763076782227, -13.349544525146484, -12.917325019836426, -12.485105514526367, -12.052886009216309, -11.62066650390625, -11.188447952270508, -10.75622844696045, -10.32400894165039, -9.891790390014648, -9.45957088470459, -9.027351379394531, -8.595131874084473, -8.162912368774414, -7.730693817138672, -7.298474311828613, -6.866254806518555, -6.434035778045654, -6.001816749572754, -5.569597244262695, -5.137377738952637, -4.705158710479736, -4.272939682006836, -3.8407201766967773, -3.408500909805298, -2.9762816429138184, -2.544062376022339, -2.1118431091308594, -1.6796238422393799, -1.2474045753479004, -0.8151853084564209, -0.3829669952392578, 0.04925227165222168, 0.48147153854370117, 0.9136908054351807, 1.3459100723266602, 1.7781293392181396, 2.210348606109619, 2.6425678730010986, 3.074787139892578, 3.5070064067840576, 3.939225673675537, 4.3714447021484375, 4.803664207458496, 5.235883712768555, 5.668102741241455, 6.1003217697143555, 6.532541275024414, 6.964760780334473, 7.396979808807373, 7.829198837280273, 8.261418342590332, 8.69363784790039, 9.125856399536133, 9.558075904846191, 9.99029541015625, 10.422514915466309, 10.854734420776367, 11.28695297241211, 11.719172477722168, 12.151391983032227, 12.583610534667969, 13.015830039978027, 13.448049545288086]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 12.0, 15.0, 11.0, 13.0, 15.0, 19.0, 24.0, 24.0, 20.0, 26.0, 31.0, 41.0, 42.0, 32.0, 36.0, 41.0, 40.0, 39.0, 40.0, 36.0, 41.0, 41.0, 29.0, 34.0, 28.0, 27.0, 29.0, 29.0, 18.0, 19.0, 20.0, 25.0, 14.0, 8.0, 18.0, 7.0, 6.0, 5.0, 6.0, 1.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.732009887695312, -9.416609764099121, -9.101210594177246, -8.785810470581055, -8.47041130065918, -8.155011177062988, -7.839611530303955, -7.524211883544922, -7.208812236785889, -6.8934125900268555, -6.578012943267822, -6.262613296508789, -5.947213172912598, -5.631814002990723, -5.316413879394531, -5.001014232635498, -4.685614585876465, -4.370214939117432, -4.054815292358398, -3.739415407180786, -3.424015760421753, -3.1086161136627197, -2.7932162284851074, -2.477816581726074, -2.162416934967041, -1.8470172882080078, -1.531617522239685, -1.2162177562713623, -0.9008181095123291, -0.5854184627532959, -0.27001869678497314, 0.04538106918334961, 0.3607816696166992, 0.6761813759803772, 0.9915810823440552, 1.306980848312378, 1.6223804950714111, 1.9377801418304443, 2.2531800270080566, 2.56857967376709, 2.883979320526123, 3.1993789672851562, 3.5147786140441895, 3.8301784992218018, 4.145578384399414, 4.460977554321289, 4.7763776779174805, 5.091777324676514, 5.407176971435547, 5.72257661819458, 6.037976264953613, 6.3533759117126465, 6.66877555847168, 6.984175682067871, 7.299575328826904, 7.6149749755859375, 7.930374622344971, 8.245774269104004, 8.561174392700195, 8.87657356262207, 9.191973686218262, 9.507372856140137, 9.822772979736328, 10.138172149658203, 10.453572273254395]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 18.0, 30.0, 47.0, 79.0, 154.0, 268.0, 515.0, 876.0, 1592.0, 3057.0, 5713.0, 10713.0, 19830.0, 36602.0, 64949.0, 106147.0, 152297.0, 179042.0, 165238.0, 123306.0, 78149.0, 45754.0, 25138.0, 13640.0, 7211.0, 3730.0, 1978.0, 1090.0, 605.0, 336.0, 149.0, 94.0, 80.0, 30.0, 31.0, 15.0, 15.0, 2.0, 1.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.5703125, -14.1619873046875, -13.753662109375, -13.3453369140625, -12.93701171875, -12.5286865234375, -12.120361328125, -11.7120361328125, -11.3037109375, -10.8953857421875, -10.487060546875, -10.0787353515625, -9.67041015625, -9.2620849609375, -8.853759765625, -8.4454345703125, -8.037109375, -7.6287841796875, -7.220458984375, -6.8121337890625, -6.40380859375, -5.9954833984375, -5.587158203125, -5.1788330078125, -4.7705078125, -4.3621826171875, -3.953857421875, -3.5455322265625, -3.13720703125, -2.7288818359375, -2.320556640625, -1.9122314453125, -1.50390625, -1.0955810546875, -0.687255859375, -0.2789306640625, 0.12939453125, 0.5377197265625, 0.946044921875, 1.3543701171875, 1.7626953125, 2.1710205078125, 2.579345703125, 2.9876708984375, 3.39599609375, 3.8043212890625, 4.212646484375, 4.6209716796875, 5.029296875, 5.4376220703125, 5.845947265625, 6.2542724609375, 6.66259765625, 7.0709228515625, 7.479248046875, 7.8875732421875, 8.2958984375, 8.7042236328125, 9.112548828125, 9.5208740234375, 9.92919921875, 10.3375244140625, 10.745849609375, 11.1541748046875, 11.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 9.0, 12.0, 12.0, 22.0, 22.0, 16.0, 25.0, 21.0, 22.0, 14.0, 32.0, 36.0, 32.0, 48.0, 45.0, 57.0, 37.0, 47.0, 50.0, 34.0, 41.0, 41.0, 44.0, 38.0, 32.0, 28.0, 34.0, 26.0, 15.0, 15.0, 18.0, 21.0, 15.0, 9.0, 9.0, 1.0, 5.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.3125, -9.988525390625, -9.66455078125, -9.340576171875, -9.0166015625, -8.692626953125, -8.36865234375, -8.044677734375, -7.720703125, -7.396728515625, -7.07275390625, -6.748779296875, -6.4248046875, -6.100830078125, -5.77685546875, -5.452880859375, -5.12890625, -4.804931640625, -4.48095703125, -4.156982421875, -3.8330078125, -3.509033203125, -3.18505859375, -2.861083984375, -2.537109375, -2.213134765625, -1.88916015625, -1.565185546875, -1.2412109375, -0.917236328125, -0.59326171875, -0.269287109375, 0.0546875, 0.378662109375, 0.70263671875, 1.026611328125, 1.3505859375, 1.674560546875, 1.99853515625, 2.322509765625, 2.646484375, 2.970458984375, 3.29443359375, 3.618408203125, 3.9423828125, 4.266357421875, 4.59033203125, 4.914306640625, 5.23828125, 5.562255859375, 5.88623046875, 6.210205078125, 6.5341796875, 6.858154296875, 7.18212890625, 7.506103515625, 7.830078125, 8.154052734375, 8.47802734375, 8.802001953125, 9.1259765625, 9.449951171875, 9.77392578125, 10.097900390625, 10.421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 6.0, 11.0, 21.0, 33.0, 50.0, 78.0, 135.0, 173.0, 267.0, 425.0, 748.0, 1246.0, 2127.0, 3528.0, 6155.0, 10332.0, 17578.0, 28821.0, 46972.0, 73088.0, 104807.0, 136400.0, 151487.0, 141885.0, 112424.0, 79260.0, 51377.0, 31819.0, 19121.0, 11491.0, 6712.0, 3992.0, 2427.0, 1375.0, 862.0, 510.0, 318.0, 183.0, 120.0, 70.0, 47.0, 31.0, 15.0, 8.0, 8.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.554931640625, -9.24267578125, -8.930419921875, -8.6181640625, -8.305908203125, -7.99365234375, -7.681396484375, -7.369140625, -7.056884765625, -6.74462890625, -6.432373046875, -6.1201171875, -5.807861328125, -5.49560546875, -5.183349609375, -4.87109375, -4.558837890625, -4.24658203125, -3.934326171875, -3.6220703125, -3.309814453125, -2.99755859375, -2.685302734375, -2.373046875, -2.060791015625, -1.74853515625, -1.436279296875, -1.1240234375, -0.811767578125, -0.49951171875, -0.187255859375, 0.125, 0.437255859375, 0.74951171875, 1.061767578125, 1.3740234375, 1.686279296875, 1.99853515625, 2.310791015625, 2.623046875, 2.935302734375, 3.24755859375, 3.559814453125, 3.8720703125, 4.184326171875, 4.49658203125, 4.808837890625, 5.12109375, 5.433349609375, 5.74560546875, 6.057861328125, 6.3701171875, 6.682373046875, 6.99462890625, 7.306884765625, 7.619140625, 7.931396484375, 8.24365234375, 8.555908203125, 8.8681640625, 9.180419921875, 9.49267578125, 9.804931640625, 10.1171875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 6.0, 11.0, 5.0, 17.0, 18.0, 24.0, 28.0, 29.0, 33.0, 28.0, 26.0, 38.0, 46.0, 32.0, 39.0, 47.0, 63.0, 40.0, 48.0, 50.0, 31.0, 40.0, 36.0, 38.0, 33.0, 20.0, 33.0, 21.0, 15.0, 15.0, 21.0, 13.0, 10.0, 13.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.145751953125, -5.93603515625, -5.726318359375, -5.5166015625, -5.306884765625, -5.09716796875, -4.887451171875, -4.677734375, -4.468017578125, -4.25830078125, -4.048583984375, -3.8388671875, -3.629150390625, -3.41943359375, -3.209716796875, -3.0, -2.790283203125, -2.58056640625, -2.370849609375, -2.1611328125, -1.951416015625, -1.74169921875, -1.531982421875, -1.322265625, -1.112548828125, -0.90283203125, -0.693115234375, -0.4833984375, -0.273681640625, -0.06396484375, 0.145751953125, 0.35546875, 0.565185546875, 0.77490234375, 0.984619140625, 1.1943359375, 1.404052734375, 1.61376953125, 1.823486328125, 2.033203125, 2.242919921875, 2.45263671875, 2.662353515625, 2.8720703125, 3.081787109375, 3.29150390625, 3.501220703125, 3.7109375, 3.920654296875, 4.13037109375, 4.340087890625, 4.5498046875, 4.759521484375, 4.96923828125, 5.178955078125, 5.388671875, 5.598388671875, 5.80810546875, 6.017822265625, 6.2275390625, 6.437255859375, 6.64697265625, 6.856689453125, 7.06640625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 5.0, 12.0, 11.0, 16.0, 25.0, 37.0, 50.0, 89.0, 180.0, 286.0, 492.0, 1047.0, 2105.0, 4813.0, 11940.0, 31999.0, 91204.0, 242333.0, 354366.0, 195095.0, 70508.0, 24867.0, 9466.0, 3923.0, 1781.0, 834.0, 446.0, 238.0, 154.0, 82.0, 52.0, 28.0, 17.0, 25.0, 8.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.5013427734375, -13.041748046875, -12.5821533203125, -12.12255859375, -11.6629638671875, -11.203369140625, -10.7437744140625, -10.2841796875, -9.8245849609375, -9.364990234375, -8.9053955078125, -8.44580078125, -7.9862060546875, -7.526611328125, -7.0670166015625, -6.607421875, -6.1478271484375, -5.688232421875, -5.2286376953125, -4.76904296875, -4.3094482421875, -3.849853515625, -3.3902587890625, -2.9306640625, -2.4710693359375, -2.011474609375, -1.5518798828125, -1.09228515625, -0.6326904296875, -0.173095703125, 0.2864990234375, 0.74609375, 1.2056884765625, 1.665283203125, 2.1248779296875, 2.58447265625, 3.0440673828125, 3.503662109375, 3.9632568359375, 4.4228515625, 4.8824462890625, 5.342041015625, 5.8016357421875, 6.26123046875, 6.7208251953125, 7.180419921875, 7.6400146484375, 8.099609375, 8.5592041015625, 9.018798828125, 9.4783935546875, 9.93798828125, 10.3975830078125, 10.857177734375, 11.3167724609375, 11.7763671875, 12.2359619140625, 12.695556640625, 13.1551513671875, 13.61474609375, 14.0743408203125, 14.533935546875, 14.9935302734375, 15.453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 2.0, 5.0, 11.0, 12.0, 13.0, 18.0, 32.0, 32.0, 36.0, 51.0, 71.0, 77.0, 89.0, 82.0, 83.0, 65.0, 60.0, 60.0, 28.0, 34.0, 29.0, 22.0, 20.0, 9.0, 12.0, 9.0, 8.0, 3.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008878707885742188, -0.0008578747510910034, -0.0008278787136077881, -0.0007978826761245728, -0.0007678866386413574, -0.0007378906011581421, -0.0007078945636749268, -0.0006778985261917114, -0.0006479024887084961, -0.0006179064512252808, -0.0005879104137420654, -0.0005579143762588501, -0.0005279183387756348, -0.0004979223012924194, -0.0004679262638092041, -0.00043793022632598877, -0.00040793418884277344, -0.0003779381513595581, -0.0003479421138763428, -0.00031794607639312744, -0.0002879500389099121, -0.0002579540014266968, -0.00022795796394348145, -0.0001979619264602661, -0.00016796588897705078, -0.00013796985149383545, -0.00010797381401062012, -7.797777652740479e-05, -4.798173904418945e-05, -1.798570156097412e-05, 1.2010335922241211e-05, 4.200637340545654e-05, 7.200241088867188e-05, 0.00010199844837188721, 0.00013199448585510254, 0.00016199052333831787, 0.0001919865608215332, 0.00022198259830474854, 0.00025197863578796387, 0.0002819746732711792, 0.00031197071075439453, 0.00034196674823760986, 0.0003719627857208252, 0.00040195882320404053, 0.00043195486068725586, 0.0004619508981704712, 0.0004919469356536865, 0.0005219429731369019, 0.0005519390106201172, 0.0005819350481033325, 0.0006119310855865479, 0.0006419271230697632, 0.0006719231605529785, 0.0007019191980361938, 0.0007319152355194092, 0.0007619112730026245, 0.0007919073104858398, 0.0008219033479690552, 0.0008518993854522705, 0.0008818954229354858, 0.0009118914604187012, 0.0009418874979019165, 0.0009718835353851318, 0.0010018795728683472, 0.0010318756103515625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 30.0, 23.0, 32.0, 48.0, 59.0, 92.0, 137.0, 192.0, 335.0, 450.0, 840.0, 1352.0, 2395.0, 4413.0, 8617.0, 17424.0, 37035.0, 78320.0, 155757.0, 238713.0, 228306.0, 139716.0, 69449.0, 32429.0, 15288.0, 7760.0, 3930.0, 2242.0, 1173.0, 729.0, 403.0, 238.0, 179.0, 127.0, 90.0, 53.0, 53.0, 28.0, 17.0, 15.0, 15.0, 8.0, 12.0, 8.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.8001708984375, -9.483154296875, -9.1661376953125, -8.84912109375, -8.5321044921875, -8.215087890625, -7.8980712890625, -7.5810546875, -7.2640380859375, -6.947021484375, -6.6300048828125, -6.31298828125, -5.9959716796875, -5.678955078125, -5.3619384765625, -5.044921875, -4.7279052734375, -4.410888671875, -4.0938720703125, -3.77685546875, -3.4598388671875, -3.142822265625, -2.8258056640625, -2.5087890625, -2.1917724609375, -1.874755859375, -1.5577392578125, -1.24072265625, -0.9237060546875, -0.606689453125, -0.2896728515625, 0.02734375, 0.3443603515625, 0.661376953125, 0.9783935546875, 1.29541015625, 1.6124267578125, 1.929443359375, 2.2464599609375, 2.5634765625, 2.8804931640625, 3.197509765625, 3.5145263671875, 3.83154296875, 4.1485595703125, 4.465576171875, 4.7825927734375, 5.099609375, 5.4166259765625, 5.733642578125, 6.0506591796875, 6.36767578125, 6.6846923828125, 7.001708984375, 7.3187255859375, 7.6357421875, 7.9527587890625, 8.269775390625, 8.5867919921875, 8.90380859375, 9.2208251953125, 9.537841796875, 9.8548583984375, 10.171875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 6.0, 6.0, 14.0, 18.0, 16.0, 20.0, 19.0, 33.0, 46.0, 43.0, 53.0, 53.0, 67.0, 63.0, 64.0, 77.0, 60.0, 64.0, 65.0, 44.0, 30.0, 25.0, 17.0, 19.0, 14.0, 8.0, 11.0, 1.0, 10.0, 4.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.5179443359375, -2.434326171875, -2.3507080078125, -2.26708984375, -2.1834716796875, -2.099853515625, -2.0162353515625, -1.9326171875, -1.8489990234375, -1.765380859375, -1.6817626953125, -1.59814453125, -1.5145263671875, -1.430908203125, -1.3472900390625, -1.263671875, -1.1800537109375, -1.096435546875, -1.0128173828125, -0.92919921875, -0.8455810546875, -0.761962890625, -0.6783447265625, -0.5947265625, -0.5111083984375, -0.427490234375, -0.3438720703125, -0.26025390625, -0.1766357421875, -0.093017578125, -0.0093994140625, 0.07421875, 0.1578369140625, 0.241455078125, 0.3250732421875, 0.40869140625, 0.4923095703125, 0.575927734375, 0.6595458984375, 0.7431640625, 0.8267822265625, 0.910400390625, 0.9940185546875, 1.07763671875, 1.1612548828125, 1.244873046875, 1.3284912109375, 1.412109375, 1.4957275390625, 1.579345703125, 1.6629638671875, 1.74658203125, 1.8302001953125, 1.913818359375, 1.9974365234375, 2.0810546875, 2.1646728515625, 2.248291015625, 2.3319091796875, 2.41552734375, 2.4991455078125, 2.582763671875, 2.6663818359375, 2.75]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 12.0, 8.0, 8.0, 12.0, 15.0, 9.0, 19.0, 33.0, 25.0, 33.0, 36.0, 37.0, 34.0, 37.0, 60.0, 43.0, 39.0, 43.0, 35.0, 56.0, 45.0, 50.0, 45.0, 38.0, 25.0, 26.0, 19.0, 18.0, 17.0, 14.0, 14.0, 17.0, 9.0, 12.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.719067573547363, -9.397351264953613, -9.07563591003418, -8.75391960144043, -8.43220329284668, -8.11048698425293, -7.788771152496338, -7.467055320739746, -7.145339012145996, -6.823622703552246, -6.501906871795654, -6.1801910400390625, -5.8584747314453125, -5.5367584228515625, -5.215042591094971, -4.893326759338379, -4.571610450744629, -4.249894142150879, -3.928178310394287, -3.606462240219116, -3.2847461700439453, -2.9630300998687744, -2.6413140296936035, -2.3195979595184326, -1.9978818893432617, -1.6761658191680908, -1.35444974899292, -1.032733678817749, -0.7110176086425781, -0.3893015384674072, -0.06758546829223633, 0.25413060188293457, 0.5758476257324219, 0.8975636959075928, 1.2192797660827637, 1.5409958362579346, 1.8627119064331055, 2.1844279766082764, 2.5061440467834473, 2.827860116958618, 3.149576187133789, 3.47129225730896, 3.793008327484131, 4.114724159240723, 4.436440467834473, 4.758156776428223, 5.0798726081848145, 5.401588439941406, 5.723304748535156, 6.045021057128906, 6.366736888885498, 6.68845272064209, 7.01016902923584, 7.33188533782959, 7.653601169586182, 7.975317001342773, 8.297033309936523, 8.618749618530273, 8.940465927124023, 9.262181282043457, 9.583897590637207, 9.905613899230957, 10.22732925415039, 10.54904556274414, 10.87076187133789]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 6.0, 6.0, 3.0, 17.0, 15.0, 19.0, 16.0, 20.0, 12.0, 27.0, 35.0, 27.0, 35.0, 34.0, 29.0, 49.0, 39.0, 44.0, 41.0, 40.0, 44.0, 36.0, 38.0, 44.0, 38.0, 33.0, 36.0, 24.0, 21.0, 24.0, 20.0, 22.0, 21.0, 20.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.343703269958496, -10.032953262329102, -9.722203254699707, -9.411454200744629, -9.100704193115234, -8.78995418548584, -8.479204177856445, -8.16845417022705, -7.8577046394348145, -7.54695463180542, -7.236205101013184, -6.925455093383789, -6.6147050857543945, -6.303955554962158, -5.993205547332764, -5.682456016540527, -5.371706008911133, -5.060956001281738, -4.750206470489502, -4.439456462860107, -4.128706932067871, -3.8179569244384766, -3.507206916809082, -3.1964571475982666, -2.885707378387451, -2.5749576091766357, -2.2642078399658203, -1.9534578323364258, -1.6427080631256104, -1.331958293914795, -1.02120840549469, -0.710458517074585, -0.39970970153808594, -0.08895987272262573, 0.22178995609283447, 0.5325397849082947, 0.8432896137237549, 1.1540393829345703, 1.4647892713546753, 1.7755391597747803, 2.0862889289855957, 2.397038698196411, 2.7077884674072266, 3.018538475036621, 3.3292882442474365, 3.640038013458252, 3.9507880210876465, 4.261537551879883, 4.572287559509277, 4.883037567138672, 5.193787097930908, 5.504537105560303, 5.815286636352539, 6.126036643981934, 6.436786651611328, 6.747536659240723, 7.058286190032959, 7.3690361976623535, 7.67978572845459, 7.990535736083984, 8.301285743713379, 8.612035751342773, 8.922784805297852, 9.233534812927246, 9.54428482055664]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 17.0, 24.0, 44.0, 53.0, 70.0, 121.0, 180.0, 290.0, 477.0, 692.0, 1167.0, 1808.0, 2929.0, 4538.0, 7566.0, 12299.0, 20815.0, 35748.0, 62829.0, 112185.0, 203305.0, 370422.0, 610841.0, 800621.0, 751076.0, 518889.0, 298203.0, 162118.0, 88962.0, 50514.0, 29569.0, 17444.0, 10642.0, 6377.0, 4108.0, 2582.0, 1609.0, 1039.0, 712.0, 479.0, 318.0, 196.0, 119.0, 85.0, 66.0, 47.0, 19.0, 18.0, 14.0, 15.0, 4.0, 9.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.234375, -7.9755859375, -7.716796875, -7.4580078125, -7.19921875, -6.9404296875, -6.681640625, -6.4228515625, -6.1640625, -5.9052734375, -5.646484375, -5.3876953125, -5.12890625, -4.8701171875, -4.611328125, -4.3525390625, -4.09375, -3.8349609375, -3.576171875, -3.3173828125, -3.05859375, -2.7998046875, -2.541015625, -2.2822265625, -2.0234375, -1.7646484375, -1.505859375, -1.2470703125, -0.98828125, -0.7294921875, -0.470703125, -0.2119140625, 0.046875, 0.3056640625, 0.564453125, 0.8232421875, 1.08203125, 1.3408203125, 1.599609375, 1.8583984375, 2.1171875, 2.3759765625, 2.634765625, 2.8935546875, 3.15234375, 3.4111328125, 3.669921875, 3.9287109375, 4.1875, 4.4462890625, 4.705078125, 4.9638671875, 5.22265625, 5.4814453125, 5.740234375, 5.9990234375, 6.2578125, 6.5166015625, 6.775390625, 7.0341796875, 7.29296875, 7.5517578125, 7.810546875, 8.0693359375, 8.328125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 6.0, 6.0, 8.0, 8.0, 8.0, 9.0, 11.0, 18.0, 17.0, 24.0, 15.0, 30.0, 25.0, 30.0, 30.0, 31.0, 29.0, 34.0, 51.0, 28.0, 43.0, 49.0, 38.0, 42.0, 36.0, 25.0, 43.0, 46.0, 30.0, 30.0, 33.0, 19.0, 14.0, 17.0, 21.0, 16.0, 20.0, 10.0, 9.0, 14.0, 5.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.015625, -6.80096435546875, -6.5863037109375, -6.37164306640625, -6.156982421875, -5.94232177734375, -5.7276611328125, -5.51300048828125, -5.29833984375, -5.08367919921875, -4.8690185546875, -4.65435791015625, -4.439697265625, -4.22503662109375, -4.0103759765625, -3.79571533203125, -3.5810546875, -3.36639404296875, -3.1517333984375, -2.93707275390625, -2.722412109375, -2.50775146484375, -2.2930908203125, -2.07843017578125, -1.86376953125, -1.64910888671875, -1.4344482421875, -1.21978759765625, -1.005126953125, -0.79046630859375, -0.5758056640625, -0.36114501953125, -0.146484375, 0.06817626953125, 0.2828369140625, 0.49749755859375, 0.712158203125, 0.92681884765625, 1.1414794921875, 1.35614013671875, 1.57080078125, 1.78546142578125, 2.0001220703125, 2.21478271484375, 2.429443359375, 2.64410400390625, 2.8587646484375, 3.07342529296875, 3.2880859375, 3.50274658203125, 3.7174072265625, 3.93206787109375, 4.146728515625, 4.36138916015625, 4.5760498046875, 4.79071044921875, 5.00537109375, 5.22003173828125, 5.4346923828125, 5.64935302734375, 5.864013671875, 6.07867431640625, 6.2933349609375, 6.50799560546875, 6.72265625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 18.0, 21.0, 26.0, 41.0, 82.0, 122.0, 178.0, 306.0, 454.0, 785.0, 1216.0, 2084.0, 3358.0, 5603.0, 9921.0, 17056.0, 29552.0, 52403.0, 93519.0, 167999.0, 296895.0, 495000.0, 721810.0, 788104.0, 611985.0, 386256.0, 222038.0, 125412.0, 69962.0, 39324.0, 21911.0, 12688.0, 7206.0, 4317.0, 2609.0, 1491.0, 919.0, 607.0, 381.0, 240.0, 123.0, 93.0, 68.0, 27.0, 25.0, 17.0, 8.0, 6.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.2734375, -8.98583984375, -8.6982421875, -8.41064453125, -8.123046875, -7.83544921875, -7.5478515625, -7.26025390625, -6.97265625, -6.68505859375, -6.3974609375, -6.10986328125, -5.822265625, -5.53466796875, -5.2470703125, -4.95947265625, -4.671875, -4.38427734375, -4.0966796875, -3.80908203125, -3.521484375, -3.23388671875, -2.9462890625, -2.65869140625, -2.37109375, -2.08349609375, -1.7958984375, -1.50830078125, -1.220703125, -0.93310546875, -0.6455078125, -0.35791015625, -0.0703125, 0.21728515625, 0.5048828125, 0.79248046875, 1.080078125, 1.36767578125, 1.6552734375, 1.94287109375, 2.23046875, 2.51806640625, 2.8056640625, 3.09326171875, 3.380859375, 3.66845703125, 3.9560546875, 4.24365234375, 4.53125, 4.81884765625, 5.1064453125, 5.39404296875, 5.681640625, 5.96923828125, 6.2568359375, 6.54443359375, 6.83203125, 7.11962890625, 7.4072265625, 7.69482421875, 7.982421875, 8.27001953125, 8.5576171875, 8.84521484375, 9.1328125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 10.0, 11.0, 12.0, 18.0, 20.0, 39.0, 36.0, 54.0, 66.0, 92.0, 113.0, 150.0, 162.0, 212.0, 234.0, 253.0, 265.0, 278.0, 281.0, 259.0, 245.0, 222.0, 224.0, 164.0, 147.0, 108.0, 112.0, 80.0, 61.0, 44.0, 29.0, 19.0, 9.0, 8.0, 11.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.089874267578125, -3.96881103515625, -3.847747802734375, -3.7266845703125, -3.605621337890625, -3.48455810546875, -3.363494873046875, -3.242431640625, -3.121368408203125, -3.00030517578125, -2.879241943359375, -2.7581787109375, -2.637115478515625, -2.51605224609375, -2.394989013671875, -2.27392578125, -2.152862548828125, -2.03179931640625, -1.910736083984375, -1.7896728515625, -1.668609619140625, -1.54754638671875, -1.426483154296875, -1.305419921875, -1.184356689453125, -1.06329345703125, -0.942230224609375, -0.8211669921875, -0.700103759765625, -0.57904052734375, -0.457977294921875, -0.3369140625, -0.215850830078125, -0.09478759765625, 0.026275634765625, 0.1473388671875, 0.268402099609375, 0.38946533203125, 0.510528564453125, 0.631591796875, 0.752655029296875, 0.87371826171875, 0.994781494140625, 1.1158447265625, 1.236907958984375, 1.35797119140625, 1.479034423828125, 1.60009765625, 1.721160888671875, 1.84222412109375, 1.963287353515625, 2.0843505859375, 2.205413818359375, 2.32647705078125, 2.447540283203125, 2.568603515625, 2.689666748046875, 2.81072998046875, 2.931793212890625, 3.0528564453125, 3.173919677734375, 3.29498291015625, 3.416046142578125, 3.537109375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 1.0, 1.0, 9.0, 8.0, 5.0, 8.0, 15.0, 8.0, 15.0, 26.0, 18.0, 21.0, 23.0, 17.0, 36.0, 38.0, 44.0, 58.0, 44.0, 53.0, 53.0, 46.0, 43.0, 47.0, 55.0, 36.0, 38.0, 33.0, 42.0, 19.0, 25.0, 18.0, 20.0, 13.0, 10.0, 14.0, 4.0, 12.0, 9.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.56761646270752, -9.275262832641602, -8.982908248901367, -8.69055461883545, -8.398200035095215, -8.105846405029297, -7.813492298126221, -7.5211381912231445, -7.228784561157227, -6.93643045425415, -6.644076347351074, -6.351722717285156, -6.05936861038208, -5.767014503479004, -5.474660396575928, -5.182306289672852, -4.889952182769775, -4.597598075866699, -4.305243968963623, -4.012889862060547, -3.720536231994629, -3.4281821250915527, -3.1358280181884766, -2.8434741497039795, -2.5511200428009033, -2.258765935897827, -1.96641206741333, -1.674057960510254, -1.3817039728164673, -1.0893499851226807, -0.7969958782196045, -0.5046420097351074, -0.21228790283203125, 0.08006611466407776, 0.37242013216018677, 0.6647741794586182, 0.9571281671524048, 1.2494821548461914, 1.5418362617492676, 1.8341901302337646, 2.126544237136841, 2.418898344039917, 2.711252212524414, 3.0036063194274902, 3.2959604263305664, 3.5883142948150635, 3.8806684017181396, 4.173022270202637, 4.465376377105713, 4.757730484008789, 5.050084590911865, 5.342438697814941, 5.634792327880859, 5.9271464347839355, 6.219500541687012, 6.51185417175293, 6.804208755493164, 7.09656286239624, 7.388916969299316, 7.681270599365234, 7.9736247062683105, 8.265978813171387, 8.558332443237305, 8.850687026977539, 9.143040657043457]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 7.0, 4.0, 11.0, 2.0, 6.0, 16.0, 12.0, 8.0, 15.0, 20.0, 14.0, 25.0, 30.0, 34.0, 27.0, 43.0, 42.0, 36.0, 42.0, 45.0, 45.0, 41.0, 39.0, 45.0, 44.0, 29.0, 42.0, 39.0, 36.0, 26.0, 21.0, 25.0, 23.0, 16.0, 12.0, 20.0, 10.0, 10.0, 13.0, 10.0, 6.0, 1.0, 2.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.662756443023682, -7.401858806610107, -7.140961647033691, -6.880064010620117, -6.619166851043701, -6.358269214630127, -6.097372055053711, -5.836474418640137, -5.5755767822265625, -5.314679145812988, -5.053781986236572, -4.792884349822998, -4.531987190246582, -4.271089553833008, -4.010191917419434, -3.7492947578430176, -3.4883975982666016, -3.2275002002716064, -2.9666028022766113, -2.705705165863037, -2.444808006286621, -2.183910369873047, -1.9230129718780518, -1.6621155738830566, -1.4012181758880615, -1.1403207778930664, -0.8794233202934265, -0.6185258626937866, -0.3576284646987915, -0.09673106670379639, 0.16416645050048828, 0.4250638484954834, 0.6859617233276367, 0.9468591213226318, 1.207756519317627, 1.4686540365219116, 1.7295514345169067, 1.9904488325119019, 2.2513463497161865, 2.5122437477111816, 2.7731411457061768, 3.034038543701172, 3.294935941696167, 3.555833339691162, 3.8167309761047363, 4.077628135681152, 4.338525772094727, 4.599423408508301, 4.860320568084717, 5.121218204498291, 5.382115364074707, 5.643013000488281, 5.903910160064697, 6.1648077964782715, 6.4257049560546875, 6.686602592468262, 6.947500228881836, 7.20839786529541, 7.469295024871826, 7.7301926612854, 7.991089820861816, 8.25198745727539, 8.512885093688965, 8.773782730102539, 9.034679412841797]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 12.0, 5.0, 13.0, 29.0, 53.0, 83.0, 130.0, 157.0, 259.0, 388.0, 647.0, 922.0, 1470.0, 2454.0, 3909.0, 6557.0, 12383.0, 24185.0, 49598.0, 105272.0, 205733.0, 270700.0, 183630.0, 90225.0, 42556.0, 20627.0, 10956.0, 6044.0, 3522.0, 2118.0, 1384.0, 895.0, 559.0, 366.0, 230.0, 161.0, 106.0, 81.0, 37.0, 28.0, 20.0, 15.0, 15.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.2890625, -8.033203125, -7.77734375, -7.521484375, -7.265625, -7.009765625, -6.75390625, -6.498046875, -6.2421875, -5.986328125, -5.73046875, -5.474609375, -5.21875, -4.962890625, -4.70703125, -4.451171875, -4.1953125, -3.939453125, -3.68359375, -3.427734375, -3.171875, -2.916015625, -2.66015625, -2.404296875, -2.1484375, -1.892578125, -1.63671875, -1.380859375, -1.125, -0.869140625, -0.61328125, -0.357421875, -0.1015625, 0.154296875, 0.41015625, 0.666015625, 0.921875, 1.177734375, 1.43359375, 1.689453125, 1.9453125, 2.201171875, 2.45703125, 2.712890625, 2.96875, 3.224609375, 3.48046875, 3.736328125, 3.9921875, 4.248046875, 4.50390625, 4.759765625, 5.015625, 5.271484375, 5.52734375, 5.783203125, 6.0390625, 6.294921875, 6.55078125, 6.806640625, 7.0625, 7.318359375, 7.57421875, 7.830078125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 6.0, 8.0, 7.0, 8.0, 12.0, 16.0, 13.0, 15.0, 11.0, 18.0, 22.0, 16.0, 29.0, 32.0, 41.0, 32.0, 42.0, 51.0, 42.0, 30.0, 41.0, 38.0, 40.0, 49.0, 34.0, 38.0, 37.0, 29.0, 27.0, 32.0, 32.0, 12.0, 14.0, 17.0, 17.0, 11.0, 16.0, 14.0, 6.0, 8.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.14453125, -6.89788818359375, -6.6512451171875, -6.40460205078125, -6.157958984375, -5.91131591796875, -5.6646728515625, -5.41802978515625, -5.17138671875, -4.92474365234375, -4.6781005859375, -4.43145751953125, -4.184814453125, -3.93817138671875, -3.6915283203125, -3.44488525390625, -3.1982421875, -2.95159912109375, -2.7049560546875, -2.45831298828125, -2.211669921875, -1.96502685546875, -1.7183837890625, -1.47174072265625, -1.22509765625, -0.97845458984375, -0.7318115234375, -0.48516845703125, -0.238525390625, 0.00811767578125, 0.2547607421875, 0.50140380859375, 0.748046875, 0.99468994140625, 1.2413330078125, 1.48797607421875, 1.734619140625, 1.98126220703125, 2.2279052734375, 2.47454833984375, 2.72119140625, 2.96783447265625, 3.2144775390625, 3.46112060546875, 3.707763671875, 3.95440673828125, 4.2010498046875, 4.44769287109375, 4.6943359375, 4.94097900390625, 5.1876220703125, 5.43426513671875, 5.680908203125, 5.92755126953125, 6.1741943359375, 6.42083740234375, 6.66748046875, 6.91412353515625, 7.1607666015625, 7.40740966796875, 7.654052734375, 7.90069580078125, 8.1473388671875, 8.39398193359375, 8.640625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 15.0, 13.0, 23.0, 31.0, 51.0, 47.0, 88.0, 135.0, 193.0, 272.0, 431.0, 625.0, 1057.0, 1512.0, 2485.0, 4049.0, 6672.0, 11366.0, 21519.0, 64316.0, 843820.0, 44243.0, 18870.0, 10463.0, 5959.0, 3735.0, 2368.0, 1402.0, 910.0, 635.0, 400.0, 252.0, 201.0, 128.0, 83.0, 47.0, 33.0, 29.0, 23.0, 25.0, 7.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.28125, -9.9908447265625, -9.700439453125, -9.4100341796875, -9.11962890625, -8.8292236328125, -8.538818359375, -8.2484130859375, -7.9580078125, -7.6676025390625, -7.377197265625, -7.0867919921875, -6.79638671875, -6.5059814453125, -6.215576171875, -5.9251708984375, -5.634765625, -5.3443603515625, -5.053955078125, -4.7635498046875, -4.47314453125, -4.1827392578125, -3.892333984375, -3.6019287109375, -3.3115234375, -3.0211181640625, -2.730712890625, -2.4403076171875, -2.14990234375, -1.8594970703125, -1.569091796875, -1.2786865234375, -0.98828125, -0.6978759765625, -0.407470703125, -0.1170654296875, 0.17333984375, 0.4637451171875, 0.754150390625, 1.0445556640625, 1.3349609375, 1.6253662109375, 1.915771484375, 2.2061767578125, 2.49658203125, 2.7869873046875, 3.077392578125, 3.3677978515625, 3.658203125, 3.9486083984375, 4.239013671875, 4.5294189453125, 4.81982421875, 5.1102294921875, 5.400634765625, 5.6910400390625, 5.9814453125, 6.2718505859375, 6.562255859375, 6.8526611328125, 7.14306640625, 7.4334716796875, 7.723876953125, 8.0142822265625, 8.3046875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 6.0, 5.0, 11.0, 8.0, 19.0, 13.0, 14.0, 22.0, 20.0, 17.0, 29.0, 36.0, 24.0, 31.0, 43.0, 36.0, 31.0, 50.0, 34.0, 42.0, 39.0, 43.0, 36.0, 41.0, 40.0, 34.0, 33.0, 22.0, 28.0, 24.0, 24.0, 19.0, 22.0, 10.0, 12.0, 14.0, 8.0, 6.0, 8.0, 12.0, 4.0, 4.0, 10.0, 2.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.78448486328125, -5.5845947265625, -5.38470458984375, -5.184814453125, -4.98492431640625, -4.7850341796875, -4.58514404296875, -4.38525390625, -4.18536376953125, -3.9854736328125, -3.78558349609375, -3.585693359375, -3.38580322265625, -3.1859130859375, -2.98602294921875, -2.7861328125, -2.58624267578125, -2.3863525390625, -2.18646240234375, -1.986572265625, -1.78668212890625, -1.5867919921875, -1.38690185546875, -1.18701171875, -0.98712158203125, -0.7872314453125, -0.58734130859375, -0.387451171875, -0.18756103515625, 0.0123291015625, 0.21221923828125, 0.412109375, 0.61199951171875, 0.8118896484375, 1.01177978515625, 1.211669921875, 1.41156005859375, 1.6114501953125, 1.81134033203125, 2.01123046875, 2.21112060546875, 2.4110107421875, 2.61090087890625, 2.810791015625, 3.01068115234375, 3.2105712890625, 3.41046142578125, 3.6103515625, 3.81024169921875, 4.0101318359375, 4.21002197265625, 4.409912109375, 4.60980224609375, 4.8096923828125, 5.00958251953125, 5.20947265625, 5.40936279296875, 5.6092529296875, 5.80914306640625, 6.009033203125, 6.20892333984375, 6.4088134765625, 6.60870361328125, 6.80859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 5.0, 9.0, 7.0, 11.0, 25.0, 29.0, 41.0, 59.0, 104.0, 144.0, 219.0, 329.0, 557.0, 896.0, 1604.0, 2985.0, 5978.0, 13948.0, 44478.0, 903255.0, 45795.0, 14525.0, 6409.0, 3140.0, 1557.0, 979.0, 506.0, 354.0, 190.0, 130.0, 87.0, 63.0, 27.0, 30.0, 17.0, 13.0, 12.0, 9.0, 7.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.546875, -6.32501220703125, -6.1031494140625, -5.88128662109375, -5.659423828125, -5.43756103515625, -5.2156982421875, -4.99383544921875, -4.77197265625, -4.55010986328125, -4.3282470703125, -4.10638427734375, -3.884521484375, -3.66265869140625, -3.4407958984375, -3.21893310546875, -2.9970703125, -2.77520751953125, -2.5533447265625, -2.33148193359375, -2.109619140625, -1.88775634765625, -1.6658935546875, -1.44403076171875, -1.22216796875, -1.00030517578125, -0.7784423828125, -0.55657958984375, -0.334716796875, -0.11285400390625, 0.1090087890625, 0.33087158203125, 0.552734375, 0.77459716796875, 0.9964599609375, 1.21832275390625, 1.440185546875, 1.66204833984375, 1.8839111328125, 2.10577392578125, 2.32763671875, 2.54949951171875, 2.7713623046875, 2.99322509765625, 3.215087890625, 3.43695068359375, 3.6588134765625, 3.88067626953125, 4.1025390625, 4.32440185546875, 4.5462646484375, 4.76812744140625, 4.989990234375, 5.21185302734375, 5.4337158203125, 5.65557861328125, 5.87744140625, 6.09930419921875, 6.3211669921875, 6.54302978515625, 6.764892578125, 6.98675537109375, 7.2086181640625, 7.43048095703125, 7.65234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 8.0, 10.0, 10.0, 21.0, 23.0, 26.0, 55.0, 69.0, 85.0, 126.0, 132.0, 115.0, 81.0, 60.0, 45.0, 16.0, 21.0, 19.0, 8.0, 15.0, 15.0, 5.0, 5.0, 6.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005664825439453125, -0.0005449503660202026, -0.0005234181880950928, -0.0005018860101699829, -0.00048035383224487305, -0.0004588216543197632, -0.0004372894763946533, -0.00041575729846954346, -0.0003942251205444336, -0.00037269294261932373, -0.00035116076469421387, -0.000329628586769104, -0.00030809640884399414, -0.0002865642309188843, -0.0002650320529937744, -0.00024349987506866455, -0.0002219676971435547, -0.00020043551921844482, -0.00017890334129333496, -0.0001573711633682251, -0.00013583898544311523, -0.00011430680751800537, -9.277462959289551e-05, -7.124245166778564e-05, -4.971027374267578e-05, -2.8178095817565918e-05, -6.645917892456055e-06, 1.4886260032653809e-05, 3.641843795776367e-05, 5.7950615882873535e-05, 7.94827938079834e-05, 0.00010101497173309326, 0.00012254714965820312, 0.000144079327583313, 0.00016561150550842285, 0.00018714368343353271, 0.00020867586135864258, 0.00023020803928375244, 0.0002517402172088623, 0.00027327239513397217, 0.00029480457305908203, 0.0003163367509841919, 0.00033786892890930176, 0.0003594011068344116, 0.0003809332847595215, 0.00040246546268463135, 0.0004239976406097412, 0.0004455298185348511, 0.00046706199645996094, 0.0004885941743850708, 0.0005101263523101807, 0.0005316585302352905, 0.0005531907081604004, 0.0005747228860855103, 0.0005962550640106201, 0.00061778724193573, 0.0006393194198608398, 0.0006608515977859497, 0.0006823837757110596, 0.0007039159536361694, 0.0007254481315612793, 0.0007469803094863892, 0.000768512487411499, 0.0007900446653366089, 0.0008115768432617188]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 11.0, 22.0, 33.0, 47.0, 59.0, 78.0, 105.0, 199.0, 286.0, 400.0, 640.0, 1040.0, 1559.0, 2497.0, 3764.0, 6036.0, 9585.0, 15677.0, 26419.0, 45234.0, 80064.0, 139462.0, 212095.0, 201431.0, 126590.0, 71734.0, 40948.0, 23863.0, 14519.0, 8981.0, 5420.0, 3468.0, 2239.0, 1375.0, 894.0, 583.0, 411.0, 252.0, 181.0, 118.0, 81.0, 43.0, 35.0, 32.0, 13.0, 9.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.9306640625, -1.8719940185546875, -1.813323974609375, -1.7546539306640625, -1.69598388671875, -1.6373138427734375, -1.578643798828125, -1.5199737548828125, -1.4613037109375, -1.4026336669921875, -1.343963623046875, -1.2852935791015625, -1.22662353515625, -1.1679534912109375, -1.109283447265625, -1.0506134033203125, -0.991943359375, -0.9332733154296875, -0.874603271484375, -0.8159332275390625, -0.75726318359375, -0.6985931396484375, -0.639923095703125, -0.5812530517578125, -0.5225830078125, -0.4639129638671875, -0.405242919921875, -0.3465728759765625, -0.28790283203125, -0.2292327880859375, -0.170562744140625, -0.1118927001953125, -0.05322265625, 0.0054473876953125, 0.064117431640625, 0.1227874755859375, 0.18145751953125, 0.2401275634765625, 0.298797607421875, 0.3574676513671875, 0.4161376953125, 0.4748077392578125, 0.533477783203125, 0.5921478271484375, 0.65081787109375, 0.7094879150390625, 0.768157958984375, 0.8268280029296875, 0.885498046875, 0.9441680908203125, 1.002838134765625, 1.0615081787109375, 1.12017822265625, 1.1788482666015625, 1.237518310546875, 1.2961883544921875, 1.3548583984375, 1.4135284423828125, 1.472198486328125, 1.5308685302734375, 1.58953857421875, 1.6482086181640625, 1.706878662109375, 1.7655487060546875, 1.82421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 6.0, 10.0, 12.0, 7.0, 18.0, 26.0, 20.0, 12.0, 28.0, 25.0, 31.0, 30.0, 43.0, 35.0, 53.0, 46.0, 51.0, 51.0, 63.0, 54.0, 43.0, 42.0, 36.0, 32.0, 32.0, 25.0, 22.0, 26.0, 19.0, 18.0, 13.0, 9.0, 8.0, 12.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.563812255859375, -0.54754638671875, -0.531280517578125, -0.5150146484375, -0.498748779296875, -0.48248291015625, -0.466217041015625, -0.449951171875, -0.433685302734375, -0.41741943359375, -0.401153564453125, -0.3848876953125, -0.368621826171875, -0.35235595703125, -0.336090087890625, -0.31982421875, -0.303558349609375, -0.28729248046875, -0.271026611328125, -0.2547607421875, -0.238494873046875, -0.22222900390625, -0.205963134765625, -0.189697265625, -0.173431396484375, -0.15716552734375, -0.140899658203125, -0.1246337890625, -0.108367919921875, -0.09210205078125, -0.075836181640625, -0.0595703125, -0.043304443359375, -0.02703857421875, -0.010772705078125, 0.0054931640625, 0.021759033203125, 0.03802490234375, 0.054290771484375, 0.070556640625, 0.086822509765625, 0.10308837890625, 0.119354248046875, 0.1356201171875, 0.151885986328125, 0.16815185546875, 0.184417724609375, 0.20068359375, 0.216949462890625, 0.23321533203125, 0.249481201171875, 0.2657470703125, 0.282012939453125, 0.29827880859375, 0.314544677734375, 0.330810546875, 0.347076416015625, 0.36334228515625, 0.379608154296875, 0.3958740234375, 0.412139892578125, 0.42840576171875, 0.444671630859375, 0.4609375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 8.0, 5.0, 12.0, 13.0, 12.0, 21.0, 10.0, 31.0, 21.0, 24.0, 18.0, 37.0, 40.0, 48.0, 42.0, 48.0, 46.0, 54.0, 44.0, 51.0, 37.0, 47.0, 52.0, 50.0, 32.0, 32.0, 34.0, 16.0, 10.0, 15.0, 13.0, 17.0, 11.0, 6.0, 6.0, 6.0, 4.0, 7.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-10.060894012451172, -9.771018028259277, -9.4811429977417, -9.191267013549805, -8.901391983032227, -8.611515998840332, -8.321640968322754, -8.03176498413086, -7.741889476776123, -7.452013969421387, -7.16213846206665, -6.872262954711914, -6.5823869705200195, -6.292511940002441, -6.002635955810547, -5.7127604484558105, -5.422884941101074, -5.133009433746338, -4.843133926391602, -4.553258419036865, -4.263382911682129, -3.9735071659088135, -3.683631420135498, -3.3937559127807617, -3.1038804054260254, -2.814004898071289, -2.5241293907165527, -2.2342536449432373, -1.944378137588501, -1.6545026302337646, -1.3646270036697388, -1.074751377105713, -0.7848758697509766, -0.49500030279159546, -0.20512473583221436, 0.08475083112716675, 0.37462639808654785, 0.6645019054412842, 0.9543775320053101, 1.244253158569336, 1.5341286659240723, 1.8240041732788086, 2.113879680633545, 2.4037554264068604, 2.6936309337615967, 2.983506441116333, 3.2733821868896484, 3.5632576942443848, 3.853133201599121, 4.143008708953857, 4.432884216308594, 4.72275972366333, 5.012635231018066, 5.302511215209961, 5.592386722564697, 5.882262229919434, 6.17213773727417, 6.462013244628906, 6.751888751983643, 7.041764259338379, 7.331640243530273, 7.621515274047852, 7.911391258239746, 8.20126724243164, 8.491142272949219]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 8.0, 14.0, 5.0, 16.0, 9.0, 13.0, 17.0, 24.0, 22.0, 26.0, 30.0, 45.0, 37.0, 38.0, 46.0, 38.0, 40.0, 50.0, 43.0, 43.0, 49.0, 35.0, 33.0, 39.0, 35.0, 34.0, 31.0, 18.0, 22.0, 19.0, 26.0, 12.0, 11.0, 13.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.855771541595459, -7.594684600830078, -7.3335981369018555, -7.072511196136475, -6.811424255371094, -6.550337791442871, -6.28925085067749, -6.028163909912109, -5.767077445983887, -5.505990505218506, -5.244904041290283, -4.983817100524902, -4.72273063659668, -4.461643695831299, -4.200556755065918, -3.939470052719116, -3.6783833503723145, -3.4172966480255127, -3.156209945678711, -2.89512300491333, -2.6340363025665283, -2.3729496002197266, -2.1118626594543457, -1.850775957107544, -1.5896892547607422, -1.3286025524139404, -1.0675157308578491, -0.8064289689064026, -0.545342206954956, -0.2842555046081543, -0.02316868305206299, 0.23791813850402832, 0.4990043640136719, 0.7600911259651184, 1.021177887916565, 1.2822647094726562, 1.543351411819458, 1.8044381141662598, 2.0655250549316406, 2.3266117572784424, 2.587698459625244, 2.848785161972046, 3.1098718643188477, 3.3709588050842285, 3.6320455074310303, 3.893132209777832, 4.154219150543213, 4.415306091308594, 4.676392555236816, 4.937479496002197, 5.19856595993042, 5.459652900695801, 5.720739364624023, 5.981826305389404, 6.242913246154785, 6.503999710083008, 6.765086650848389, 7.0261735916137695, 7.287260055541992, 7.548346996307373, 7.809433937072754, 8.070520401000977, 8.3316068649292, 8.592694282531738, 8.853780746459961]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 11.0, 11.0, 22.0, 31.0, 54.0, 83.0, 137.0, 178.0, 315.0, 464.0, 862.0, 1225.0, 1957.0, 3137.0, 4978.0, 7774.0, 12057.0, 18977.0, 29103.0, 43546.0, 63881.0, 88546.0, 113429.0, 129365.0, 129841.0, 114158.0, 90403.0, 65683.0, 44813.0, 29899.0, 19306.0, 12518.0, 8036.0, 5036.0, 3167.0, 2001.0, 1315.0, 780.0, 529.0, 329.0, 242.0, 140.0, 75.0, 41.0, 36.0, 22.0, 15.0, 12.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-9.7421875, -9.4559326171875, -9.169677734375, -8.8834228515625, -8.59716796875, -8.3109130859375, -8.024658203125, -7.7384033203125, -7.4521484375, -7.1658935546875, -6.879638671875, -6.5933837890625, -6.30712890625, -6.0208740234375, -5.734619140625, -5.4483642578125, -5.162109375, -4.8758544921875, -4.589599609375, -4.3033447265625, -4.01708984375, -3.7308349609375, -3.444580078125, -3.1583251953125, -2.8720703125, -2.5858154296875, -2.299560546875, -2.0133056640625, -1.72705078125, -1.4407958984375, -1.154541015625, -0.8682861328125, -0.58203125, -0.2957763671875, -0.009521484375, 0.2767333984375, 0.56298828125, 0.8492431640625, 1.135498046875, 1.4217529296875, 1.7080078125, 1.9942626953125, 2.280517578125, 2.5667724609375, 2.85302734375, 3.1392822265625, 3.425537109375, 3.7117919921875, 3.998046875, 4.2843017578125, 4.570556640625, 4.8568115234375, 5.14306640625, 5.4293212890625, 5.715576171875, 6.0018310546875, 6.2880859375, 6.5743408203125, 6.860595703125, 7.1468505859375, 7.43310546875, 7.7193603515625, 8.005615234375, 8.2918701171875, 8.578125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 5.0, 5.0, 10.0, 6.0, 15.0, 13.0, 13.0, 10.0, 12.0, 16.0, 23.0, 25.0, 13.0, 27.0, 38.0, 40.0, 30.0, 41.0, 33.0, 37.0, 41.0, 43.0, 44.0, 39.0, 37.0, 27.0, 37.0, 34.0, 25.0, 33.0, 32.0, 31.0, 28.0, 10.0, 16.0, 7.0, 16.0, 15.0, 15.0, 11.0, 12.0, 8.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-7.0625, -6.8468017578125, -6.631103515625, -6.4154052734375, -6.19970703125, -5.9840087890625, -5.768310546875, -5.5526123046875, -5.3369140625, -5.1212158203125, -4.905517578125, -4.6898193359375, -4.47412109375, -4.2584228515625, -4.042724609375, -3.8270263671875, -3.611328125, -3.3956298828125, -3.179931640625, -2.9642333984375, -2.74853515625, -2.5328369140625, -2.317138671875, -2.1014404296875, -1.8857421875, -1.6700439453125, -1.454345703125, -1.2386474609375, -1.02294921875, -0.8072509765625, -0.591552734375, -0.3758544921875, -0.16015625, 0.0555419921875, 0.271240234375, 0.4869384765625, 0.70263671875, 0.9183349609375, 1.134033203125, 1.3497314453125, 1.5654296875, 1.7811279296875, 1.996826171875, 2.2125244140625, 2.42822265625, 2.6439208984375, 2.859619140625, 3.0753173828125, 3.291015625, 3.5067138671875, 3.722412109375, 3.9381103515625, 4.15380859375, 4.3695068359375, 4.585205078125, 4.8009033203125, 5.0166015625, 5.2322998046875, 5.447998046875, 5.6636962890625, 5.87939453125, 6.0950927734375, 6.310791015625, 6.5264892578125, 6.7421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 17.0, 27.0, 34.0, 53.0, 75.0, 135.0, 196.0, 294.0, 426.0, 610.0, 961.0, 1530.0, 2176.0, 3489.0, 4966.0, 7708.0, 11825.0, 17313.0, 25558.0, 36354.0, 50381.0, 68076.0, 87439.0, 104432.0, 113779.0, 112589.0, 100717.0, 82802.0, 63753.0, 46737.0, 33383.0, 23103.0, 15772.0, 10533.0, 7175.0, 4839.0, 3165.0, 2170.0, 1403.0, 858.0, 580.0, 368.0, 252.0, 182.0, 116.0, 67.0, 42.0, 37.0, 21.0, 9.0, 9.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.08203125, -6.85272216796875, -6.6234130859375, -6.39410400390625, -6.164794921875, -5.93548583984375, -5.7061767578125, -5.47686767578125, -5.24755859375, -5.01824951171875, -4.7889404296875, -4.55963134765625, -4.330322265625, -4.10101318359375, -3.8717041015625, -3.64239501953125, -3.4130859375, -3.18377685546875, -2.9544677734375, -2.72515869140625, -2.495849609375, -2.26654052734375, -2.0372314453125, -1.80792236328125, -1.57861328125, -1.34930419921875, -1.1199951171875, -0.89068603515625, -0.661376953125, -0.43206787109375, -0.2027587890625, 0.02655029296875, 0.255859375, 0.48516845703125, 0.7144775390625, 0.94378662109375, 1.173095703125, 1.40240478515625, 1.6317138671875, 1.86102294921875, 2.09033203125, 2.31964111328125, 2.5489501953125, 2.77825927734375, 3.007568359375, 3.23687744140625, 3.4661865234375, 3.69549560546875, 3.9248046875, 4.15411376953125, 4.3834228515625, 4.61273193359375, 4.842041015625, 5.07135009765625, 5.3006591796875, 5.52996826171875, 5.75927734375, 5.98858642578125, 6.2178955078125, 6.44720458984375, 6.676513671875, 6.90582275390625, 7.1351318359375, 7.36444091796875, 7.59375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 9.0, 9.0, 4.0, 11.0, 19.0, 8.0, 11.0, 25.0, 26.0, 30.0, 33.0, 29.0, 42.0, 28.0, 39.0, 38.0, 32.0, 36.0, 38.0, 43.0, 53.0, 47.0, 38.0, 52.0, 37.0, 40.0, 28.0, 23.0, 23.0, 22.0, 21.0, 18.0, 17.0, 17.0, 12.0, 17.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.68511962890625, -4.5225830078125, -4.36004638671875, -4.197509765625, -4.03497314453125, -3.8724365234375, -3.70989990234375, -3.54736328125, -3.38482666015625, -3.2222900390625, -3.05975341796875, -2.897216796875, -2.73468017578125, -2.5721435546875, -2.40960693359375, -2.2470703125, -2.08453369140625, -1.9219970703125, -1.75946044921875, -1.596923828125, -1.43438720703125, -1.2718505859375, -1.10931396484375, -0.94677734375, -0.78424072265625, -0.6217041015625, -0.45916748046875, -0.296630859375, -0.13409423828125, 0.0284423828125, 0.19097900390625, 0.353515625, 0.51605224609375, 0.6785888671875, 0.84112548828125, 1.003662109375, 1.16619873046875, 1.3287353515625, 1.49127197265625, 1.65380859375, 1.81634521484375, 1.9788818359375, 2.14141845703125, 2.303955078125, 2.46649169921875, 2.6290283203125, 2.79156494140625, 2.9541015625, 3.11663818359375, 3.2791748046875, 3.44171142578125, 3.604248046875, 3.76678466796875, 3.9293212890625, 4.09185791015625, 4.25439453125, 4.41693115234375, 4.5794677734375, 4.74200439453125, 4.904541015625, 5.06707763671875, 5.2296142578125, 5.39215087890625, 5.5546875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 16.0, 18.0, 25.0, 38.0, 62.0, 68.0, 122.0, 173.0, 294.0, 509.0, 783.0, 1303.0, 2260.0, 3947.0, 7121.0, 13454.0, 26432.0, 54661.0, 124783.0, 268067.0, 283316.0, 139514.0, 60150.0, 28810.0, 14613.0, 7825.0, 4260.0, 2395.0, 1325.0, 852.0, 503.0, 296.0, 190.0, 134.0, 78.0, 51.0, 34.0, 26.0, 21.0, 9.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.807373046875, -11.42724609375, -11.047119140625, -10.6669921875, -10.286865234375, -9.90673828125, -9.526611328125, -9.146484375, -8.766357421875, -8.38623046875, -8.006103515625, -7.6259765625, -7.245849609375, -6.86572265625, -6.485595703125, -6.10546875, -5.725341796875, -5.34521484375, -4.965087890625, -4.5849609375, -4.204833984375, -3.82470703125, -3.444580078125, -3.064453125, -2.684326171875, -2.30419921875, -1.924072265625, -1.5439453125, -1.163818359375, -0.78369140625, -0.403564453125, -0.0234375, 0.356689453125, 0.73681640625, 1.116943359375, 1.4970703125, 1.877197265625, 2.25732421875, 2.637451171875, 3.017578125, 3.397705078125, 3.77783203125, 4.157958984375, 4.5380859375, 4.918212890625, 5.29833984375, 5.678466796875, 6.05859375, 6.438720703125, 6.81884765625, 7.198974609375, 7.5791015625, 7.959228515625, 8.33935546875, 8.719482421875, 9.099609375, 9.479736328125, 9.85986328125, 10.239990234375, 10.6201171875, 11.000244140625, 11.38037109375, 11.760498046875, 12.140625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 1.0, 9.0, 10.0, 13.0, 14.0, 14.0, 20.0, 22.0, 17.0, 26.0, 35.0, 48.0, 53.0, 65.0, 71.0, 79.0, 78.0, 75.0, 60.0, 51.0, 43.0, 42.0, 32.0, 24.0, 18.0, 12.0, 7.0, 10.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008878707885742188, -0.0008592531085014343, -0.0008306354284286499, -0.0008020177483558655, -0.0007734000682830811, -0.0007447823882102966, -0.0007161647081375122, -0.0006875470280647278, -0.0006589293479919434, -0.0006303116679191589, -0.0006016939878463745, -0.0005730763077735901, -0.0005444586277008057, -0.0005158409476280212, -0.0004872232675552368, -0.0004586055874824524, -0.00042998790740966797, -0.00040137022733688354, -0.0003727525472640991, -0.0003441348671913147, -0.0003155171871185303, -0.00028689950704574585, -0.0002582818269729614, -0.000229664146900177, -0.00020104646682739258, -0.00017242878675460815, -0.00014381110668182373, -0.0001151934266090393, -8.657574653625488e-05, -5.795806646347046e-05, -2.9340386390686035e-05, -7.227063179016113e-07, 2.7894973754882812e-05, 5.6512653827667236e-05, 8.513033390045166e-05, 0.00011374801397323608, 0.0001423656940460205, 0.00017098337411880493, 0.00019960105419158936, 0.00022821873426437378, 0.0002568364143371582, 0.0002854540944099426, 0.00031407177448272705, 0.0003426894545555115, 0.0003713071346282959, 0.0003999248147010803, 0.00042854249477386475, 0.00045716017484664917, 0.0004857778549194336, 0.000514395534992218, 0.0005430132150650024, 0.0005716308951377869, 0.0006002485752105713, 0.0006288662552833557, 0.0006574839353561401, 0.0006861016154289246, 0.000714719295501709, 0.0007433369755744934, 0.0007719546556472778, 0.0008005723357200623, 0.0008291900157928467, 0.0008578076958656311, 0.0008864253759384155, 0.0009150430560112, 0.0009436607360839844]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 1.0, 10.0, 11.0, 21.0, 32.0, 40.0, 52.0, 75.0, 115.0, 192.0, 240.0, 379.0, 554.0, 797.0, 1303.0, 2050.0, 3091.0, 4856.0, 7722.0, 12611.0, 20275.0, 33985.0, 57398.0, 96471.0, 152021.0, 190058.0, 171335.0, 116294.0, 70379.0, 41409.0, 24411.0, 14709.0, 9266.0, 5786.0, 3638.0, 2368.0, 1565.0, 945.0, 656.0, 463.0, 325.0, 191.0, 139.0, 105.0, 63.0, 45.0, 28.0, 23.0, 15.0, 9.0, 16.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.55859375, -6.35162353515625, -6.1446533203125, -5.93768310546875, -5.730712890625, -5.52374267578125, -5.3167724609375, -5.10980224609375, -4.90283203125, -4.69586181640625, -4.4888916015625, -4.28192138671875, -4.074951171875, -3.86798095703125, -3.6610107421875, -3.45404052734375, -3.2470703125, -3.04010009765625, -2.8331298828125, -2.62615966796875, -2.419189453125, -2.21221923828125, -2.0052490234375, -1.79827880859375, -1.59130859375, -1.38433837890625, -1.1773681640625, -0.97039794921875, -0.763427734375, -0.55645751953125, -0.3494873046875, -0.14251708984375, 0.064453125, 0.27142333984375, 0.4783935546875, 0.68536376953125, 0.892333984375, 1.09930419921875, 1.3062744140625, 1.51324462890625, 1.72021484375, 1.92718505859375, 2.1341552734375, 2.34112548828125, 2.548095703125, 2.75506591796875, 2.9620361328125, 3.16900634765625, 3.3759765625, 3.58294677734375, 3.7899169921875, 3.99688720703125, 4.203857421875, 4.41082763671875, 4.6177978515625, 4.82476806640625, 5.03173828125, 5.23870849609375, 5.4456787109375, 5.65264892578125, 5.859619140625, 6.06658935546875, 6.2735595703125, 6.48052978515625, 6.6875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 8.0, 8.0, 9.0, 18.0, 30.0, 29.0, 35.0, 55.0, 50.0, 97.0, 94.0, 89.0, 78.0, 92.0, 55.0, 56.0, 49.0, 23.0, 30.0, 18.0, 11.0, 18.0, 7.0, 3.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.585357666015625, -3.47540283203125, -3.365447998046875, -3.2554931640625, -3.145538330078125, -3.03558349609375, -2.925628662109375, -2.815673828125, -2.705718994140625, -2.59576416015625, -2.485809326171875, -2.3758544921875, -2.265899658203125, -2.15594482421875, -2.045989990234375, -1.93603515625, -1.826080322265625, -1.71612548828125, -1.606170654296875, -1.4962158203125, -1.386260986328125, -1.27630615234375, -1.166351318359375, -1.056396484375, -0.946441650390625, -0.83648681640625, -0.726531982421875, -0.6165771484375, -0.506622314453125, -0.39666748046875, -0.286712646484375, -0.1767578125, -0.066802978515625, 0.04315185546875, 0.153106689453125, 0.2630615234375, 0.373016357421875, 0.48297119140625, 0.592926025390625, 0.702880859375, 0.812835693359375, 0.92279052734375, 1.032745361328125, 1.1427001953125, 1.252655029296875, 1.36260986328125, 1.472564697265625, 1.58251953125, 1.692474365234375, 1.80242919921875, 1.912384033203125, 2.0223388671875, 2.132293701171875, 2.24224853515625, 2.352203369140625, 2.462158203125, 2.572113037109375, 2.68206787109375, 2.792022705078125, 2.9019775390625, 3.011932373046875, 3.12188720703125, 3.231842041015625, 3.341796875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 8.0, 3.0, 6.0, 9.0, 11.0, 13.0, 12.0, 16.0, 23.0, 25.0, 25.0, 33.0, 35.0, 37.0, 47.0, 39.0, 44.0, 50.0, 63.0, 57.0, 58.0, 55.0, 37.0, 37.0, 31.0, 39.0, 37.0, 29.0, 19.0, 17.0, 21.0, 13.0, 14.0, 6.0, 5.0, 7.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-10.720756530761719, -10.420270919799805, -10.119786262512207, -9.819300651550293, -9.518815994262695, -9.218330383300781, -8.917844772338867, -8.617359161376953, -8.316874504089355, -8.016388893127441, -7.715904235839844, -7.41541862487793, -7.114933490753174, -6.814448356628418, -6.513962745666504, -6.213477611541748, -5.912992477416992, -5.612507343292236, -5.3120222091674805, -5.011536598205566, -4.7110514640808105, -4.410566329956055, -4.110080718994141, -3.8095955848693848, -3.509110450744629, -3.208625316619873, -2.908139944076538, -2.607654571533203, -2.3071694374084473, -2.0066843032836914, -1.7061989307403564, -1.4057135581970215, -1.105229377746582, -0.8047441244125366, -0.5042588710784912, -0.2037736177444458, 0.09671163558959961, 0.397196888923645, 0.6976821422576904, 0.9981675148010254, 1.2986526489257812, 1.5991379022598267, 1.899623155593872, 2.200108528137207, 2.500593662261963, 2.8010787963867188, 3.1015641689300537, 3.4020495414733887, 3.7025346755981445, 4.0030198097229, 4.303504943847656, 4.60399055480957, 4.904475688934326, 5.204960823059082, 5.505446434020996, 5.805931568145752, 6.106416702270508, 6.406901836395264, 6.7073869705200195, 7.007872581481934, 7.3083577156066895, 7.608842849731445, 7.909328460693359, 8.209814071655273, 8.510298728942871]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 11.0, 12.0, 9.0, 12.0, 11.0, 15.0, 13.0, 16.0, 15.0, 21.0, 24.0, 25.0, 36.0, 38.0, 29.0, 48.0, 34.0, 41.0, 42.0, 28.0, 35.0, 52.0, 39.0, 26.0, 33.0, 33.0, 36.0, 26.0, 26.0, 25.0, 27.0, 18.0, 12.0, 23.0, 10.0, 16.0, 16.0, 10.0, 7.0, 10.0, 5.0, 7.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-7.543928146362305, -7.321154594421387, -7.098381042480469, -6.875607490539551, -6.652833938598633, -6.430060386657715, -6.207286834716797, -5.984513759613037, -5.761740207672119, -5.538966655731201, -5.316193103790283, -5.093419551849365, -4.870645999908447, -4.6478729248046875, -4.4250993728637695, -4.202325820922852, -3.9795520305633545, -3.7567784786224365, -3.5340049266815186, -3.3112316131591797, -3.0884580612182617, -2.8656845092773438, -2.642910957336426, -2.420137405395508, -2.19736385345459, -1.9745903015136719, -1.7518168687820435, -1.5290433168411255, -1.306269884109497, -1.083496332168579, -0.8607227802276611, -0.6379493474960327, -0.4151759147644043, -0.1924024075269699, 0.030371099710464478, 0.25314462184906006, 0.47591811418533325, 0.6986916065216064, 0.9214651584625244, 1.1442385911941528, 1.3670121431350708, 1.5897856950759888, 1.8125591278076172, 2.035332679748535, 2.258106231689453, 2.480879783630371, 2.703653335571289, 2.926426649093628, 3.149200201034546, 3.371973752975464, 3.594747304916382, 3.8175206184387207, 4.040294170379639, 4.263067722320557, 4.485841274261475, 4.708614826202393, 4.9313883781433105, 5.1541619300842285, 5.3769354820251465, 5.5997090339660645, 5.822482585906982, 6.045255661010742, 6.26802921295166, 6.490802764892578, 6.713576316833496]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 9.0, 17.0, 31.0, 32.0, 56.0, 78.0, 109.0, 168.0, 303.0, 417.0, 651.0, 1078.0, 1719.0, 2944.0, 4770.0, 8296.0, 14328.0, 25254.0, 45626.0, 86464.0, 166599.0, 331000.0, 614813.0, 894592.0, 850681.0, 545320.0, 283812.0, 144057.0, 75290.0, 40789.0, 22880.0, 12857.0, 7482.0, 4476.0, 2689.0, 1700.0, 1025.0, 644.0, 400.0, 266.0, 204.0, 113.0, 93.0, 50.0, 27.0, 27.0, 23.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.3515625, -7.11358642578125, -6.8756103515625, -6.63763427734375, -6.399658203125, -6.16168212890625, -5.9237060546875, -5.68572998046875, -5.44775390625, -5.20977783203125, -4.9718017578125, -4.73382568359375, -4.495849609375, -4.25787353515625, -4.0198974609375, -3.78192138671875, -3.5439453125, -3.30596923828125, -3.0679931640625, -2.83001708984375, -2.592041015625, -2.35406494140625, -2.1160888671875, -1.87811279296875, -1.64013671875, -1.40216064453125, -1.1641845703125, -0.92620849609375, -0.688232421875, -0.45025634765625, -0.2122802734375, 0.02569580078125, 0.263671875, 0.50164794921875, 0.7396240234375, 0.97760009765625, 1.215576171875, 1.45355224609375, 1.6915283203125, 1.92950439453125, 2.16748046875, 2.40545654296875, 2.6434326171875, 2.88140869140625, 3.119384765625, 3.35736083984375, 3.5953369140625, 3.83331298828125, 4.0712890625, 4.30926513671875, 4.5472412109375, 4.78521728515625, 5.023193359375, 5.26116943359375, 5.4991455078125, 5.73712158203125, 5.97509765625, 6.21307373046875, 6.4510498046875, 6.68902587890625, 6.927001953125, 7.16497802734375, 7.4029541015625, 7.64093017578125, 7.87890625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 10.0, 5.0, 11.0, 15.0, 15.0, 8.0, 18.0, 14.0, 25.0, 19.0, 27.0, 23.0, 24.0, 41.0, 52.0, 33.0, 36.0, 53.0, 42.0, 48.0, 46.0, 33.0, 29.0, 34.0, 33.0, 36.0, 27.0, 22.0, 32.0, 24.0, 22.0, 20.0, 20.0, 17.0, 17.0, 15.0, 6.0, 9.0, 6.0, 5.0, 3.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.4296875, -5.2633056640625, -5.096923828125, -4.9305419921875, -4.76416015625, -4.5977783203125, -4.431396484375, -4.2650146484375, -4.0986328125, -3.9322509765625, -3.765869140625, -3.5994873046875, -3.43310546875, -3.2667236328125, -3.100341796875, -2.9339599609375, -2.767578125, -2.6011962890625, -2.434814453125, -2.2684326171875, -2.10205078125, -1.9356689453125, -1.769287109375, -1.6029052734375, -1.4365234375, -1.2701416015625, -1.103759765625, -0.9373779296875, -0.77099609375, -0.6046142578125, -0.438232421875, -0.2718505859375, -0.10546875, 0.0609130859375, 0.227294921875, 0.3936767578125, 0.56005859375, 0.7264404296875, 0.892822265625, 1.0592041015625, 1.2255859375, 1.3919677734375, 1.558349609375, 1.7247314453125, 1.89111328125, 2.0574951171875, 2.223876953125, 2.3902587890625, 2.556640625, 2.7230224609375, 2.889404296875, 3.0557861328125, 3.22216796875, 3.3885498046875, 3.554931640625, 3.7213134765625, 3.8876953125, 4.0540771484375, 4.220458984375, 4.3868408203125, 4.55322265625, 4.7196044921875, 4.885986328125, 5.0523681640625, 5.21875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 11.0, 31.0, 54.0, 78.0, 118.0, 204.0, 321.0, 506.0, 877.0, 1415.0, 2497.0, 4007.0, 6859.0, 12094.0, 21487.0, 38404.0, 70958.0, 132556.0, 245837.0, 447001.0, 730841.0, 887211.0, 687002.0, 410612.0, 225317.0, 121236.0, 65149.0, 35214.0, 19747.0, 11207.0, 6421.0, 3602.0, 2090.0, 1287.0, 805.0, 461.0, 277.0, 171.0, 98.0, 60.0, 50.0, 33.0, 21.0, 9.0, 5.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0], "bins": [-8.171875, -7.91986083984375, -7.6678466796875, -7.41583251953125, -7.163818359375, -6.91180419921875, -6.6597900390625, -6.40777587890625, -6.15576171875, -5.90374755859375, -5.6517333984375, -5.39971923828125, -5.147705078125, -4.89569091796875, -4.6436767578125, -4.39166259765625, -4.1396484375, -3.88763427734375, -3.6356201171875, -3.38360595703125, -3.131591796875, -2.87957763671875, -2.6275634765625, -2.37554931640625, -2.12353515625, -1.87152099609375, -1.6195068359375, -1.36749267578125, -1.115478515625, -0.86346435546875, -0.6114501953125, -0.35943603515625, -0.107421875, 0.14459228515625, 0.3966064453125, 0.64862060546875, 0.900634765625, 1.15264892578125, 1.4046630859375, 1.65667724609375, 1.90869140625, 2.16070556640625, 2.4127197265625, 2.66473388671875, 2.916748046875, 3.16876220703125, 3.4207763671875, 3.67279052734375, 3.9248046875, 4.17681884765625, 4.4288330078125, 4.68084716796875, 4.932861328125, 5.18487548828125, 5.4368896484375, 5.68890380859375, 5.94091796875, 6.19293212890625, 6.4449462890625, 6.69696044921875, 6.948974609375, 7.20098876953125, 7.4530029296875, 7.70501708984375, 7.95703125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 19.0, 23.0, 24.0, 39.0, 50.0, 42.0, 68.0, 81.0, 105.0, 128.0, 133.0, 173.0, 183.0, 204.0, 222.0, 251.0, 240.0, 261.0, 246.0, 210.0, 229.0, 195.0, 197.0, 153.0, 123.0, 94.0, 91.0, 63.0, 33.0, 43.0, 29.0, 27.0, 12.0, 18.0, 7.0, 11.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.365692138671875, -2.28216552734375, -2.198638916015625, -2.1151123046875, -2.031585693359375, -1.94805908203125, -1.864532470703125, -1.781005859375, -1.697479248046875, -1.61395263671875, -1.530426025390625, -1.4468994140625, -1.363372802734375, -1.27984619140625, -1.196319580078125, -1.11279296875, -1.029266357421875, -0.94573974609375, -0.862213134765625, -0.7786865234375, -0.695159912109375, -0.61163330078125, -0.528106689453125, -0.444580078125, -0.361053466796875, -0.27752685546875, -0.194000244140625, -0.1104736328125, -0.026947021484375, 0.05657958984375, 0.140106201171875, 0.2236328125, 0.307159423828125, 0.39068603515625, 0.474212646484375, 0.5577392578125, 0.641265869140625, 0.72479248046875, 0.808319091796875, 0.891845703125, 0.975372314453125, 1.05889892578125, 1.142425537109375, 1.2259521484375, 1.309478759765625, 1.39300537109375, 1.476531982421875, 1.56005859375, 1.643585205078125, 1.72711181640625, 1.810638427734375, 1.8941650390625, 1.977691650390625, 2.06121826171875, 2.144744873046875, 2.228271484375, 2.311798095703125, 2.39532470703125, 2.478851318359375, 2.5623779296875, 2.645904541015625, 2.72943115234375, 2.812957763671875, 2.896484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 8.0, 6.0, 10.0, 10.0, 13.0, 26.0, 28.0, 29.0, 50.0, 30.0, 37.0, 44.0, 69.0, 54.0, 49.0, 64.0, 58.0, 48.0, 47.0, 53.0, 55.0, 32.0, 28.0, 29.0, 26.0, 3.0, 19.0, 14.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.61583137512207, -8.329607009887695, -8.04338264465332, -7.757158279418945, -7.47093391418457, -7.184709548950195, -6.898484706878662, -6.612260341644287, -6.326035976409912, -6.039811611175537, -5.753587245941162, -5.467362880706787, -5.181138038635254, -4.894913673400879, -4.608689308166504, -4.322464942932129, -4.036240577697754, -3.750016212463379, -3.463791847229004, -3.17756724357605, -2.891342878341675, -2.6051185131073, -2.3188939094543457, -2.0326695442199707, -1.7464451789855957, -1.4602208137512207, -1.1739963293075562, -0.8877719044685364, -0.6015474796295166, -0.3153231143951416, -0.02909862995147705, 0.2571258544921875, 0.5433511734008789, 0.8295755982398987, 1.1158000230789185, 1.402024507522583, 1.688248872756958, 1.974473237991333, 2.260697841644287, 2.546922206878662, 2.833146572113037, 3.119370937347412, 3.405595302581787, 3.691819906234741, 3.978044271469116, 4.26426887512207, 4.550493240356445, 4.83671760559082, 5.122941970825195, 5.40916633605957, 5.695390701293945, 5.98161506652832, 6.267839431762695, 6.55406379699707, 6.8402886390686035, 7.1265130043029785, 7.4127373695373535, 7.6989617347717285, 7.9851861000061035, 8.271410942077637, 8.557635307312012, 8.843859672546387, 9.130084037780762, 9.416308403015137, 9.702532768249512]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 10.0, 12.0, 9.0, 10.0, 13.0, 12.0, 18.0, 25.0, 17.0, 26.0, 29.0, 30.0, 30.0, 48.0, 29.0, 34.0, 37.0, 37.0, 40.0, 44.0, 24.0, 42.0, 40.0, 32.0, 35.0, 41.0, 30.0, 32.0, 21.0, 23.0, 21.0, 22.0, 17.0, 11.0, 15.0, 13.0, 13.0, 10.0, 9.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.515998840332031, -5.333995819091797, -5.151993274688721, -4.969990253448486, -4.78798770904541, -4.605984687805176, -4.423981666564941, -4.241978645324707, -4.059976100921631, -3.8779733180999756, -3.6959705352783203, -3.513967514038086, -3.3319647312164307, -3.1499619483947754, -2.967958927154541, -2.7859561443328857, -2.6039533615112305, -2.421950578689575, -2.23994779586792, -2.0579447746276855, -1.8759419918060303, -1.693939208984375, -1.5119363069534302, -1.3299334049224854, -1.14793062210083, -0.96592777967453, -0.78392493724823, -0.6019220948219299, -0.4199192523956299, -0.23791640996932983, -0.055913567543029785, 0.12608933448791504, 0.3080916404724121, 0.49009448289871216, 0.6720973253250122, 0.8541001677513123, 1.0361030101776123, 1.2181057929992676, 1.4001086950302124, 1.5821115970611572, 1.7641143798828125, 1.9461171627044678, 2.128119945526123, 2.3101229667663574, 2.4921257495880127, 2.674128532409668, 2.8561315536499023, 3.0381343364715576, 3.220137119293213, 3.402139902114868, 3.5841426849365234, 3.766145706176758, 3.948148488998413, 4.130151271820068, 4.312154293060303, 4.494156837463379, 4.676159858703613, 4.858162879943848, 5.040165424346924, 5.222168445587158, 5.404170989990234, 5.586174011230469, 5.768177032470703, 5.9501800537109375, 6.132182598114014]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 5.0, 9.0, 11.0, 18.0, 25.0, 42.0, 50.0, 69.0, 101.0, 146.0, 222.0, 308.0, 482.0, 682.0, 978.0, 1488.0, 2288.0, 3346.0, 5112.0, 7630.0, 11771.0, 17443.0, 27202.0, 41491.0, 63116.0, 90782.0, 124535.0, 148296.0, 143223.0, 114674.0, 81227.0, 55246.0, 36433.0, 24295.0, 15561.0, 10003.0, 6655.0, 4499.0, 2857.0, 2060.0, 1370.0, 922.0, 576.0, 414.0, 280.0, 203.0, 115.0, 95.0, 67.0, 47.0, 35.0, 23.0, 22.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.3515625, -2.27532958984375, -2.1990966796875, -2.12286376953125, -2.046630859375, -1.97039794921875, -1.8941650390625, -1.81793212890625, -1.74169921875, -1.66546630859375, -1.5892333984375, -1.51300048828125, -1.436767578125, -1.36053466796875, -1.2843017578125, -1.20806884765625, -1.1318359375, -1.05560302734375, -0.9793701171875, -0.90313720703125, -0.826904296875, -0.75067138671875, -0.6744384765625, -0.59820556640625, -0.52197265625, -0.44573974609375, -0.3695068359375, -0.29327392578125, -0.217041015625, -0.14080810546875, -0.0645751953125, 0.01165771484375, 0.087890625, 0.16412353515625, 0.2403564453125, 0.31658935546875, 0.392822265625, 0.46905517578125, 0.5452880859375, 0.62152099609375, 0.69775390625, 0.77398681640625, 0.8502197265625, 0.92645263671875, 1.002685546875, 1.07891845703125, 1.1551513671875, 1.23138427734375, 1.3076171875, 1.38385009765625, 1.4600830078125, 1.53631591796875, 1.612548828125, 1.68878173828125, 1.7650146484375, 1.84124755859375, 1.91748046875, 1.99371337890625, 2.0699462890625, 2.14617919921875, 2.222412109375, 2.29864501953125, 2.3748779296875, 2.45111083984375, 2.52734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 8.0, 14.0, 14.0, 19.0, 18.0, 14.0, 25.0, 18.0, 38.0, 30.0, 41.0, 39.0, 40.0, 46.0, 37.0, 40.0, 39.0, 33.0, 42.0, 35.0, 39.0, 41.0, 36.0, 24.0, 25.0, 29.0, 27.0, 15.0, 17.0, 21.0, 10.0, 22.0, 9.0, 17.0, 8.0, 10.0, 6.0, 5.0, 10.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.1484375, -5.950439453125, -5.75244140625, -5.554443359375, -5.3564453125, -5.158447265625, -4.96044921875, -4.762451171875, -4.564453125, -4.366455078125, -4.16845703125, -3.970458984375, -3.7724609375, -3.574462890625, -3.37646484375, -3.178466796875, -2.98046875, -2.782470703125, -2.58447265625, -2.386474609375, -2.1884765625, -1.990478515625, -1.79248046875, -1.594482421875, -1.396484375, -1.198486328125, -1.00048828125, -0.802490234375, -0.6044921875, -0.406494140625, -0.20849609375, -0.010498046875, 0.1875, 0.385498046875, 0.58349609375, 0.781494140625, 0.9794921875, 1.177490234375, 1.37548828125, 1.573486328125, 1.771484375, 1.969482421875, 2.16748046875, 2.365478515625, 2.5634765625, 2.761474609375, 2.95947265625, 3.157470703125, 3.35546875, 3.553466796875, 3.75146484375, 3.949462890625, 4.1474609375, 4.345458984375, 4.54345703125, 4.741455078125, 4.939453125, 5.137451171875, 5.33544921875, 5.533447265625, 5.7314453125, 5.929443359375, 6.12744140625, 6.325439453125, 6.5234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 20.0, 24.0, 35.0, 62.0, 87.0, 123.0, 218.0, 324.0, 526.0, 832.0, 1275.0, 2083.0, 3514.0, 6024.0, 10588.0, 20403.0, 56507.0, 858412.0, 44531.0, 18681.0, 9906.0, 5435.0, 3466.0, 1990.0, 1286.0, 736.0, 505.0, 333.0, 193.0, 143.0, 94.0, 68.0, 43.0, 30.0, 15.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0], "bins": [-8.859375, -8.63470458984375, -8.4100341796875, -8.18536376953125, -7.960693359375, -7.73602294921875, -7.5113525390625, -7.28668212890625, -7.06201171875, -6.83734130859375, -6.6126708984375, -6.38800048828125, -6.163330078125, -5.93865966796875, -5.7139892578125, -5.48931884765625, -5.2646484375, -5.03997802734375, -4.8153076171875, -4.59063720703125, -4.365966796875, -4.14129638671875, -3.9166259765625, -3.69195556640625, -3.46728515625, -3.24261474609375, -3.0179443359375, -2.79327392578125, -2.568603515625, -2.34393310546875, -2.1192626953125, -1.89459228515625, -1.669921875, -1.44525146484375, -1.2205810546875, -0.99591064453125, -0.771240234375, -0.54656982421875, -0.3218994140625, -0.09722900390625, 0.12744140625, 0.35211181640625, 0.5767822265625, 0.80145263671875, 1.026123046875, 1.25079345703125, 1.4754638671875, 1.70013427734375, 1.9248046875, 2.14947509765625, 2.3741455078125, 2.59881591796875, 2.823486328125, 3.04815673828125, 3.2728271484375, 3.49749755859375, 3.72216796875, 3.94683837890625, 4.1715087890625, 4.39617919921875, 4.620849609375, 4.84552001953125, 5.0701904296875, 5.29486083984375, 5.51953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 10.0, 4.0, 11.0, 13.0, 11.0, 20.0, 18.0, 29.0, 23.0, 24.0, 30.0, 30.0, 29.0, 34.0, 30.0, 35.0, 38.0, 41.0, 41.0, 36.0, 33.0, 36.0, 50.0, 42.0, 30.0, 35.0, 44.0, 26.0, 27.0, 23.0, 18.0, 23.0, 24.0, 14.0, 17.0, 8.0, 7.0, 4.0, 14.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.69732666015625, -4.5430908203125, -4.38885498046875, -4.234619140625, -4.08038330078125, -3.9261474609375, -3.77191162109375, -3.61767578125, -3.46343994140625, -3.3092041015625, -3.15496826171875, -3.000732421875, -2.84649658203125, -2.6922607421875, -2.53802490234375, -2.3837890625, -2.22955322265625, -2.0753173828125, -1.92108154296875, -1.766845703125, -1.61260986328125, -1.4583740234375, -1.30413818359375, -1.14990234375, -0.99566650390625, -0.8414306640625, -0.68719482421875, -0.532958984375, -0.37872314453125, -0.2244873046875, -0.07025146484375, 0.083984375, 0.23822021484375, 0.3924560546875, 0.54669189453125, 0.700927734375, 0.85516357421875, 1.0093994140625, 1.16363525390625, 1.31787109375, 1.47210693359375, 1.6263427734375, 1.78057861328125, 1.934814453125, 2.08905029296875, 2.2432861328125, 2.39752197265625, 2.5517578125, 2.70599365234375, 2.8602294921875, 3.01446533203125, 3.168701171875, 3.32293701171875, 3.4771728515625, 3.63140869140625, 3.78564453125, 3.93988037109375, 4.0941162109375, 4.24835205078125, 4.402587890625, 4.55682373046875, 4.7110595703125, 4.86529541015625, 5.01953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 9.0, 14.0, 23.0, 41.0, 57.0, 100.0, 158.0, 229.0, 413.0, 720.0, 1285.0, 2416.0, 4514.0, 9502.0, 24101.0, 615508.0, 348575.0, 22511.0, 9077.0, 4207.0, 2184.0, 1217.0, 660.0, 379.0, 196.0, 113.0, 96.0, 59.0, 39.0, 30.0, 19.0, 18.0, 15.0, 11.0, 11.0, 10.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.05078125, -4.8975830078125, -4.744384765625, -4.5911865234375, -4.43798828125, -4.2847900390625, -4.131591796875, -3.9783935546875, -3.8251953125, -3.6719970703125, -3.518798828125, -3.3656005859375, -3.21240234375, -3.0592041015625, -2.906005859375, -2.7528076171875, -2.599609375, -2.4464111328125, -2.293212890625, -2.1400146484375, -1.98681640625, -1.8336181640625, -1.680419921875, -1.5272216796875, -1.3740234375, -1.2208251953125, -1.067626953125, -0.9144287109375, -0.76123046875, -0.6080322265625, -0.454833984375, -0.3016357421875, -0.1484375, 0.0047607421875, 0.157958984375, 0.3111572265625, 0.46435546875, 0.6175537109375, 0.770751953125, 0.9239501953125, 1.0771484375, 1.2303466796875, 1.383544921875, 1.5367431640625, 1.68994140625, 1.8431396484375, 1.996337890625, 2.1495361328125, 2.302734375, 2.4559326171875, 2.609130859375, 2.7623291015625, 2.91552734375, 3.0687255859375, 3.221923828125, 3.3751220703125, 3.5283203125, 3.6815185546875, 3.834716796875, 3.9879150390625, 4.14111328125, 4.2943115234375, 4.447509765625, 4.6007080078125, 4.75390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 16.0, 10.0, 10.0, 12.0, 19.0, 21.0, 18.0, 23.0, 36.0, 41.0, 60.0, 60.0, 59.0, 67.0, 67.0, 64.0, 55.0, 40.0, 41.0, 46.0, 33.0, 35.0, 26.0, 19.0, 10.0, 18.0, 11.0, 19.0, 5.0, 9.0, 10.0, 6.0, 4.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0002180337905883789, -0.00021154806017875671, -0.00020506232976913452, -0.00019857659935951233, -0.00019209086894989014, -0.00018560513854026794, -0.00017911940813064575, -0.00017263367772102356, -0.00016614794731140137, -0.00015966221690177917, -0.00015317648649215698, -0.0001466907560825348, -0.0001402050256729126, -0.0001337192952632904, -0.0001272335648536682, -0.00012074783444404602, -0.00011426210403442383, -0.00010777637362480164, -0.00010129064321517944, -9.480491280555725e-05, -8.831918239593506e-05, -8.183345198631287e-05, -7.534772157669067e-05, -6.886199116706848e-05, -6.237626075744629e-05, -5.58905303478241e-05, -4.9404799938201904e-05, -4.291906952857971e-05, -3.643333911895752e-05, -2.9947608709335327e-05, -2.3461878299713135e-05, -1.6976147890090942e-05, -1.049041748046875e-05, -4.004687070846558e-06, 2.4810433387756348e-06, 8.966773748397827e-06, 1.545250415802002e-05, 2.1938234567642212e-05, 2.8423964977264404e-05, 3.49096953868866e-05, 4.139542579650879e-05, 4.788115620613098e-05, 5.4366886615753174e-05, 6.0852617025375366e-05, 6.733834743499756e-05, 7.382407784461975e-05, 8.030980825424194e-05, 8.679553866386414e-05, 9.328126907348633e-05, 9.976699948310852e-05, 0.00010625272989273071, 0.0001127384603023529, 0.0001192241907119751, 0.0001257099211215973, 0.00013219565153121948, 0.00013868138194084167, 0.00014516711235046387, 0.00015165284276008606, 0.00015813857316970825, 0.00016462430357933044, 0.00017111003398895264, 0.00017759576439857483, 0.00018408149480819702, 0.00019056722521781921, 0.0001970529556274414]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 14.0, 17.0, 17.0, 37.0, 43.0, 82.0, 131.0, 166.0, 272.0, 421.0, 699.0, 1196.0, 1910.0, 3174.0, 5535.0, 10072.0, 18396.0, 35723.0, 69917.0, 139327.0, 249604.0, 240833.0, 131793.0, 65405.0, 33467.0, 17510.0, 9578.0, 5307.0, 3128.0, 1801.0, 1128.0, 657.0, 396.0, 285.0, 162.0, 116.0, 78.0, 52.0, 39.0, 19.0, 13.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4430389404296875, -1.394866943359375, -1.3466949462890625, -1.29852294921875, -1.2503509521484375, -1.202178955078125, -1.1540069580078125, -1.1058349609375, -1.0576629638671875, -1.009490966796875, -0.9613189697265625, -0.91314697265625, -0.8649749755859375, -0.816802978515625, -0.7686309814453125, -0.720458984375, -0.6722869873046875, -0.624114990234375, -0.5759429931640625, -0.52777099609375, -0.4795989990234375, -0.431427001953125, -0.3832550048828125, -0.3350830078125, -0.2869110107421875, -0.238739013671875, -0.1905670166015625, -0.14239501953125, -0.0942230224609375, -0.046051025390625, 0.0021209716796875, 0.05029296875, 0.0984649658203125, 0.146636962890625, 0.1948089599609375, 0.24298095703125, 0.2911529541015625, 0.339324951171875, 0.3874969482421875, 0.4356689453125, 0.4838409423828125, 0.532012939453125, 0.5801849365234375, 0.62835693359375, 0.6765289306640625, 0.724700927734375, 0.7728729248046875, 0.821044921875, 0.8692169189453125, 0.917388916015625, 0.9655609130859375, 1.01373291015625, 1.0619049072265625, 1.110076904296875, 1.1582489013671875, 1.2064208984375, 1.2545928955078125, 1.302764892578125, 1.3509368896484375, 1.39910888671875, 1.4472808837890625, 1.495452880859375, 1.5436248779296875, 1.591796875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 7.0, 5.0, 9.0, 11.0, 11.0, 15.0, 14.0, 25.0, 27.0, 33.0, 37.0, 47.0, 45.0, 42.0, 47.0, 54.0, 48.0, 53.0, 60.0, 49.0, 36.0, 30.0, 37.0, 46.0, 41.0, 25.0, 23.0, 15.0, 10.0, 13.0, 13.0, 16.0, 11.0, 8.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3779296875, -0.36554718017578125, -0.3531646728515625, -0.34078216552734375, -0.328399658203125, -0.31601715087890625, -0.3036346435546875, -0.29125213623046875, -0.27886962890625, -0.26648712158203125, -0.2541046142578125, -0.24172210693359375, -0.229339599609375, -0.21695709228515625, -0.2045745849609375, -0.19219207763671875, -0.1798095703125, -0.16742706298828125, -0.1550445556640625, -0.14266204833984375, -0.130279541015625, -0.11789703369140625, -0.1055145263671875, -0.09313201904296875, -0.08074951171875, -0.06836700439453125, -0.0559844970703125, -0.04360198974609375, -0.031219482421875, -0.01883697509765625, -0.0064544677734375, 0.00592803955078125, 0.018310546875, 0.03069305419921875, 0.0430755615234375, 0.05545806884765625, 0.067840576171875, 0.08022308349609375, 0.0926055908203125, 0.10498809814453125, 0.11737060546875, 0.12975311279296875, 0.1421356201171875, 0.15451812744140625, 0.166900634765625, 0.17928314208984375, 0.1916656494140625, 0.20404815673828125, 0.2164306640625, 0.22881317138671875, 0.2411956787109375, 0.25357818603515625, 0.265960693359375, 0.27834320068359375, 0.2907257080078125, 0.30310821533203125, 0.31549072265625, 0.32787322998046875, 0.3402557373046875, 0.35263824462890625, 0.365020751953125, 0.37740325927734375, 0.3897857666015625, 0.40216827392578125, 0.41455078125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 5.0, 9.0, 7.0, 15.0, 13.0, 12.0, 29.0, 33.0, 28.0, 40.0, 38.0, 53.0, 37.0, 46.0, 61.0, 72.0, 56.0, 55.0, 51.0, 48.0, 55.0, 25.0, 44.0, 30.0, 28.0, 17.0, 14.0, 14.0, 14.0, 7.0, 7.0, 9.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.376655578613281, -8.093968391418457, -7.811281204223633, -7.528594493865967, -7.245907306671143, -6.963220119476318, -6.680533409118652, -6.397846221923828, -6.115159034729004, -5.83247184753418, -5.5497846603393555, -5.2670979499816895, -4.984410762786865, -4.701723575592041, -4.419036865234375, -4.136349678039551, -3.8536624908447266, -3.5709753036499023, -3.2882883548736572, -3.005601406097412, -2.722914218902588, -2.4402270317077637, -2.1575400829315186, -1.8748530149459839, -1.5921659469604492, -1.3094788789749146, -1.0267918109893799, -0.7441047430038452, -0.46141767501831055, -0.17873060703277588, 0.10395646095275879, 0.38664352893829346, 0.6693305969238281, 0.9520176649093628, 1.2347047328948975, 1.5173918008804321, 1.8000788688659668, 2.082766056060791, 2.365453004837036, 2.6481399536132812, 2.9308271408081055, 3.2135143280029297, 3.496201276779175, 3.77888822555542, 4.061575412750244, 4.344262599945068, 4.626949310302734, 4.909636497497559, 5.192323684692383, 5.475010871887207, 5.757698059082031, 6.040384769439697, 6.3230719566345215, 6.605759143829346, 6.888445854187012, 7.171133041381836, 7.45382022857666, 7.736507415771484, 8.019194602966309, 8.301881790161133, 8.58456802368164, 8.867255210876465, 9.149942398071289, 9.432629585266113, 9.715316772460938]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 8.0, 13.0, 5.0, 16.0, 10.0, 14.0, 16.0, 26.0, 18.0, 34.0, 26.0, 32.0, 34.0, 30.0, 30.0, 48.0, 33.0, 41.0, 34.0, 36.0, 30.0, 47.0, 36.0, 37.0, 45.0, 28.0, 24.0, 27.0, 25.0, 27.0, 20.0, 23.0, 10.0, 19.0, 13.0, 11.0, 14.0, 7.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.696194648742676, -5.513446807861328, -5.3306989669799805, -5.147950649261475, -4.965202808380127, -4.782454967498779, -4.599706649780273, -4.416958808898926, -4.234210968017578, -4.0514631271362305, -3.8687150478363037, -3.685966968536377, -3.5032191276550293, -3.3204712867736816, -3.137723207473755, -2.954975128173828, -2.7722272872924805, -2.589479446411133, -2.406731367111206, -2.2239832878112793, -2.0412354469299316, -1.8584874868392944, -1.6757395267486572, -1.49299156665802, -1.3102436065673828, -1.1274956464767456, -0.9447476863861084, -0.7619997262954712, -0.579251766204834, -0.3965038061141968, -0.21375584602355957, -0.031007885932922363, 0.15174007415771484, 0.33448803424835205, 0.5172359943389893, 0.6999839544296265, 0.8827319145202637, 1.0654798746109009, 1.248227834701538, 1.4309757947921753, 1.6137237548828125, 1.7964717149734497, 1.979219675064087, 2.1619677543640137, 2.3447155952453613, 2.527463436126709, 2.7102115154266357, 2.8929595947265625, 3.07570743560791, 3.258455276489258, 3.4412033557891846, 3.6239514350891113, 3.806699275970459, 3.9894471168518066, 4.1721954345703125, 4.35494327545166, 4.537691116333008, 4.7204389572143555, 4.903186798095703, 5.085935115814209, 5.268682956695557, 5.451430797576904, 5.63417911529541, 5.816926956176758, 5.9996747970581055]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 12.0, 29.0, 44.0, 57.0, 95.0, 141.0, 197.0, 327.0, 534.0, 864.0, 1299.0, 2252.0, 3612.0, 6233.0, 10835.0, 19725.0, 35065.0, 62495.0, 105398.0, 158284.0, 191417.0, 169097.0, 116923.0, 70843.0, 39878.0, 22475.0, 12461.0, 7202.0, 4141.0, 2519.0, 1460.0, 950.0, 604.0, 394.0, 247.0, 166.0, 97.0, 68.0, 37.0, 20.0, 20.0, 8.0, 11.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9638671875, -7.685546875, -7.4072265625, -7.12890625, -6.8505859375, -6.572265625, -6.2939453125, -6.015625, -5.7373046875, -5.458984375, -5.1806640625, -4.90234375, -4.6240234375, -4.345703125, -4.0673828125, -3.7890625, -3.5107421875, -3.232421875, -2.9541015625, -2.67578125, -2.3974609375, -2.119140625, -1.8408203125, -1.5625, -1.2841796875, -1.005859375, -0.7275390625, -0.44921875, -0.1708984375, 0.107421875, 0.3857421875, 0.6640625, 0.9423828125, 1.220703125, 1.4990234375, 1.77734375, 2.0556640625, 2.333984375, 2.6123046875, 2.890625, 3.1689453125, 3.447265625, 3.7255859375, 4.00390625, 4.2822265625, 4.560546875, 4.8388671875, 5.1171875, 5.3955078125, 5.673828125, 5.9521484375, 6.23046875, 6.5087890625, 6.787109375, 7.0654296875, 7.34375, 7.6220703125, 7.900390625, 8.1787109375, 8.45703125, 8.7353515625, 9.013671875, 9.2919921875, 9.5703125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 5.0, 3.0, 12.0, 7.0, 13.0, 10.0, 8.0, 15.0, 19.0, 23.0, 25.0, 17.0, 36.0, 30.0, 29.0, 40.0, 31.0, 46.0, 49.0, 38.0, 38.0, 36.0, 39.0, 25.0, 41.0, 41.0, 38.0, 37.0, 28.0, 31.0, 26.0, 29.0, 16.0, 22.0, 15.0, 15.0, 11.0, 7.0, 10.0, 4.0, 9.0, 5.0, 5.0, 3.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.21771240234375, -5.0369873046875, -4.85626220703125, -4.675537109375, -4.49481201171875, -4.3140869140625, -4.13336181640625, -3.95263671875, -3.77191162109375, -3.5911865234375, -3.41046142578125, -3.229736328125, -3.04901123046875, -2.8682861328125, -2.68756103515625, -2.5068359375, -2.32611083984375, -2.1453857421875, -1.96466064453125, -1.783935546875, -1.60321044921875, -1.4224853515625, -1.24176025390625, -1.06103515625, -0.88031005859375, -0.6995849609375, -0.51885986328125, -0.338134765625, -0.15740966796875, 0.0233154296875, 0.20404052734375, 0.384765625, 0.56549072265625, 0.7462158203125, 0.92694091796875, 1.107666015625, 1.28839111328125, 1.4691162109375, 1.64984130859375, 1.83056640625, 2.01129150390625, 2.1920166015625, 2.37274169921875, 2.553466796875, 2.73419189453125, 2.9149169921875, 3.09564208984375, 3.2763671875, 3.45709228515625, 3.6378173828125, 3.81854248046875, 3.999267578125, 4.17999267578125, 4.3607177734375, 4.54144287109375, 4.72216796875, 4.90289306640625, 5.0836181640625, 5.26434326171875, 5.445068359375, 5.62579345703125, 5.8065185546875, 5.98724365234375, 6.16796875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [8.0, 0.0, 2.0, 6.0, 12.0, 11.0, 15.0, 18.0, 39.0, 46.0, 64.0, 101.0, 153.0, 185.0, 294.0, 420.0, 598.0, 878.0, 1310.0, 1821.0, 2803.0, 4013.0, 6337.0, 9505.0, 14818.0, 22867.0, 36199.0, 55581.0, 83225.0, 115698.0, 142173.0, 147786.0, 126237.0, 93705.0, 63336.0, 41552.0, 26814.0, 17025.0, 11082.0, 7167.0, 4661.0, 3196.0, 2079.0, 1414.0, 1046.0, 663.0, 494.0, 313.0, 242.0, 158.0, 130.0, 65.0, 56.0, 45.0, 37.0, 25.0, 15.0, 8.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0], "bins": [-5.828125, -5.64111328125, -5.4541015625, -5.26708984375, -5.080078125, -4.89306640625, -4.7060546875, -4.51904296875, -4.33203125, -4.14501953125, -3.9580078125, -3.77099609375, -3.583984375, -3.39697265625, -3.2099609375, -3.02294921875, -2.8359375, -2.64892578125, -2.4619140625, -2.27490234375, -2.087890625, -1.90087890625, -1.7138671875, -1.52685546875, -1.33984375, -1.15283203125, -0.9658203125, -0.77880859375, -0.591796875, -0.40478515625, -0.2177734375, -0.03076171875, 0.15625, 0.34326171875, 0.5302734375, 0.71728515625, 0.904296875, 1.09130859375, 1.2783203125, 1.46533203125, 1.65234375, 1.83935546875, 2.0263671875, 2.21337890625, 2.400390625, 2.58740234375, 2.7744140625, 2.96142578125, 3.1484375, 3.33544921875, 3.5224609375, 3.70947265625, 3.896484375, 4.08349609375, 4.2705078125, 4.45751953125, 4.64453125, 4.83154296875, 5.0185546875, 5.20556640625, 5.392578125, 5.57958984375, 5.7666015625, 5.95361328125, 6.140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 5.0, 9.0, 9.0, 8.0, 14.0, 12.0, 20.0, 23.0, 23.0, 28.0, 27.0, 36.0, 35.0, 27.0, 40.0, 42.0, 42.0, 39.0, 39.0, 33.0, 37.0, 49.0, 46.0, 22.0, 37.0, 34.0, 38.0, 33.0, 31.0, 25.0, 25.0, 18.0, 16.0, 11.0, 11.0, 10.0, 6.0, 4.0, 4.0, 4.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.765625, -4.63037109375, -4.4951171875, -4.35986328125, -4.224609375, -4.08935546875, -3.9541015625, -3.81884765625, -3.68359375, -3.54833984375, -3.4130859375, -3.27783203125, -3.142578125, -3.00732421875, -2.8720703125, -2.73681640625, -2.6015625, -2.46630859375, -2.3310546875, -2.19580078125, -2.060546875, -1.92529296875, -1.7900390625, -1.65478515625, -1.51953125, -1.38427734375, -1.2490234375, -1.11376953125, -0.978515625, -0.84326171875, -0.7080078125, -0.57275390625, -0.4375, -0.30224609375, -0.1669921875, -0.03173828125, 0.103515625, 0.23876953125, 0.3740234375, 0.50927734375, 0.64453125, 0.77978515625, 0.9150390625, 1.05029296875, 1.185546875, 1.32080078125, 1.4560546875, 1.59130859375, 1.7265625, 1.86181640625, 1.9970703125, 2.13232421875, 2.267578125, 2.40283203125, 2.5380859375, 2.67333984375, 2.80859375, 2.94384765625, 3.0791015625, 3.21435546875, 3.349609375, 3.48486328125, 3.6201171875, 3.75537109375, 3.890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 7.0, 8.0, 15.0, 19.0, 42.0, 60.0, 55.0, 79.0, 113.0, 193.0, 310.0, 568.0, 957.0, 1871.0, 3903.0, 9381.0, 24283.0, 78425.0, 274249.0, 418800.0, 161109.0, 46024.0, 15751.0, 6096.0, 2835.0, 1412.0, 732.0, 452.0, 266.0, 162.0, 103.0, 80.0, 63.0, 39.0, 25.0, 10.0, 7.0, 10.0, 7.0, 10.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.96875, -19.38623046875, -18.8037109375, -18.22119140625, -17.638671875, -17.05615234375, -16.4736328125, -15.89111328125, -15.30859375, -14.72607421875, -14.1435546875, -13.56103515625, -12.978515625, -12.39599609375, -11.8134765625, -11.23095703125, -10.6484375, -10.06591796875, -9.4833984375, -8.90087890625, -8.318359375, -7.73583984375, -7.1533203125, -6.57080078125, -5.98828125, -5.40576171875, -4.8232421875, -4.24072265625, -3.658203125, -3.07568359375, -2.4931640625, -1.91064453125, -1.328125, -0.74560546875, -0.1630859375, 0.41943359375, 1.001953125, 1.58447265625, 2.1669921875, 2.74951171875, 3.33203125, 3.91455078125, 4.4970703125, 5.07958984375, 5.662109375, 6.24462890625, 6.8271484375, 7.40966796875, 7.9921875, 8.57470703125, 9.1572265625, 9.73974609375, 10.322265625, 10.90478515625, 11.4873046875, 12.06982421875, 12.65234375, 13.23486328125, 13.8173828125, 14.39990234375, 14.982421875, 15.56494140625, 16.1474609375, 16.72998046875, 17.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 13.0, 13.0, 6.0, 17.0, 23.0, 24.0, 51.0, 51.0, 66.0, 91.0, 108.0, 121.0, 100.0, 80.0, 55.0, 38.0, 38.0, 30.0, 19.0, 12.0, 16.0, 5.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009946823120117188, -0.0009517073631286621, -0.0009087324142456055, -0.0008657574653625488, -0.0008227825164794922, -0.0007798075675964355, -0.0007368326187133789, -0.0006938576698303223, -0.0006508827209472656, -0.000607907772064209, -0.0005649328231811523, -0.0005219578742980957, -0.00047898292541503906, -0.0004360079765319824, -0.0003930330276489258, -0.00035005807876586914, -0.0003070831298828125, -0.00026410818099975586, -0.00022113323211669922, -0.00017815828323364258, -0.00013518333435058594, -9.22083854675293e-05, -4.9233436584472656e-05, -6.258487701416016e-06, 3.6716461181640625e-05, 7.969141006469727e-05, 0.0001226663589477539, 0.00016564130783081055, 0.0002086162567138672, 0.00025159120559692383, 0.00029456615447998047, 0.0003375411033630371, 0.00038051605224609375, 0.0004234910011291504, 0.00046646595001220703, 0.0005094408988952637, 0.0005524158477783203, 0.000595390796661377, 0.0006383657455444336, 0.0006813406944274902, 0.0007243156433105469, 0.0007672905921936035, 0.0008102655410766602, 0.0008532404899597168, 0.0008962154388427734, 0.0009391903877258301, 0.0009821653366088867, 0.0010251402854919434, 0.001068115234375, 0.0011110901832580566, 0.0011540651321411133, 0.00119704008102417, 0.0012400150299072266, 0.0012829899787902832, 0.0013259649276733398, 0.0013689398765563965, 0.0014119148254394531, 0.0014548897743225098, 0.0014978647232055664, 0.001540839672088623, 0.0015838146209716797, 0.0016267895698547363, 0.001669764518737793, 0.0017127394676208496, 0.0017557144165039062]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 11.0, 9.0, 24.0, 21.0, 38.0, 53.0, 66.0, 85.0, 120.0, 165.0, 249.0, 407.0, 666.0, 1371.0, 3293.0, 9587.0, 36036.0, 156658.0, 447038.0, 292679.0, 72490.0, 17508.0, 5412.0, 2035.0, 966.0, 526.0, 349.0, 170.0, 135.0, 102.0, 54.0, 52.0, 33.0, 34.0, 25.0, 18.0, 13.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.8125, -20.21337890625, -19.6142578125, -19.01513671875, -18.416015625, -17.81689453125, -17.2177734375, -16.61865234375, -16.01953125, -15.42041015625, -14.8212890625, -14.22216796875, -13.623046875, -13.02392578125, -12.4248046875, -11.82568359375, -11.2265625, -10.62744140625, -10.0283203125, -9.42919921875, -8.830078125, -8.23095703125, -7.6318359375, -7.03271484375, -6.43359375, -5.83447265625, -5.2353515625, -4.63623046875, -4.037109375, -3.43798828125, -2.8388671875, -2.23974609375, -1.640625, -1.04150390625, -0.4423828125, 0.15673828125, 0.755859375, 1.35498046875, 1.9541015625, 2.55322265625, 3.15234375, 3.75146484375, 4.3505859375, 4.94970703125, 5.548828125, 6.14794921875, 6.7470703125, 7.34619140625, 7.9453125, 8.54443359375, 9.1435546875, 9.74267578125, 10.341796875, 10.94091796875, 11.5400390625, 12.13916015625, 12.73828125, 13.33740234375, 13.9365234375, 14.53564453125, 15.134765625, 15.73388671875, 16.3330078125, 16.93212890625, 17.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 10.0, 17.0, 25.0, 35.0, 39.0, 71.0, 121.0, 119.0, 128.0, 113.0, 99.0, 65.0, 49.0, 32.0, 20.0, 22.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.949462890625, -4.80517578125, -4.660888671875, -4.5166015625, -4.372314453125, -4.22802734375, -4.083740234375, -3.939453125, -3.795166015625, -3.65087890625, -3.506591796875, -3.3623046875, -3.218017578125, -3.07373046875, -2.929443359375, -2.78515625, -2.640869140625, -2.49658203125, -2.352294921875, -2.2080078125, -2.063720703125, -1.91943359375, -1.775146484375, -1.630859375, -1.486572265625, -1.34228515625, -1.197998046875, -1.0537109375, -0.909423828125, -0.76513671875, -0.620849609375, -0.4765625, -0.332275390625, -0.18798828125, -0.043701171875, 0.1005859375, 0.244873046875, 0.38916015625, 0.533447265625, 0.677734375, 0.822021484375, 0.96630859375, 1.110595703125, 1.2548828125, 1.399169921875, 1.54345703125, 1.687744140625, 1.83203125, 1.976318359375, 2.12060546875, 2.264892578125, 2.4091796875, 2.553466796875, 2.69775390625, 2.842041015625, 2.986328125, 3.130615234375, 3.27490234375, 3.419189453125, 3.5634765625, 3.707763671875, 3.85205078125, 3.996337890625, 4.140625]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 11.0, 11.0, 17.0, 8.0, 14.0, 20.0, 28.0, 45.0, 48.0, 52.0, 49.0, 58.0, 71.0, 65.0, 59.0, 52.0, 50.0, 55.0, 47.0, 38.0, 31.0, 31.0, 33.0, 19.0, 23.0, 12.0, 11.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.411050796508789, -8.113692283630371, -7.816334247589111, -7.518975734710693, -7.221617698669434, -6.924259185791016, -6.626900672912598, -6.329542636871338, -6.032184600830078, -5.73482608795166, -5.4374680519104, -5.140109539031982, -4.842751502990723, -4.545392990112305, -4.248034477233887, -3.950676441192627, -3.653317928314209, -3.35595965385437, -3.0586013793945312, -2.7612428665161133, -2.4638848304748535, -2.1665263175964355, -1.8691680431365967, -1.5718097686767578, -1.274451494216919, -0.9770932197570801, -0.6797348856925964, -0.3823765516281128, -0.08501827716827393, 0.21233999729156494, 0.5096983909606934, 0.8070566654205322, 1.104414939880371, 1.40177321434021, 1.6991314888000488, 1.9964898824691772, 2.2938480377197266, 2.5912065505981445, 2.8885648250579834, 3.1859230995178223, 3.483281373977661, 3.7806396484375, 4.077998161315918, 4.375356197357178, 4.672714710235596, 4.9700727462768555, 5.267431259155273, 5.564789772033691, 5.862147808074951, 6.159506320953369, 6.456864356994629, 6.754222869873047, 7.051580905914307, 7.348939418792725, 7.646297454833984, 7.943655967712402, 8.24101448059082, 8.538372993469238, 8.835731506347656, 9.133089065551758, 9.430447578430176, 9.727806091308594, 10.025164604187012, 10.32252311706543, 10.619880676269531]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 2.0, 7.0, 5.0, 2.0, 2.0, 9.0, 10.0, 6.0, 14.0, 16.0, 15.0, 18.0, 18.0, 34.0, 29.0, 17.0, 30.0, 27.0, 28.0, 27.0, 36.0, 35.0, 47.0, 38.0, 48.0, 27.0, 47.0, 36.0, 28.0, 22.0, 39.0, 32.0, 30.0, 26.0, 25.0, 28.0, 21.0, 14.0, 20.0, 13.0, 10.0, 19.0, 14.0, 5.0, 7.0, 5.0, 5.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.186312198638916, -6.003700256347656, -5.8210883140563965, -5.638476371765137, -5.455864429473877, -5.273252487182617, -5.090640544891357, -4.908028602600098, -4.725416660308838, -4.542804718017578, -4.360192775726318, -4.177580833435059, -3.994968891143799, -3.812356948852539, -3.6297450065612793, -3.4471330642700195, -3.2645208835601807, -3.081908941268921, -2.899296998977661, -2.7166850566864014, -2.5340731143951416, -2.351461172103882, -2.168848991394043, -1.9862371683120728, -1.803625226020813, -1.6210132837295532, -1.4384013414382935, -1.2557892799377441, -1.0731773376464844, -0.8905654549598694, -0.7079534530639648, -0.5253415107727051, -0.3427295684814453, -0.16011761128902435, 0.022494345903396606, 0.20510631799697876, 0.3877182602882385, 0.5703302025794983, 0.7529422044754028, 0.9355541467666626, 1.1181660890579224, 1.3007780313491821, 1.483389973640442, 1.6660020351409912, 1.848613977432251, 2.0312259197235107, 2.2138378620147705, 2.3964498043060303, 2.57906174659729, 2.76167368888855, 2.9442856311798096, 3.1268975734710693, 3.309509515762329, 3.492121458053589, 3.6747336387634277, 3.8573455810546875, 4.039957523345947, 4.222569465637207, 4.405181407928467, 4.587793350219727, 4.770405292510986, 4.953017234802246, 5.135629177093506, 5.318241119384766, 5.500853061676025]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 7.0, 7.0, 7.0, 10.0, 14.0, 31.0, 32.0, 68.0, 70.0, 163.0, 203.0, 274.0, 407.0, 625.0, 1017.0, 1546.0, 2396.0, 3777.0, 5652.0, 9263.0, 15120.0, 25485.0, 44816.0, 79050.0, 145080.0, 273344.0, 506066.0, 790298.0, 860680.0, 628876.0, 359274.0, 192795.0, 104658.0, 58145.0, 33571.0, 19636.0, 11622.0, 7274.0, 4510.0, 2843.0, 1927.0, 1185.0, 808.0, 556.0, 379.0, 214.0, 178.0, 109.0, 96.0, 50.0, 31.0, 19.0, 18.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.140625, -5.94390869140625, -5.7471923828125, -5.55047607421875, -5.353759765625, -5.15704345703125, -4.9603271484375, -4.76361083984375, -4.56689453125, -4.37017822265625, -4.1734619140625, -3.97674560546875, -3.780029296875, -3.58331298828125, -3.3865966796875, -3.18988037109375, -2.9931640625, -2.79644775390625, -2.5997314453125, -2.40301513671875, -2.206298828125, -2.00958251953125, -1.8128662109375, -1.61614990234375, -1.41943359375, -1.22271728515625, -1.0260009765625, -0.82928466796875, -0.632568359375, -0.43585205078125, -0.2391357421875, -0.04241943359375, 0.154296875, 0.35101318359375, 0.5477294921875, 0.74444580078125, 0.941162109375, 1.13787841796875, 1.3345947265625, 1.53131103515625, 1.72802734375, 1.92474365234375, 2.1214599609375, 2.31817626953125, 2.514892578125, 2.71160888671875, 2.9083251953125, 3.10504150390625, 3.3017578125, 3.49847412109375, 3.6951904296875, 3.89190673828125, 4.088623046875, 4.28533935546875, 4.4820556640625, 4.67877197265625, 4.87548828125, 5.07220458984375, 5.2689208984375, 5.46563720703125, 5.662353515625, 5.85906982421875, 6.0557861328125, 6.25250244140625, 6.44921875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 6.0, 2.0, 3.0, 3.0, 9.0, 5.0, 6.0, 13.0, 5.0, 6.0, 9.0, 16.0, 25.0, 23.0, 29.0, 26.0, 23.0, 36.0, 20.0, 34.0, 19.0, 38.0, 39.0, 41.0, 27.0, 29.0, 49.0, 33.0, 48.0, 31.0, 38.0, 32.0, 32.0, 34.0, 24.0, 20.0, 29.0, 21.0, 21.0, 19.0, 17.0, 14.0, 7.0, 11.0, 6.0, 12.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.724609375, -3.599578857421875, -3.47454833984375, -3.349517822265625, -3.2244873046875, -3.099456787109375, -2.97442626953125, -2.849395751953125, -2.724365234375, -2.599334716796875, -2.47430419921875, -2.349273681640625, -2.2242431640625, -2.099212646484375, -1.97418212890625, -1.849151611328125, -1.72412109375, -1.599090576171875, -1.47406005859375, -1.349029541015625, -1.2239990234375, -1.098968505859375, -0.97393798828125, -0.848907470703125, -0.723876953125, -0.598846435546875, -0.47381591796875, -0.348785400390625, -0.2237548828125, -0.098724365234375, 0.02630615234375, 0.151336669921875, 0.2763671875, 0.401397705078125, 0.52642822265625, 0.651458740234375, 0.7764892578125, 0.901519775390625, 1.02655029296875, 1.151580810546875, 1.276611328125, 1.401641845703125, 1.52667236328125, 1.651702880859375, 1.7767333984375, 1.901763916015625, 2.02679443359375, 2.151824951171875, 2.27685546875, 2.401885986328125, 2.52691650390625, 2.651947021484375, 2.7769775390625, 2.902008056640625, 3.02703857421875, 3.152069091796875, 3.277099609375, 3.402130126953125, 3.52716064453125, 3.652191162109375, 3.7772216796875, 3.902252197265625, 4.02728271484375, 4.152313232421875, 4.27734375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 4.0, 7.0, 15.0, 12.0, 23.0, 38.0, 58.0, 100.0, 147.0, 210.0, 293.0, 423.0, 713.0, 1105.0, 1669.0, 2598.0, 4135.0, 6563.0, 10398.0, 17365.0, 28614.0, 48184.0, 82582.0, 142720.0, 241622.0, 402969.0, 608902.0, 753030.0, 672889.0, 465473.0, 288033.0, 169470.0, 99109.0, 57487.0, 34194.0, 20221.0, 12338.0, 7460.0, 4723.0, 3009.0, 1900.0, 1213.0, 802.0, 501.0, 301.0, 225.0, 148.0, 95.0, 81.0, 36.0, 27.0, 20.0, 15.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-5.67578125, -5.49652099609375, -5.3172607421875, -5.13800048828125, -4.958740234375, -4.77947998046875, -4.6002197265625, -4.42095947265625, -4.24169921875, -4.06243896484375, -3.8831787109375, -3.70391845703125, -3.524658203125, -3.34539794921875, -3.1661376953125, -2.98687744140625, -2.8076171875, -2.62835693359375, -2.4490966796875, -2.26983642578125, -2.090576171875, -1.91131591796875, -1.7320556640625, -1.55279541015625, -1.37353515625, -1.19427490234375, -1.0150146484375, -0.83575439453125, -0.656494140625, -0.47723388671875, -0.2979736328125, -0.11871337890625, 0.060546875, 0.23980712890625, 0.4190673828125, 0.59832763671875, 0.777587890625, 0.95684814453125, 1.1361083984375, 1.31536865234375, 1.49462890625, 1.67388916015625, 1.8531494140625, 2.03240966796875, 2.211669921875, 2.39093017578125, 2.5701904296875, 2.74945068359375, 2.9287109375, 3.10797119140625, 3.2872314453125, 3.46649169921875, 3.645751953125, 3.82501220703125, 4.0042724609375, 4.18353271484375, 4.36279296875, 4.54205322265625, 4.7213134765625, 4.90057373046875, 5.079833984375, 5.25909423828125, 5.4383544921875, 5.61761474609375, 5.796875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 10.0, 2.0, 12.0, 14.0, 20.0, 21.0, 25.0, 26.0, 23.0, 41.0, 55.0, 67.0, 93.0, 102.0, 132.0, 163.0, 182.0, 172.0, 211.0, 246.0, 254.0, 244.0, 258.0, 240.0, 231.0, 186.0, 164.0, 167.0, 138.0, 107.0, 90.0, 74.0, 59.0, 50.0, 36.0, 31.0, 28.0, 18.0, 16.0, 18.0, 14.0, 8.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.041015625, -1.974884033203125, -1.90875244140625, -1.842620849609375, -1.7764892578125, -1.710357666015625, -1.64422607421875, -1.578094482421875, -1.511962890625, -1.445831298828125, -1.37969970703125, -1.313568115234375, -1.2474365234375, -1.181304931640625, -1.11517333984375, -1.049041748046875, -0.98291015625, -0.916778564453125, -0.85064697265625, -0.784515380859375, -0.7183837890625, -0.652252197265625, -0.58612060546875, -0.519989013671875, -0.453857421875, -0.387725830078125, -0.32159423828125, -0.255462646484375, -0.1893310546875, -0.123199462890625, -0.05706787109375, 0.009063720703125, 0.0751953125, 0.141326904296875, 0.20745849609375, 0.273590087890625, 0.3397216796875, 0.405853271484375, 0.47198486328125, 0.538116455078125, 0.604248046875, 0.670379638671875, 0.73651123046875, 0.802642822265625, 0.8687744140625, 0.934906005859375, 1.00103759765625, 1.067169189453125, 1.13330078125, 1.199432373046875, 1.26556396484375, 1.331695556640625, 1.3978271484375, 1.463958740234375, 1.53009033203125, 1.596221923828125, 1.662353515625, 1.728485107421875, 1.79461669921875, 1.860748291015625, 1.9268798828125, 1.993011474609375, 2.05914306640625, 2.125274658203125, 2.19140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 0.0, 5.0, 7.0, 9.0, 11.0, 17.0, 14.0, 33.0, 33.0, 29.0, 38.0, 55.0, 55.0, 55.0, 81.0, 84.0, 67.0, 57.0, 57.0, 55.0, 49.0, 49.0, 25.0, 32.0, 20.0, 17.0, 14.0, 9.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.106962203979492, -7.835235118865967, -7.5635085105896, -7.291781425476074, -7.020054817199707, -6.748327732086182, -6.476600646972656, -6.204874038696289, -5.933146953582764, -5.661419868469238, -5.389693260192871, -5.117966175079346, -4.84623908996582, -4.574512481689453, -4.302785396575928, -4.031058311462402, -3.759331703186035, -3.487604856491089, -3.2158780097961426, -2.944150924682617, -2.672424077987671, -2.4006972312927246, -2.128970146179199, -1.857243299484253, -1.5855164527893066, -1.3137896060943604, -1.0420626401901245, -0.7703357338905334, -0.4986088275909424, -0.2268819808959961, 0.044844985008239746, 0.3165719509124756, 0.5882987976074219, 0.8600257039070129, 1.131752610206604, 1.4034795761108398, 1.6752064228057861, 1.9469332695007324, 2.218660354614258, 2.490387201309204, 2.7621140480041504, 3.0338408946990967, 3.305567741394043, 3.5772948265075684, 3.8490216732025146, 4.120748519897461, 4.392475605010986, 4.664202690124512, 4.935929298400879, 5.207656383514404, 5.4793829917907715, 5.751110076904297, 6.022836685180664, 6.2945637702941895, 6.566290855407715, 6.838017463684082, 7.109744548797607, 7.381471633911133, 7.6531982421875, 7.924925327301025, 8.19665241241455, 8.468379020690918, 8.740105628967285, 9.011833190917969, 9.283559799194336]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 9.0, 12.0, 8.0, 7.0, 16.0, 18.0, 18.0, 23.0, 28.0, 26.0, 23.0, 39.0, 36.0, 40.0, 38.0, 38.0, 51.0, 45.0, 38.0, 37.0, 49.0, 41.0, 36.0, 31.0, 30.0, 35.0, 33.0, 21.0, 23.0, 21.0, 26.0, 23.0, 14.0, 14.0, 11.0, 7.0, 8.0, 11.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.849778175354004, -5.6817708015441895, -5.513762950897217, -5.345755577087402, -5.17774772644043, -5.009740352630615, -4.841732978820801, -4.673725128173828, -4.5057172775268555, -4.337709903717041, -4.169702053070068, -4.001694679260254, -3.8336868286132812, -3.665679454803467, -3.4976718425750732, -3.3296642303466797, -3.1616568565368652, -2.9936492443084717, -2.825641632080078, -2.6576342582702637, -2.489626407623291, -2.3216190338134766, -2.153611421585083, -1.9856038093566895, -1.817596197128296, -1.6495885848999023, -1.4815809726715088, -1.3135734796524048, -1.1455658674240112, -0.9775582551956177, -0.8095507621765137, -0.6415431499481201, -0.47353506088256836, -0.3055274784564972, -0.13751989603042603, 0.030487656593322754, 0.1984952688217163, 0.36650288105010986, 0.5345103740692139, 0.7025179862976074, 0.870525598526001, 1.0385332107543945, 1.206540822982788, 1.374548316001892, 1.5425559282302856, 1.7105635404586792, 1.8785710334777832, 2.0465786457061768, 2.2145862579345703, 2.382593870162964, 2.5506014823913574, 2.718608856201172, 2.8866167068481445, 3.054624080657959, 3.2226316928863525, 3.390639305114746, 3.5586469173431396, 3.726654529571533, 3.8946621417999268, 4.06266975402832, 4.230677127838135, 4.398684978485107, 4.566692352294922, 4.7347002029418945, 4.902707576751709]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 9.0, 23.0, 19.0, 30.0, 56.0, 79.0, 121.0, 199.0, 284.0, 429.0, 619.0, 937.0, 1306.0, 2049.0, 3371.0, 5073.0, 7916.0, 12267.0, 19274.0, 30350.0, 47941.0, 75047.0, 111741.0, 151599.0, 165040.0, 138344.0, 97719.0, 63699.0, 40961.0, 25758.0, 16423.0, 10638.0, 6805.0, 4282.0, 2793.0, 1798.0, 1191.0, 814.0, 513.0, 330.0, 231.0, 156.0, 94.0, 69.0, 57.0, 34.0, 20.0, 17.0, 12.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.5595703125, -1.5081329345703125, -1.456695556640625, -1.4052581787109375, -1.35382080078125, -1.3023834228515625, -1.250946044921875, -1.1995086669921875, -1.1480712890625, -1.0966339111328125, -1.045196533203125, -0.9937591552734375, -0.94232177734375, -0.8908843994140625, -0.839447021484375, -0.7880096435546875, -0.736572265625, -0.6851348876953125, -0.633697509765625, -0.5822601318359375, -0.53082275390625, -0.4793853759765625, -0.427947998046875, -0.3765106201171875, -0.3250732421875, -0.2736358642578125, -0.222198486328125, -0.1707611083984375, -0.11932373046875, -0.0678863525390625, -0.016448974609375, 0.0349884033203125, 0.08642578125, 0.1378631591796875, 0.189300537109375, 0.2407379150390625, 0.29217529296875, 0.3436126708984375, 0.395050048828125, 0.4464874267578125, 0.4979248046875, 0.5493621826171875, 0.600799560546875, 0.6522369384765625, 0.70367431640625, 0.7551116943359375, 0.806549072265625, 0.8579864501953125, 0.909423828125, 0.9608612060546875, 1.012298583984375, 1.0637359619140625, 1.11517333984375, 1.1666107177734375, 1.218048095703125, 1.2694854736328125, 1.3209228515625, 1.3723602294921875, 1.423797607421875, 1.4752349853515625, 1.52667236328125, 1.5781097412109375, 1.629547119140625, 1.6809844970703125, 1.732421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 7.0, 5.0, 13.0, 12.0, 17.0, 26.0, 21.0, 27.0, 30.0, 35.0, 43.0, 31.0, 39.0, 31.0, 53.0, 50.0, 34.0, 40.0, 50.0, 40.0, 47.0, 40.0, 42.0, 24.0, 31.0, 31.0, 22.0, 21.0, 22.0, 16.0, 17.0, 25.0, 7.0, 8.0, 11.0, 12.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.2890625, -6.106201171875, -5.92333984375, -5.740478515625, -5.5576171875, -5.374755859375, -5.19189453125, -5.009033203125, -4.826171875, -4.643310546875, -4.46044921875, -4.277587890625, -4.0947265625, -3.911865234375, -3.72900390625, -3.546142578125, -3.36328125, -3.180419921875, -2.99755859375, -2.814697265625, -2.6318359375, -2.448974609375, -2.26611328125, -2.083251953125, -1.900390625, -1.717529296875, -1.53466796875, -1.351806640625, -1.1689453125, -0.986083984375, -0.80322265625, -0.620361328125, -0.4375, -0.254638671875, -0.07177734375, 0.111083984375, 0.2939453125, 0.476806640625, 0.65966796875, 0.842529296875, 1.025390625, 1.208251953125, 1.39111328125, 1.573974609375, 1.7568359375, 1.939697265625, 2.12255859375, 2.305419921875, 2.48828125, 2.671142578125, 2.85400390625, 3.036865234375, 3.2197265625, 3.402587890625, 3.58544921875, 3.768310546875, 3.951171875, 4.134033203125, 4.31689453125, 4.499755859375, 4.6826171875, 4.865478515625, 5.04833984375, 5.231201171875, 5.4140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 14.0, 18.0, 20.0, 30.0, 34.0, 56.0, 90.0, 111.0, 153.0, 202.0, 316.0, 453.0, 606.0, 916.0, 1330.0, 1950.0, 2878.0, 4533.0, 7138.0, 11989.0, 22749.0, 81009.0, 824131.0, 42079.0, 18066.0, 9979.0, 5996.0, 3784.0, 2440.0, 1703.0, 1193.0, 815.0, 484.0, 360.0, 247.0, 199.0, 128.0, 94.0, 82.0, 30.0, 41.0, 27.0, 16.0, 9.0, 8.0, 11.0, 3.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.078125, -3.947998046875, -3.81787109375, -3.687744140625, -3.5576171875, -3.427490234375, -3.29736328125, -3.167236328125, -3.037109375, -2.906982421875, -2.77685546875, -2.646728515625, -2.5166015625, -2.386474609375, -2.25634765625, -2.126220703125, -1.99609375, -1.865966796875, -1.73583984375, -1.605712890625, -1.4755859375, -1.345458984375, -1.21533203125, -1.085205078125, -0.955078125, -0.824951171875, -0.69482421875, -0.564697265625, -0.4345703125, -0.304443359375, -0.17431640625, -0.044189453125, 0.0859375, 0.216064453125, 0.34619140625, 0.476318359375, 0.6064453125, 0.736572265625, 0.86669921875, 0.996826171875, 1.126953125, 1.257080078125, 1.38720703125, 1.517333984375, 1.6474609375, 1.777587890625, 1.90771484375, 2.037841796875, 2.16796875, 2.298095703125, 2.42822265625, 2.558349609375, 2.6884765625, 2.818603515625, 2.94873046875, 3.078857421875, 3.208984375, 3.339111328125, 3.46923828125, 3.599365234375, 3.7294921875, 3.859619140625, 3.98974609375, 4.119873046875, 4.25]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 5.0, 8.0, 10.0, 13.0, 16.0, 20.0, 17.0, 20.0, 23.0, 24.0, 27.0, 34.0, 30.0, 34.0, 43.0, 31.0, 55.0, 54.0, 44.0, 45.0, 36.0, 37.0, 39.0, 44.0, 42.0, 41.0, 33.0, 19.0, 25.0, 16.0, 23.0, 19.0, 11.0, 7.0, 6.0, 13.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9140625, -3.7760009765625, -3.637939453125, -3.4998779296875, -3.36181640625, -3.2237548828125, -3.085693359375, -2.9476318359375, -2.8095703125, -2.6715087890625, -2.533447265625, -2.3953857421875, -2.25732421875, -2.1192626953125, -1.981201171875, -1.8431396484375, -1.705078125, -1.5670166015625, -1.428955078125, -1.2908935546875, -1.15283203125, -1.0147705078125, -0.876708984375, -0.7386474609375, -0.6005859375, -0.4625244140625, -0.324462890625, -0.1864013671875, -0.04833984375, 0.0897216796875, 0.227783203125, 0.3658447265625, 0.50390625, 0.6419677734375, 0.780029296875, 0.9180908203125, 1.05615234375, 1.1942138671875, 1.332275390625, 1.4703369140625, 1.6083984375, 1.7464599609375, 1.884521484375, 2.0225830078125, 2.16064453125, 2.2987060546875, 2.436767578125, 2.5748291015625, 2.712890625, 2.8509521484375, 2.989013671875, 3.1270751953125, 3.26513671875, 3.4031982421875, 3.541259765625, 3.6793212890625, 3.8173828125, 3.9554443359375, 4.093505859375, 4.2315673828125, 4.36962890625, 4.5076904296875, 4.645751953125, 4.7838134765625, 4.921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 19.0, 13.0, 11.0, 28.0, 35.0, 51.0, 68.0, 66.0, 115.0, 158.0, 191.0, 281.0, 447.0, 654.0, 970.0, 1567.0, 2405.0, 3785.0, 6177.0, 10946.0, 20743.0, 73722.0, 851059.0, 35683.0, 16061.0, 8812.0, 5107.0, 3223.0, 2031.0, 1299.0, 867.0, 584.0, 405.0, 260.0, 201.0, 151.0, 91.0, 77.0, 50.0, 33.0, 30.0, 21.0, 21.0, 12.0, 8.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.759765625, -1.706939697265625, -1.65411376953125, -1.601287841796875, -1.5484619140625, -1.495635986328125, -1.44281005859375, -1.389984130859375, -1.337158203125, -1.284332275390625, -1.23150634765625, -1.178680419921875, -1.1258544921875, -1.073028564453125, -1.02020263671875, -0.967376708984375, -0.91455078125, -0.861724853515625, -0.80889892578125, -0.756072998046875, -0.7032470703125, -0.650421142578125, -0.59759521484375, -0.544769287109375, -0.491943359375, -0.439117431640625, -0.38629150390625, -0.333465576171875, -0.2806396484375, -0.227813720703125, -0.17498779296875, -0.122161865234375, -0.0693359375, -0.016510009765625, 0.03631591796875, 0.089141845703125, 0.1419677734375, 0.194793701171875, 0.24761962890625, 0.300445556640625, 0.353271484375, 0.406097412109375, 0.45892333984375, 0.511749267578125, 0.5645751953125, 0.617401123046875, 0.67022705078125, 0.723052978515625, 0.77587890625, 0.828704833984375, 0.88153076171875, 0.934356689453125, 0.9871826171875, 1.040008544921875, 1.09283447265625, 1.145660400390625, 1.198486328125, 1.251312255859375, 1.30413818359375, 1.356964111328125, 1.4097900390625, 1.462615966796875, 1.51544189453125, 1.568267822265625, 1.62109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 19.0, 22.0, 37.0, 57.0, 71.0, 98.0, 113.0, 122.0, 104.0, 78.0, 67.0, 44.0, 32.0, 19.0, 17.0, 17.0, 2.0, 8.0, 7.0, 4.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00021076202392578125, -0.00020478293299674988, -0.0001988038420677185, -0.00019282475113868713, -0.00018684566020965576, -0.0001808665692806244, -0.00017488747835159302, -0.00016890838742256165, -0.00016292929649353027, -0.0001569502055644989, -0.00015097111463546753, -0.00014499202370643616, -0.00013901293277740479, -0.0001330338418483734, -0.00012705475091934204, -0.00012107565999031067, -0.0001150965690612793, -0.00010911747813224792, -0.00010313838720321655, -9.715929627418518e-05, -9.118020534515381e-05, -8.520111441612244e-05, -7.922202348709106e-05, -7.324293255805969e-05, -6.726384162902832e-05, -6.128475069999695e-05, -5.5305659770965576e-05, -4.9326568841934204e-05, -4.334747791290283e-05, -3.736838698387146e-05, -3.138929605484009e-05, -2.5410205125808716e-05, -1.9431114196777344e-05, -1.3452023267745972e-05, -7.4729323387146e-06, -1.4938414096832275e-06, 4.4852495193481445e-06, 1.0464340448379517e-05, 1.644343137741089e-05, 2.242252230644226e-05, 2.8401613235473633e-05, 3.4380704164505005e-05, 4.035979509353638e-05, 4.633888602256775e-05, 5.231797695159912e-05, 5.829706788063049e-05, 6.427615880966187e-05, 7.025524973869324e-05, 7.623434066772461e-05, 8.221343159675598e-05, 8.819252252578735e-05, 9.417161345481873e-05, 0.0001001507043838501, 0.00010612979531288147, 0.00011210888624191284, 0.00011808797717094421, 0.00012406706809997559, 0.00013004615902900696, 0.00013602524995803833, 0.0001420043408870697, 0.00014798343181610107, 0.00015396252274513245, 0.00015994161367416382, 0.0001659207046031952, 0.00017189979553222656]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 7.0, 7.0, 13.0, 21.0, 34.0, 42.0, 61.0, 76.0, 116.0, 177.0, 260.0, 402.0, 629.0, 898.0, 1407.0, 2186.0, 3504.0, 5583.0, 9501.0, 15300.0, 25773.0, 43533.0, 73987.0, 126400.0, 198073.0, 206229.0, 135998.0, 80311.0, 47045.0, 27878.0, 16356.0, 10080.0, 6094.0, 3724.0, 2429.0, 1495.0, 985.0, 679.0, 410.0, 266.0, 190.0, 135.0, 87.0, 64.0, 36.0, 19.0, 17.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.736328125, -0.7126312255859375, -0.688934326171875, -0.6652374267578125, -0.64154052734375, -0.6178436279296875, -0.594146728515625, -0.5704498291015625, -0.5467529296875, -0.5230560302734375, -0.499359130859375, -0.4756622314453125, -0.45196533203125, -0.4282684326171875, -0.404571533203125, -0.3808746337890625, -0.357177734375, -0.3334808349609375, -0.309783935546875, -0.2860870361328125, -0.26239013671875, -0.2386932373046875, -0.214996337890625, -0.1912994384765625, -0.1676025390625, -0.1439056396484375, -0.120208740234375, -0.0965118408203125, -0.07281494140625, -0.0491180419921875, -0.025421142578125, -0.0017242431640625, 0.02197265625, 0.0456695556640625, 0.069366455078125, 0.0930633544921875, 0.11676025390625, 0.1404571533203125, 0.164154052734375, 0.1878509521484375, 0.2115478515625, 0.2352447509765625, 0.258941650390625, 0.2826385498046875, 0.30633544921875, 0.3300323486328125, 0.353729248046875, 0.3774261474609375, 0.401123046875, 0.4248199462890625, 0.448516845703125, 0.4722137451171875, 0.49591064453125, 0.5196075439453125, 0.543304443359375, 0.5670013427734375, 0.5906982421875, 0.6143951416015625, 0.638092041015625, 0.6617889404296875, 0.68548583984375, 0.7091827392578125, 0.732879638671875, 0.7565765380859375, 0.7802734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 19.0, 14.0, 25.0, 27.0, 33.0, 31.0, 40.0, 49.0, 44.0, 51.0, 54.0, 51.0, 53.0, 44.0, 65.0, 50.0, 45.0, 41.0, 27.0, 37.0, 24.0, 22.0, 18.0, 12.0, 12.0, 10.0, 14.0, 9.0, 5.0, 4.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24935150146484375, -0.2411346435546875, -0.23291778564453125, -0.224700927734375, -0.21648406982421875, -0.2082672119140625, -0.20005035400390625, -0.19183349609375, -0.18361663818359375, -0.1753997802734375, -0.16718292236328125, -0.158966064453125, -0.15074920654296875, -0.1425323486328125, -0.13431549072265625, -0.1260986328125, -0.11788177490234375, -0.1096649169921875, -0.10144805908203125, -0.093231201171875, -0.08501434326171875, -0.0767974853515625, -0.06858062744140625, -0.06036376953125, -0.05214691162109375, -0.0439300537109375, -0.03571319580078125, -0.027496337890625, -0.01927947998046875, -0.0110626220703125, -0.00284576416015625, 0.00537109375, 0.01358795166015625, 0.0218048095703125, 0.03002166748046875, 0.038238525390625, 0.04645538330078125, 0.0546722412109375, 0.06288909912109375, 0.07110595703125, 0.07932281494140625, 0.0875396728515625, 0.09575653076171875, 0.103973388671875, 0.11219024658203125, 0.1204071044921875, 0.12862396240234375, 0.1368408203125, 0.14505767822265625, 0.1532745361328125, 0.16149139404296875, 0.169708251953125, 0.17792510986328125, 0.1861419677734375, 0.19435882568359375, 0.20257568359375, 0.21079254150390625, 0.2190093994140625, 0.22722625732421875, 0.235443115234375, 0.24365997314453125, 0.2518768310546875, 0.26009368896484375, 0.268310546875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 7.0, 14.0, 14.0, 16.0, 28.0, 34.0, 38.0, 47.0, 45.0, 58.0, 64.0, 74.0, 84.0, 70.0, 72.0, 46.0, 62.0, 52.0, 29.0, 33.0, 27.0, 15.0, 19.0, 14.0, 8.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.229190826416016, -7.951141834259033, -7.673092842102051, -7.395044326782227, -7.116995334625244, -6.838946342468262, -6.5608978271484375, -6.282848834991455, -6.004799842834473, -5.72675085067749, -5.448701858520508, -5.170653343200684, -4.892604351043701, -4.614555358886719, -4.3365068435668945, -4.058457851409912, -3.7804088592529297, -3.5023598670959473, -3.224311113357544, -2.9462623596191406, -2.668213367462158, -2.390164375305176, -2.1121156215667725, -1.8340667486190796, -1.5560178756713867, -1.2779690027236938, -0.999920129776001, -0.7218712568283081, -0.44382238388061523, -0.16577351093292236, 0.11227536201477051, 0.3903242349624634, 0.6683740615844727, 0.9464229345321655, 1.2244718074798584, 1.5025206804275513, 1.7805695533752441, 2.0586185455322266, 2.33666729927063, 2.614716053009033, 2.8927650451660156, 3.170814037322998, 3.4488627910614014, 3.7269115447998047, 4.004960536956787, 4.2830095291137695, 4.561058044433594, 4.839107036590576, 5.117156028747559, 5.395205020904541, 5.673254013061523, 5.951302528381348, 6.22935152053833, 6.5074005126953125, 6.785449028015137, 7.063498020172119, 7.341547012329102, 7.619596004486084, 7.897644996643066, 8.17569351196289, 8.453742980957031, 8.731791496276855, 9.00984001159668, 9.28788948059082, 9.565937995910645]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 9.0, 14.0, 21.0, 22.0, 22.0, 29.0, 28.0, 24.0, 37.0, 39.0, 43.0, 41.0, 43.0, 48.0, 46.0, 32.0, 48.0, 45.0, 46.0, 29.0, 33.0, 39.0, 28.0, 24.0, 28.0, 22.0, 24.0, 19.0, 19.0, 11.0, 15.0, 6.0, 10.0, 11.0, 3.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.924797058105469, -5.7518486976623535, -5.578900337219238, -5.405952453613281, -5.233004093170166, -5.060055732727051, -4.887107849121094, -4.7141594886779785, -4.541211128234863, -4.368262767791748, -4.195314407348633, -4.022366523742676, -3.8494181632995605, -3.6764698028564453, -3.503521680831909, -3.330573558807373, -3.157625198364258, -2.9846768379211426, -2.8117287158966064, -2.6387805938720703, -2.465832233428955, -2.29288387298584, -2.1199357509613037, -1.946987509727478, -1.7740392684936523, -1.6010910272598267, -1.428142786026001, -1.2551945447921753, -1.0822463035583496, -0.9092980623245239, -0.7363498210906982, -0.5634015798568726, -0.39045286178588867, -0.217504620552063, -0.044556379318237305, 0.12839186191558838, 0.30134010314941406, 0.47428834438323975, 0.6472365856170654, 0.8201848268508911, 0.9931330680847168, 1.1660813093185425, 1.3390295505523682, 1.5119777917861938, 1.6849260330200195, 1.8578742742538452, 2.030822515487671, 2.203770637512207, 2.3767189979553223, 2.5496673583984375, 2.7226154804229736, 2.8955636024475098, 3.068511962890625, 3.2414603233337402, 3.4144084453582764, 3.5873565673828125, 3.7603049278259277, 3.933253288269043, 4.106201171875, 4.279149532318115, 4.4520978927612305, 4.625046253204346, 4.797994613647461, 4.970942497253418, 5.143890857696533]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 5.0, 9.0, 16.0, 14.0, 34.0, 35.0, 55.0, 91.0, 116.0, 199.0, 252.0, 397.0, 587.0, 832.0, 1310.0, 1877.0, 2924.0, 4276.0, 6176.0, 9534.0, 14046.0, 20801.0, 30915.0, 45108.0, 64110.0, 87238.0, 111080.0, 126907.0, 126229.0, 109124.0, 85512.0, 62809.0, 44059.0, 30282.0, 20342.0, 13616.0, 9014.0, 6169.0, 4062.0, 2793.0, 1792.0, 1188.0, 859.0, 580.0, 390.0, 258.0, 178.0, 106.0, 86.0, 59.0, 32.0, 23.0, 20.0, 16.0, 6.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.5546875, -4.4075927734375, -4.260498046875, -4.1134033203125, -3.96630859375, -3.8192138671875, -3.672119140625, -3.5250244140625, -3.3779296875, -3.2308349609375, -3.083740234375, -2.9366455078125, -2.78955078125, -2.6424560546875, -2.495361328125, -2.3482666015625, -2.201171875, -2.0540771484375, -1.906982421875, -1.7598876953125, -1.61279296875, -1.4656982421875, -1.318603515625, -1.1715087890625, -1.0244140625, -0.8773193359375, -0.730224609375, -0.5831298828125, -0.43603515625, -0.2889404296875, -0.141845703125, 0.0052490234375, 0.15234375, 0.2994384765625, 0.446533203125, 0.5936279296875, 0.74072265625, 0.8878173828125, 1.034912109375, 1.1820068359375, 1.3291015625, 1.4761962890625, 1.623291015625, 1.7703857421875, 1.91748046875, 2.0645751953125, 2.211669921875, 2.3587646484375, 2.505859375, 2.6529541015625, 2.800048828125, 2.9471435546875, 3.09423828125, 3.2413330078125, 3.388427734375, 3.5355224609375, 3.6826171875, 3.8297119140625, 3.976806640625, 4.1239013671875, 4.27099609375, 4.4180908203125, 4.565185546875, 4.7122802734375, 4.859375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 6.0, 5.0, 7.0, 24.0, 20.0, 11.0, 24.0, 27.0, 27.0, 33.0, 35.0, 37.0, 44.0, 38.0, 40.0, 50.0, 44.0, 51.0, 41.0, 47.0, 35.0, 29.0, 41.0, 40.0, 30.0, 28.0, 30.0, 26.0, 31.0, 20.0, 22.0, 9.0, 6.0, 6.0, 7.0, 7.0, 5.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.61328125, -6.43634033203125, -6.2593994140625, -6.08245849609375, -5.905517578125, -5.72857666015625, -5.5516357421875, -5.37469482421875, -5.19775390625, -5.02081298828125, -4.8438720703125, -4.66693115234375, -4.489990234375, -4.31304931640625, -4.1361083984375, -3.95916748046875, -3.7822265625, -3.60528564453125, -3.4283447265625, -3.25140380859375, -3.074462890625, -2.89752197265625, -2.7205810546875, -2.54364013671875, -2.36669921875, -2.18975830078125, -2.0128173828125, -1.83587646484375, -1.658935546875, -1.48199462890625, -1.3050537109375, -1.12811279296875, -0.951171875, -0.77423095703125, -0.5972900390625, -0.42034912109375, -0.243408203125, -0.06646728515625, 0.1104736328125, 0.28741455078125, 0.46435546875, 0.64129638671875, 0.8182373046875, 0.99517822265625, 1.172119140625, 1.34906005859375, 1.5260009765625, 1.70294189453125, 1.8798828125, 2.05682373046875, 2.2337646484375, 2.41070556640625, 2.587646484375, 2.76458740234375, 2.9415283203125, 3.11846923828125, 3.29541015625, 3.47235107421875, 3.6492919921875, 3.82623291015625, 4.003173828125, 4.18011474609375, 4.3570556640625, 4.53399658203125, 4.7109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 16.0, 36.0, 37.0, 76.0, 100.0, 173.0, 275.0, 400.0, 691.0, 1173.0, 1905.0, 3180.0, 5298.0, 8996.0, 15324.0, 25724.0, 43032.0, 71236.0, 109577.0, 150350.0, 169462.0, 150723.0, 110458.0, 71969.0, 44098.0, 26385.0, 15316.0, 9062.0, 5428.0, 3205.0, 1856.0, 1160.0, 673.0, 419.0, 281.0, 175.0, 94.0, 72.0, 41.0, 21.0, 20.0, 16.0, 11.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.4305419921875, -4.263427734375, -4.0963134765625, -3.92919921875, -3.7620849609375, -3.594970703125, -3.4278564453125, -3.2607421875, -3.0936279296875, -2.926513671875, -2.7593994140625, -2.59228515625, -2.4251708984375, -2.258056640625, -2.0909423828125, -1.923828125, -1.7567138671875, -1.589599609375, -1.4224853515625, -1.25537109375, -1.0882568359375, -0.921142578125, -0.7540283203125, -0.5869140625, -0.4197998046875, -0.252685546875, -0.0855712890625, 0.08154296875, 0.2486572265625, 0.415771484375, 0.5828857421875, 0.75, 0.9171142578125, 1.084228515625, 1.2513427734375, 1.41845703125, 1.5855712890625, 1.752685546875, 1.9197998046875, 2.0869140625, 2.2540283203125, 2.421142578125, 2.5882568359375, 2.75537109375, 2.9224853515625, 3.089599609375, 3.2567138671875, 3.423828125, 3.5909423828125, 3.758056640625, 3.9251708984375, 4.09228515625, 4.2593994140625, 4.426513671875, 4.5936279296875, 4.7607421875, 4.9278564453125, 5.094970703125, 5.2620849609375, 5.42919921875, 5.5963134765625, 5.763427734375, 5.9305419921875, 6.09765625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 13.0, 5.0, 6.0, 18.0, 6.0, 10.0, 13.0, 21.0, 13.0, 24.0, 24.0, 29.0, 37.0, 28.0, 32.0, 28.0, 47.0, 46.0, 40.0, 49.0, 50.0, 41.0, 40.0, 46.0, 38.0, 23.0, 39.0, 33.0, 21.0, 18.0, 26.0, 22.0, 21.0, 18.0, 14.0, 17.0, 12.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.31640625, -4.18438720703125, -4.0523681640625, -3.92034912109375, -3.788330078125, -3.65631103515625, -3.5242919921875, -3.39227294921875, -3.26025390625, -3.12823486328125, -2.9962158203125, -2.86419677734375, -2.732177734375, -2.60015869140625, -2.4681396484375, -2.33612060546875, -2.2041015625, -2.07208251953125, -1.9400634765625, -1.80804443359375, -1.676025390625, -1.54400634765625, -1.4119873046875, -1.27996826171875, -1.14794921875, -1.01593017578125, -0.8839111328125, -0.75189208984375, -0.619873046875, -0.48785400390625, -0.3558349609375, -0.22381591796875, -0.091796875, 0.04022216796875, 0.1722412109375, 0.30426025390625, 0.436279296875, 0.56829833984375, 0.7003173828125, 0.83233642578125, 0.96435546875, 1.09637451171875, 1.2283935546875, 1.36041259765625, 1.492431640625, 1.62445068359375, 1.7564697265625, 1.88848876953125, 2.0205078125, 2.15252685546875, 2.2845458984375, 2.41656494140625, 2.548583984375, 2.68060302734375, 2.8126220703125, 2.94464111328125, 3.07666015625, 3.20867919921875, 3.3406982421875, 3.47271728515625, 3.604736328125, 3.73675537109375, 3.8687744140625, 4.00079345703125, 4.1328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 13.0, 22.0, 38.0, 68.0, 95.0, 158.0, 282.0, 499.0, 961.0, 1711.0, 3487.0, 7773.0, 18918.0, 54102.0, 169702.0, 383499.0, 267489.0, 88908.0, 29807.0, 11214.0, 4898.0, 2264.0, 1143.0, 599.0, 315.0, 223.0, 114.0, 68.0, 53.0, 38.0, 23.0, 15.0, 11.0, 6.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.5, -10.1790771484375, -9.858154296875, -9.5372314453125, -9.21630859375, -8.8953857421875, -8.574462890625, -8.2535400390625, -7.9326171875, -7.6116943359375, -7.290771484375, -6.9698486328125, -6.64892578125, -6.3280029296875, -6.007080078125, -5.6861572265625, -5.365234375, -5.0443115234375, -4.723388671875, -4.4024658203125, -4.08154296875, -3.7606201171875, -3.439697265625, -3.1187744140625, -2.7978515625, -2.4769287109375, -2.156005859375, -1.8350830078125, -1.51416015625, -1.1932373046875, -0.872314453125, -0.5513916015625, -0.23046875, 0.0904541015625, 0.411376953125, 0.7322998046875, 1.05322265625, 1.3741455078125, 1.695068359375, 2.0159912109375, 2.3369140625, 2.6578369140625, 2.978759765625, 3.2996826171875, 3.62060546875, 3.9415283203125, 4.262451171875, 4.5833740234375, 4.904296875, 5.2252197265625, 5.546142578125, 5.8670654296875, 6.18798828125, 6.5089111328125, 6.829833984375, 7.1507568359375, 7.4716796875, 7.7926025390625, 8.113525390625, 8.4344482421875, 8.75537109375, 9.0762939453125, 9.397216796875, 9.7181396484375, 10.0390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 11.0, 12.0, 15.0, 20.0, 31.0, 21.0, 31.0, 40.0, 52.0, 46.0, 35.0, 65.0, 53.0, 68.0, 63.0, 60.0, 50.0, 46.0, 51.0, 47.0, 30.0, 35.0, 19.0, 19.0, 13.0, 10.0, 8.0, 10.0, 8.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00045680999755859375, -0.0004429668188095093, -0.0004291236400604248, -0.00041528046131134033, -0.00040143728256225586, -0.0003875941038131714, -0.0003737509250640869, -0.00035990774631500244, -0.00034606456756591797, -0.0003322213888168335, -0.000318378210067749, -0.00030453503131866455, -0.0002906918525695801, -0.0002768486738204956, -0.00026300549507141113, -0.00024916231632232666, -0.0002353191375732422, -0.00022147595882415771, -0.00020763278007507324, -0.00019378960132598877, -0.0001799464225769043, -0.00016610324382781982, -0.00015226006507873535, -0.00013841688632965088, -0.0001245737075805664, -0.00011073052883148193, -9.688735008239746e-05, -8.304417133331299e-05, -6.920099258422852e-05, -5.535781383514404e-05, -4.151463508605957e-05, -2.7671456336975098e-05, -1.3828277587890625e-05, 1.4901161193847656e-08, 1.385807991027832e-05, 2.7701258659362793e-05, 4.1544437408447266e-05, 5.538761615753174e-05, 6.923079490661621e-05, 8.307397365570068e-05, 9.691715240478516e-05, 0.00011076033115386963, 0.0001246035099029541, 0.00013844668865203857, 0.00015228986740112305, 0.00016613304615020752, 0.000179976224899292, 0.00019381940364837646, 0.00020766258239746094, 0.0002215057611465454, 0.00023534893989562988, 0.00024919211864471436, 0.00026303529739379883, 0.0002768784761428833, 0.0002907216548919678, 0.00030456483364105225, 0.0003184080123901367, 0.0003322511911392212, 0.00034609436988830566, 0.00035993754863739014, 0.0003737807273864746, 0.0003876239061355591, 0.00040146708488464355, 0.00041531026363372803, 0.0004291534423828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 3.0, 13.0, 12.0, 21.0, 26.0, 37.0, 52.0, 77.0, 114.0, 204.0, 291.0, 424.0, 697.0, 1135.0, 1982.0, 3497.0, 6604.0, 13414.0, 29688.0, 69528.0, 160943.0, 280028.0, 251471.0, 127685.0, 53854.0, 23125.0, 10841.0, 5467.0, 2824.0, 1731.0, 1003.0, 643.0, 384.0, 238.0, 156.0, 112.0, 64.0, 44.0, 40.0, 18.0, 16.0, 17.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.65972900390625, -6.4366455078125, -6.21356201171875, -5.990478515625, -5.76739501953125, -5.5443115234375, -5.32122802734375, -5.09814453125, -4.87506103515625, -4.6519775390625, -4.42889404296875, -4.205810546875, -3.98272705078125, -3.7596435546875, -3.53656005859375, -3.3134765625, -3.09039306640625, -2.8673095703125, -2.64422607421875, -2.421142578125, -2.19805908203125, -1.9749755859375, -1.75189208984375, -1.52880859375, -1.30572509765625, -1.0826416015625, -0.85955810546875, -0.636474609375, -0.41339111328125, -0.1903076171875, 0.03277587890625, 0.255859375, 0.47894287109375, 0.7020263671875, 0.92510986328125, 1.148193359375, 1.37127685546875, 1.5943603515625, 1.81744384765625, 2.04052734375, 2.26361083984375, 2.4866943359375, 2.70977783203125, 2.932861328125, 3.15594482421875, 3.3790283203125, 3.60211181640625, 3.8251953125, 4.04827880859375, 4.2713623046875, 4.49444580078125, 4.717529296875, 4.94061279296875, 5.1636962890625, 5.38677978515625, 5.60986328125, 5.83294677734375, 6.0560302734375, 6.27911376953125, 6.502197265625, 6.72528076171875, 6.9483642578125, 7.17144775390625, 7.39453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 5.0, 15.0, 10.0, 10.0, 20.0, 23.0, 39.0, 41.0, 81.0, 79.0, 110.0, 110.0, 92.0, 89.0, 50.0, 40.0, 27.0, 35.0, 21.0, 24.0, 9.0, 12.0, 7.0, 5.0, 6.0, 4.0, 6.0, 0.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.4609375, -3.35986328125, -3.2587890625, -3.15771484375, -3.056640625, -2.95556640625, -2.8544921875, -2.75341796875, -2.65234375, -2.55126953125, -2.4501953125, -2.34912109375, -2.248046875, -2.14697265625, -2.0458984375, -1.94482421875, -1.84375, -1.74267578125, -1.6416015625, -1.54052734375, -1.439453125, -1.33837890625, -1.2373046875, -1.13623046875, -1.03515625, -0.93408203125, -0.8330078125, -0.73193359375, -0.630859375, -0.52978515625, -0.4287109375, -0.32763671875, -0.2265625, -0.12548828125, -0.0244140625, 0.07666015625, 0.177734375, 0.27880859375, 0.3798828125, 0.48095703125, 0.58203125, 0.68310546875, 0.7841796875, 0.88525390625, 0.986328125, 1.08740234375, 1.1884765625, 1.28955078125, 1.390625, 1.49169921875, 1.5927734375, 1.69384765625, 1.794921875, 1.89599609375, 1.9970703125, 2.09814453125, 2.19921875, 2.30029296875, 2.4013671875, 2.50244140625, 2.603515625, 2.70458984375, 2.8056640625, 2.90673828125, 3.0078125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 4.0, 16.0, 21.0, 25.0, 29.0, 31.0, 45.0, 48.0, 66.0, 65.0, 71.0, 91.0, 73.0, 79.0, 67.0, 53.0, 50.0, 43.0, 20.0, 20.0, 21.0, 12.0, 13.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9293670654296875, -7.647541522979736, -7.365716457366943, -7.083890914916992, -6.802065372467041, -6.52023983001709, -6.238414764404297, -5.956589221954346, -5.6747636795043945, -5.392938137054443, -5.11111307144165, -4.829287528991699, -4.547461986541748, -4.265636444091797, -3.983811378479004, -3.7019858360290527, -3.4201607704162598, -3.1383354663848877, -2.8565099239349365, -2.5746846199035645, -2.2928590774536133, -2.011033773422241, -1.7292084693908691, -1.4473830461502075, -1.165557622909546, -0.8837321996688843, -0.6019068360328674, -0.3200814723968506, -0.038256049156188965, 0.24356937408447266, 0.5253946781158447, 0.8072201013565063, 1.089045524597168, 1.3708709478378296, 1.6526963710784912, 1.9345216751098633, 2.2163472175598145, 2.4981725215911865, 2.7799978256225586, 3.0618233680725098, 3.343648672103882, 3.625473976135254, 3.907299518585205, 4.189125061035156, 4.470950126647949, 4.7527756690979, 5.034601211547852, 5.3164262771606445, 5.598251819610596, 5.880077362060547, 6.16190242767334, 6.443727970123291, 6.725553512573242, 7.007378578186035, 7.289204120635986, 7.5710296630859375, 7.8528547286987305, 8.134679794311523, 8.416505813598633, 8.698330879211426, 8.980155944824219, 9.261981964111328, 9.543807029724121, 9.825632095336914, 10.107458114624023]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 3.0, 3.0, 5.0, 7.0, 4.0, 14.0, 12.0, 17.0, 21.0, 23.0, 24.0, 22.0, 29.0, 45.0, 27.0, 41.0, 33.0, 42.0, 52.0, 37.0, 29.0, 47.0, 39.0, 29.0, 47.0, 48.0, 28.0, 29.0, 24.0, 31.0, 24.0, 28.0, 27.0, 15.0, 19.0, 15.0, 15.0, 15.0, 11.0, 5.0, 6.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.836164951324463, -5.655647277832031, -5.475129127502441, -5.294610977172852, -5.11409330368042, -4.933575630187988, -4.753057479858398, -4.572539329528809, -4.392021656036377, -4.211503982543945, -4.0309858322143555, -3.8504679203033447, -3.669950008392334, -3.4894320964813232, -3.3089141845703125, -3.1283962726593018, -2.947878360748291, -2.7673604488372803, -2.5868425369262695, -2.406324625015259, -2.225806713104248, -2.0452888011932373, -1.8647708892822266, -1.6842529773712158, -1.503735065460205, -1.3232171535491943, -1.1426992416381836, -0.9621813297271729, -0.7816634178161621, -0.6011455059051514, -0.4206275939941406, -0.24010968208312988, -0.05959129333496094, 0.1209266185760498, 0.30144453048706055, 0.4819624423980713, 0.662480354309082, 0.8429982662200928, 1.0235161781311035, 1.2040340900421143, 1.384552001953125, 1.5650699138641357, 1.7455878257751465, 1.9261057376861572, 2.106623649597168, 2.2871415615081787, 2.4676594734191895, 2.6481773853302, 2.828695297241211, 3.0092132091522217, 3.1897311210632324, 3.370249032974243, 3.550766944885254, 3.7312848567962646, 3.9118027687072754, 4.092320442199707, 4.272838592529297, 4.453356742858887, 4.633874416351318, 4.81439208984375, 4.99491024017334, 5.17542839050293, 5.355946063995361, 5.536463737487793, 5.716981887817383]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 7.0, 6.0, 11.0, 12.0, 15.0, 23.0, 39.0, 51.0, 103.0, 131.0, 199.0, 296.0, 463.0, 732.0, 1198.0, 1966.0, 3413.0, 6195.0, 11297.0, 20973.0, 41158.0, 84003.0, 181458.0, 404994.0, 825437.0, 1106660.0, 791045.0, 381939.0, 170126.0, 78954.0, 37907.0, 19182.0, 10273.0, 5636.0, 3266.0, 1970.0, 1161.0, 669.0, 492.0, 286.0, 169.0, 119.0, 86.0, 55.0, 32.0, 27.0, 18.0, 18.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-6.62890625, -6.4246826171875, -6.220458984375, -6.0162353515625, -5.81201171875, -5.6077880859375, -5.403564453125, -5.1993408203125, -4.9951171875, -4.7908935546875, -4.586669921875, -4.3824462890625, -4.17822265625, -3.9739990234375, -3.769775390625, -3.5655517578125, -3.361328125, -3.1571044921875, -2.952880859375, -2.7486572265625, -2.54443359375, -2.3402099609375, -2.135986328125, -1.9317626953125, -1.7275390625, -1.5233154296875, -1.319091796875, -1.1148681640625, -0.91064453125, -0.7064208984375, -0.502197265625, -0.2979736328125, -0.09375, 0.1104736328125, 0.314697265625, 0.5189208984375, 0.72314453125, 0.9273681640625, 1.131591796875, 1.3358154296875, 1.5400390625, 1.7442626953125, 1.948486328125, 2.1527099609375, 2.35693359375, 2.5611572265625, 2.765380859375, 2.9696044921875, 3.173828125, 3.3780517578125, 3.582275390625, 3.7864990234375, 3.99072265625, 4.1949462890625, 4.399169921875, 4.6033935546875, 4.8076171875, 5.0118408203125, 5.216064453125, 5.4202880859375, 5.62451171875, 5.8287353515625, 6.032958984375, 6.2371826171875, 6.44140625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 11.0, 7.0, 12.0, 22.0, 21.0, 22.0, 22.0, 27.0, 27.0, 37.0, 37.0, 35.0, 52.0, 45.0, 47.0, 33.0, 38.0, 43.0, 37.0, 31.0, 39.0, 22.0, 40.0, 43.0, 38.0, 33.0, 26.0, 24.0, 10.0, 19.0, 15.0, 17.0, 17.0, 10.0, 10.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.676300048828125, -3.55963134765625, -3.442962646484375, -3.3262939453125, -3.209625244140625, -3.09295654296875, -2.976287841796875, -2.859619140625, -2.742950439453125, -2.62628173828125, -2.509613037109375, -2.3929443359375, -2.276275634765625, -2.15960693359375, -2.042938232421875, -1.92626953125, -1.809600830078125, -1.69293212890625, -1.576263427734375, -1.4595947265625, -1.342926025390625, -1.22625732421875, -1.109588623046875, -0.992919921875, -0.876251220703125, -0.75958251953125, -0.642913818359375, -0.5262451171875, -0.409576416015625, -0.29290771484375, -0.176239013671875, -0.0595703125, 0.057098388671875, 0.17376708984375, 0.290435791015625, 0.4071044921875, 0.523773193359375, 0.64044189453125, 0.757110595703125, 0.873779296875, 0.990447998046875, 1.10711669921875, 1.223785400390625, 1.3404541015625, 1.457122802734375, 1.57379150390625, 1.690460205078125, 1.80712890625, 1.923797607421875, 2.04046630859375, 2.157135009765625, 2.2738037109375, 2.390472412109375, 2.50714111328125, 2.623809814453125, 2.740478515625, 2.857147216796875, 2.97381591796875, 3.090484619140625, 3.2071533203125, 3.323822021484375, 3.44049072265625, 3.557159423828125, 3.673828125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 8.0, 20.0, 20.0, 31.0, 66.0, 69.0, 108.0, 128.0, 232.0, 373.0, 513.0, 745.0, 1099.0, 1795.0, 2774.0, 4490.0, 7219.0, 12021.0, 19952.0, 34184.0, 59727.0, 106214.0, 188841.0, 329165.0, 541379.0, 756543.0, 766135.0, 558444.0, 341447.0, 197232.0, 111090.0, 62699.0, 35717.0, 21235.0, 12450.0, 7281.0, 4679.0, 2781.0, 1881.0, 1114.0, 740.0, 557.0, 348.0, 230.0, 160.0, 118.0, 79.0, 50.0, 26.0, 25.0, 15.0, 17.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.9921875, -4.83636474609375, -4.6805419921875, -4.52471923828125, -4.368896484375, -4.21307373046875, -4.0572509765625, -3.90142822265625, -3.74560546875, -3.58978271484375, -3.4339599609375, -3.27813720703125, -3.122314453125, -2.96649169921875, -2.8106689453125, -2.65484619140625, -2.4990234375, -2.34320068359375, -2.1873779296875, -2.03155517578125, -1.875732421875, -1.71990966796875, -1.5640869140625, -1.40826416015625, -1.25244140625, -1.09661865234375, -0.9407958984375, -0.78497314453125, -0.629150390625, -0.47332763671875, -0.3175048828125, -0.16168212890625, -0.005859375, 0.14996337890625, 0.3057861328125, 0.46160888671875, 0.617431640625, 0.77325439453125, 0.9290771484375, 1.08489990234375, 1.24072265625, 1.39654541015625, 1.5523681640625, 1.70819091796875, 1.864013671875, 2.01983642578125, 2.1756591796875, 2.33148193359375, 2.4873046875, 2.64312744140625, 2.7989501953125, 2.95477294921875, 3.110595703125, 3.26641845703125, 3.4222412109375, 3.57806396484375, 3.73388671875, 3.88970947265625, 4.0455322265625, 4.20135498046875, 4.357177734375, 4.51300048828125, 4.6688232421875, 4.82464599609375, 4.98046875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 13.0, 18.0, 25.0, 22.0, 47.0, 51.0, 58.0, 91.0, 94.0, 121.0, 167.0, 171.0, 203.0, 240.0, 288.0, 309.0, 256.0, 268.0, 280.0, 250.0, 209.0, 180.0, 130.0, 125.0, 91.0, 78.0, 66.0, 40.0, 42.0, 29.0, 24.0, 24.0, 15.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.23046875, -2.1687164306640625, -2.106964111328125, -2.0452117919921875, -1.98345947265625, -1.9217071533203125, -1.859954833984375, -1.7982025146484375, -1.7364501953125, -1.6746978759765625, -1.612945556640625, -1.5511932373046875, -1.48944091796875, -1.4276885986328125, -1.365936279296875, -1.3041839599609375, -1.242431640625, -1.1806793212890625, -1.118927001953125, -1.0571746826171875, -0.99542236328125, -0.9336700439453125, -0.871917724609375, -0.8101654052734375, -0.7484130859375, -0.6866607666015625, -0.624908447265625, -0.5631561279296875, -0.50140380859375, -0.4396514892578125, -0.377899169921875, -0.3161468505859375, -0.25439453125, -0.1926422119140625, -0.130889892578125, -0.0691375732421875, -0.00738525390625, 0.0543670654296875, 0.116119384765625, 0.1778717041015625, 0.2396240234375, 0.3013763427734375, 0.363128662109375, 0.4248809814453125, 0.48663330078125, 0.5483856201171875, 0.610137939453125, 0.6718902587890625, 0.733642578125, 0.7953948974609375, 0.857147216796875, 0.9188995361328125, 0.98065185546875, 1.0424041748046875, 1.104156494140625, 1.1659088134765625, 1.2276611328125, 1.2894134521484375, 1.351165771484375, 1.4129180908203125, 1.47467041015625, 1.5364227294921875, 1.598175048828125, 1.6599273681640625, 1.7216796875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 13.0, 22.0, 22.0, 33.0, 41.0, 39.0, 54.0, 68.0, 81.0, 66.0, 81.0, 53.0, 81.0, 64.0, 70.0, 42.0, 33.0, 26.0, 20.0, 18.0, 15.0, 7.0, 9.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.195919513702393, -5.962164402008057, -5.728409290313721, -5.494654178619385, -5.260899543762207, -5.027144432067871, -4.793389320373535, -4.559634208679199, -4.325879096984863, -4.092123985290527, -3.8583688735961914, -3.6246140003204346, -3.3908588886260986, -3.1571037769317627, -2.923348903656006, -2.68959379196167, -2.455838680267334, -2.222083568572998, -1.9883285760879517, -1.7545735836029053, -1.5208184719085693, -1.2870633602142334, -1.053308367729187, -0.8195533752441406, -0.5857982635498047, -0.3520432114601135, -0.11828815937042236, 0.1154668927192688, 0.34922194480895996, 0.5829770565032959, 0.8167320489883423, 1.0504870414733887, 1.2842426300048828, 1.5179977416992188, 1.7517527341842651, 1.9855077266693115, 2.2192628383636475, 2.4530179500579834, 2.6867728233337402, 2.920527935028076, 3.154283046722412, 3.388038158416748, 3.621793270111084, 3.855548143386841, 4.089303016662598, 4.323058128356934, 4.5568132400512695, 4.7905683517456055, 5.024323463439941, 5.258078575134277, 5.491833686828613, 5.725588798522949, 5.959343910217285, 6.193099021911621, 6.426853656768799, 6.660608768463135, 6.894363880157471, 7.128118991851807, 7.361874103546143, 7.5956292152404785, 7.829383850097656, 8.063138961791992, 8.296894073486328, 8.530649185180664, 8.764404296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 7.0, 13.0, 6.0, 19.0, 14.0, 28.0, 25.0, 27.0, 34.0, 36.0, 34.0, 44.0, 51.0, 38.0, 52.0, 44.0, 43.0, 32.0, 46.0, 44.0, 33.0, 35.0, 27.0, 28.0, 30.0, 34.0, 24.0, 29.0, 25.0, 11.0, 13.0, 9.0, 13.0, 12.0, 5.0, 11.0, 8.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.548825263977051, -4.397319316864014, -4.245813369750977, -4.0943074226379395, -3.9428014755249023, -3.7912955284118652, -3.639789581298828, -3.488283634185791, -3.336777687072754, -3.185271739959717, -3.0337657928466797, -2.8822598457336426, -2.7307538986206055, -2.5792479515075684, -2.4277420043945312, -2.276236057281494, -2.124730348587036, -1.973224401473999, -1.821718454360962, -1.6702125072479248, -1.5187065601348877, -1.3672006130218506, -1.215694785118103, -1.064188838005066, -0.9126828908920288, -0.7611769437789917, -0.6096709966659546, -0.45816510915756226, -0.30665916204452515, -0.15515321493148804, -0.003647327423095703, 0.1478586196899414, 0.2993645668029785, 0.4508705139160156, 0.6023764610290527, 0.7538823485374451, 0.9053882956504822, 1.056894302368164, 1.2084001302719116, 1.3599060773849487, 1.5114120244979858, 1.662917971611023, 1.81442391872406, 1.9659297466278076, 2.1174356937408447, 2.268941640853882, 2.420447587966919, 2.571953535079956, 2.723459482192993, 2.8749654293060303, 3.0264713764190674, 3.1779773235321045, 3.3294832706451416, 3.4809892177581787, 3.6324949264526367, 3.784000873565674, 3.935506820678711, 4.087012767791748, 4.238518714904785, 4.390024662017822, 4.541530609130859, 4.6930365562438965, 4.844542503356934, 4.996048450469971, 5.147554397583008]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 9.0, 8.0, 5.0, 11.0, 15.0, 27.0, 26.0, 39.0, 56.0, 81.0, 148.0, 251.0, 434.0, 729.0, 1275.0, 2242.0, 4016.0, 7384.0, 14448.0, 27744.0, 53823.0, 102481.0, 181313.0, 238863.0, 186995.0, 107195.0, 56845.0, 29499.0, 15053.0, 7970.0, 4178.0, 2229.0, 1302.0, 712.0, 398.0, 290.0, 166.0, 86.0, 67.0, 36.0, 30.0, 27.0, 10.0, 17.0, 7.0, 11.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.186920166015625, -1.14044189453125, -1.093963623046875, -1.0474853515625, -1.001007080078125, -0.95452880859375, -0.908050537109375, -0.861572265625, -0.815093994140625, -0.76861572265625, -0.722137451171875, -0.6756591796875, -0.629180908203125, -0.58270263671875, -0.536224365234375, -0.48974609375, -0.443267822265625, -0.39678955078125, -0.350311279296875, -0.3038330078125, -0.257354736328125, -0.21087646484375, -0.164398193359375, -0.117919921875, -0.071441650390625, -0.02496337890625, 0.021514892578125, 0.0679931640625, 0.114471435546875, 0.16094970703125, 0.207427978515625, 0.25390625, 0.300384521484375, 0.34686279296875, 0.393341064453125, 0.4398193359375, 0.486297607421875, 0.53277587890625, 0.579254150390625, 0.625732421875, 0.672210693359375, 0.71868896484375, 0.765167236328125, 0.8116455078125, 0.858123779296875, 0.90460205078125, 0.951080322265625, 0.99755859375, 1.044036865234375, 1.09051513671875, 1.136993408203125, 1.1834716796875, 1.229949951171875, 1.27642822265625, 1.322906494140625, 1.369384765625, 1.415863037109375, 1.46234130859375, 1.508819580078125, 1.5552978515625, 1.601776123046875, 1.64825439453125, 1.694732666015625, 1.7412109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 10.0, 6.0, 11.0, 20.0, 12.0, 21.0, 26.0, 25.0, 22.0, 22.0, 30.0, 33.0, 44.0, 53.0, 42.0, 42.0, 44.0, 43.0, 40.0, 43.0, 44.0, 35.0, 39.0, 29.0, 32.0, 21.0, 29.0, 24.0, 28.0, 19.0, 20.0, 16.0, 8.0, 12.0, 14.0, 10.0, 9.0, 13.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.12518310546875, -3.9691162109375, -3.81304931640625, -3.656982421875, -3.50091552734375, -3.3448486328125, -3.18878173828125, -3.03271484375, -2.87664794921875, -2.7205810546875, -2.56451416015625, -2.408447265625, -2.25238037109375, -2.0963134765625, -1.94024658203125, -1.7841796875, -1.62811279296875, -1.4720458984375, -1.31597900390625, -1.159912109375, -1.00384521484375, -0.8477783203125, -0.69171142578125, -0.53564453125, -0.37957763671875, -0.2235107421875, -0.06744384765625, 0.088623046875, 0.24468994140625, 0.4007568359375, 0.55682373046875, 0.712890625, 0.86895751953125, 1.0250244140625, 1.18109130859375, 1.337158203125, 1.49322509765625, 1.6492919921875, 1.80535888671875, 1.96142578125, 2.11749267578125, 2.2735595703125, 2.42962646484375, 2.585693359375, 2.74176025390625, 2.8978271484375, 3.05389404296875, 3.2099609375, 3.36602783203125, 3.5220947265625, 3.67816162109375, 3.834228515625, 3.99029541015625, 4.1463623046875, 4.30242919921875, 4.45849609375, 4.61456298828125, 4.7706298828125, 4.92669677734375, 5.082763671875, 5.23883056640625, 5.3948974609375, 5.55096435546875, 5.70703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 2.0, 10.0, 5.0, 13.0, 12.0, 26.0, 28.0, 41.0, 52.0, 70.0, 109.0, 148.0, 210.0, 320.0, 502.0, 721.0, 1162.0, 1777.0, 3040.0, 5326.0, 9684.0, 20313.0, 66851.0, 844900.0, 52989.0, 18508.0, 9193.0, 4920.0, 2712.0, 1725.0, 1077.0, 700.0, 473.0, 259.0, 200.0, 126.0, 108.0, 64.0, 38.0, 30.0, 25.0, 16.0, 15.0, 10.0, 11.0, 8.0, 10.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -2.997802734375, -2.89599609375, -2.794189453125, -2.6923828125, -2.590576171875, -2.48876953125, -2.386962890625, -2.28515625, -2.183349609375, -2.08154296875, -1.979736328125, -1.8779296875, -1.776123046875, -1.67431640625, -1.572509765625, -1.470703125, -1.368896484375, -1.26708984375, -1.165283203125, -1.0634765625, -0.961669921875, -0.85986328125, -0.758056640625, -0.65625, -0.554443359375, -0.45263671875, -0.350830078125, -0.2490234375, -0.147216796875, -0.04541015625, 0.056396484375, 0.158203125, 0.260009765625, 0.36181640625, 0.463623046875, 0.5654296875, 0.667236328125, 0.76904296875, 0.870849609375, 0.97265625, 1.074462890625, 1.17626953125, 1.278076171875, 1.3798828125, 1.481689453125, 1.58349609375, 1.685302734375, 1.787109375, 1.888916015625, 1.99072265625, 2.092529296875, 2.1943359375, 2.296142578125, 2.39794921875, 2.499755859375, 2.6015625, 2.703369140625, 2.80517578125, 2.906982421875, 3.0087890625, 3.110595703125, 3.21240234375, 3.314208984375, 3.416015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 13.0, 15.0, 14.0, 16.0, 27.0, 30.0, 28.0, 28.0, 29.0, 34.0, 38.0, 42.0, 50.0, 53.0, 53.0, 44.0, 54.0, 55.0, 46.0, 41.0, 44.0, 29.0, 35.0, 33.0, 17.0, 29.0, 25.0, 14.0, 9.0, 11.0, 9.0, 7.0, 2.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.0892333984375, -4.897216796875, -4.7052001953125, -4.51318359375, -4.3211669921875, -4.129150390625, -3.9371337890625, -3.7451171875, -3.5531005859375, -3.361083984375, -3.1690673828125, -2.97705078125, -2.7850341796875, -2.593017578125, -2.4010009765625, -2.208984375, -2.0169677734375, -1.824951171875, -1.6329345703125, -1.44091796875, -1.2489013671875, -1.056884765625, -0.8648681640625, -0.6728515625, -0.4808349609375, -0.288818359375, -0.0968017578125, 0.09521484375, 0.2872314453125, 0.479248046875, 0.6712646484375, 0.86328125, 1.0552978515625, 1.247314453125, 1.4393310546875, 1.63134765625, 1.8233642578125, 2.015380859375, 2.2073974609375, 2.3994140625, 2.5914306640625, 2.783447265625, 2.9754638671875, 3.16748046875, 3.3594970703125, 3.551513671875, 3.7435302734375, 3.935546875, 4.1275634765625, 4.319580078125, 4.5115966796875, 4.70361328125, 4.8956298828125, 5.087646484375, 5.2796630859375, 5.4716796875, 5.6636962890625, 5.855712890625, 6.0477294921875, 6.23974609375, 6.4317626953125, 6.623779296875, 6.8157958984375, 7.0078125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 4.0, 14.0, 16.0, 26.0, 24.0, 43.0, 56.0, 91.0, 129.0, 218.0, 322.0, 539.0, 899.0, 1573.0, 2909.0, 5476.0, 12350.0, 32948.0, 892365.0, 63667.0, 18175.0, 7762.0, 3838.0, 2051.0, 1173.0, 661.0, 405.0, 244.0, 179.0, 131.0, 83.0, 40.0, 37.0, 38.0, 16.0, 12.0, 13.0, 2.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.69140625, -1.6380615234375, -1.584716796875, -1.5313720703125, -1.47802734375, -1.4246826171875, -1.371337890625, -1.3179931640625, -1.2646484375, -1.2113037109375, -1.157958984375, -1.1046142578125, -1.05126953125, -0.9979248046875, -0.944580078125, -0.8912353515625, -0.837890625, -0.7845458984375, -0.731201171875, -0.6778564453125, -0.62451171875, -0.5711669921875, -0.517822265625, -0.4644775390625, -0.4111328125, -0.3577880859375, -0.304443359375, -0.2510986328125, -0.19775390625, -0.1444091796875, -0.091064453125, -0.0377197265625, 0.015625, 0.0689697265625, 0.122314453125, 0.1756591796875, 0.22900390625, 0.2823486328125, 0.335693359375, 0.3890380859375, 0.4423828125, 0.4957275390625, 0.549072265625, 0.6024169921875, 0.65576171875, 0.7091064453125, 0.762451171875, 0.8157958984375, 0.869140625, 0.9224853515625, 0.975830078125, 1.0291748046875, 1.08251953125, 1.1358642578125, 1.189208984375, 1.2425537109375, 1.2958984375, 1.3492431640625, 1.402587890625, 1.4559326171875, 1.50927734375, 1.5626220703125, 1.615966796875, 1.6693115234375, 1.72265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 14.0, 18.0, 21.0, 29.0, 37.0, 44.0, 47.0, 54.0, 64.0, 59.0, 57.0, 58.0, 78.0, 56.0, 39.0, 47.0, 35.0, 29.0, 26.0, 23.0, 21.0, 12.0, 15.0, 8.0, 7.0, 3.0, 5.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.8041343688964844e-05, -4.650000482797623e-05, -4.495866596698761e-05, -4.341732710599899e-05, -4.1875988245010376e-05, -4.033464938402176e-05, -3.879331052303314e-05, -3.7251971662044525e-05, -3.571063280105591e-05, -3.416929394006729e-05, -3.2627955079078674e-05, -3.108661621809006e-05, -2.954527735710144e-05, -2.8003938496112823e-05, -2.6462599635124207e-05, -2.492126077413559e-05, -2.3379921913146973e-05, -2.1838583052158356e-05, -2.029724419116974e-05, -1.8755905330181122e-05, -1.7214566469192505e-05, -1.5673227608203888e-05, -1.4131888747215271e-05, -1.2590549886226654e-05, -1.1049211025238037e-05, -9.50787216424942e-06, -7.966533303260803e-06, -6.425194442272186e-06, -4.883855581283569e-06, -3.3425167202949524e-06, -1.8011778593063354e-06, -2.598389983177185e-07, 1.2814998626708984e-06, 2.8228387236595154e-06, 4.364177584648132e-06, 5.905516445636749e-06, 7.446855306625366e-06, 8.988194167613983e-06, 1.05295330286026e-05, 1.2070871889591217e-05, 1.3612210750579834e-05, 1.5153549611568451e-05, 1.6694888472557068e-05, 1.8236227333545685e-05, 1.9777566194534302e-05, 2.131890505552292e-05, 2.2860243916511536e-05, 2.4401582777500153e-05, 2.594292163848877e-05, 2.7484260499477386e-05, 2.9025599360466003e-05, 3.056693822145462e-05, 3.210827708244324e-05, 3.3649615943431854e-05, 3.519095480442047e-05, 3.673229366540909e-05, 3.8273632526397705e-05, 3.981497138738632e-05, 4.135631024837494e-05, 4.2897649109363556e-05, 4.443898797035217e-05, 4.598032683134079e-05, 4.752166569232941e-05, 4.9063004553318024e-05, 5.060434341430664e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 2.0, 9.0, 10.0, 17.0, 27.0, 46.0, 40.0, 73.0, 112.0, 149.0, 236.0, 333.0, 491.0, 676.0, 1048.0, 1698.0, 2533.0, 3938.0, 6196.0, 10152.0, 17297.0, 29049.0, 52089.0, 95094.0, 173293.0, 244294.0, 179787.0, 99015.0, 54012.0, 30464.0, 17699.0, 10559.0, 6479.0, 4008.0, 2544.0, 1666.0, 1089.0, 737.0, 506.0, 373.0, 240.0, 141.0, 90.0, 88.0, 43.0, 42.0, 29.0, 20.0, 9.0, 7.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.53955078125, -0.5234603881835938, -0.5073699951171875, -0.49127960205078125, -0.475189208984375, -0.45909881591796875, -0.4430084228515625, -0.42691802978515625, -0.41082763671875, -0.39473724365234375, -0.3786468505859375, -0.36255645751953125, -0.346466064453125, -0.33037567138671875, -0.3142852783203125, -0.29819488525390625, -0.2821044921875, -0.26601409912109375, -0.2499237060546875, -0.23383331298828125, -0.217742919921875, -0.20165252685546875, -0.1855621337890625, -0.16947174072265625, -0.15338134765625, -0.13729095458984375, -0.1212005615234375, -0.10511016845703125, -0.089019775390625, -0.07292938232421875, -0.0568389892578125, -0.04074859619140625, -0.024658203125, -0.00856781005859375, 0.0075225830078125, 0.02361297607421875, 0.039703369140625, 0.05579376220703125, 0.0718841552734375, 0.08797454833984375, 0.10406494140625, 0.12015533447265625, 0.1362457275390625, 0.15233612060546875, 0.168426513671875, 0.18451690673828125, 0.2006072998046875, 0.21669769287109375, 0.2327880859375, 0.24887847900390625, 0.2649688720703125, 0.28105926513671875, 0.297149658203125, 0.31324005126953125, 0.3293304443359375, 0.34542083740234375, 0.36151123046875, 0.37760162353515625, 0.3936920166015625, 0.40978240966796875, 0.425872802734375, 0.44196319580078125, 0.4580535888671875, 0.47414398193359375, 0.490234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 12.0, 7.0, 19.0, 17.0, 22.0, 30.0, 18.0, 41.0, 37.0, 56.0, 51.0, 54.0, 88.0, 65.0, 73.0, 65.0, 68.0, 44.0, 42.0, 27.0, 28.0, 23.0, 21.0, 11.0, 12.0, 15.0, 7.0, 8.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2783203125, -0.2678680419921875, -0.257415771484375, -0.2469635009765625, -0.23651123046875, -0.2260589599609375, -0.215606689453125, -0.2051544189453125, -0.1947021484375, -0.1842498779296875, -0.173797607421875, -0.1633453369140625, -0.15289306640625, -0.1424407958984375, -0.131988525390625, -0.1215362548828125, -0.111083984375, -0.1006317138671875, -0.090179443359375, -0.0797271728515625, -0.06927490234375, -0.0588226318359375, -0.048370361328125, -0.0379180908203125, -0.0274658203125, -0.0170135498046875, -0.006561279296875, 0.0038909912109375, 0.01434326171875, 0.0247955322265625, 0.035247802734375, 0.0457000732421875, 0.05615234375, 0.0666046142578125, 0.077056884765625, 0.0875091552734375, 0.09796142578125, 0.1084136962890625, 0.118865966796875, 0.1293182373046875, 0.1397705078125, 0.1502227783203125, 0.160675048828125, 0.1711273193359375, 0.18157958984375, 0.1920318603515625, 0.202484130859375, 0.2129364013671875, 0.223388671875, 0.2338409423828125, 0.244293212890625, 0.2547454833984375, 0.26519775390625, 0.2756500244140625, 0.286102294921875, 0.2965545654296875, 0.3070068359375, 0.3174591064453125, 0.327911376953125, 0.3383636474609375, 0.34881591796875, 0.3592681884765625, 0.369720458984375, 0.3801727294921875, 0.390625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 7.0, 18.0, 16.0, 26.0, 31.0, 46.0, 49.0, 48.0, 80.0, 70.0, 65.0, 74.0, 72.0, 72.0, 72.0, 52.0, 49.0, 30.0, 30.0, 19.0, 13.0, 16.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2333083152771, -5.998308181762695, -5.763307571411133, -5.52830696105957, -5.293306827545166, -5.058306694030762, -4.823306083679199, -4.588305473327637, -4.353305339813232, -4.118305206298828, -3.8833045959472656, -3.6483042240142822, -3.413303852081299, -3.1783034801483154, -2.943303108215332, -2.7083027362823486, -2.4733023643493652, -2.238301992416382, -2.0033016204833984, -1.768301248550415, -1.5333008766174316, -1.2983005046844482, -1.0633001327514648, -0.8282997608184814, -0.593299388885498, -0.35829901695251465, -0.12329864501953125, 0.11170172691345215, 0.34670209884643555, 0.581702470779419, 0.8167028427124023, 1.0517032146453857, 1.286703109741211, 1.5217034816741943, 1.7567038536071777, 1.9917042255401611, 2.2267045974731445, 2.461704969406128, 2.6967053413391113, 2.9317057132720947, 3.166706085205078, 3.4017064571380615, 3.636706829071045, 3.8717072010040283, 4.106707572937012, 4.341708183288574, 4.5767083168029785, 4.811708450317383, 5.046709060668945, 5.281709671020508, 5.516709804534912, 5.751709938049316, 5.986710548400879, 6.221711158752441, 6.456711292266846, 6.69171142578125, 6.9267120361328125, 7.161712646484375, 7.396712779998779, 7.631712913513184, 7.866713523864746, 8.101714134216309, 8.336713790893555, 8.571714401245117, 8.80671501159668]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 13.0, 19.0, 33.0, 29.0, 33.0, 24.0, 41.0, 39.0, 55.0, 38.0, 49.0, 39.0, 47.0, 40.0, 50.0, 29.0, 44.0, 35.0, 35.0, 24.0, 32.0, 32.0, 27.0, 27.0, 17.0, 20.0, 13.0, 8.0, 19.0, 7.0, 12.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.304595470428467, -4.1580305099487305, -4.011465072631836, -3.8649001121520996, -3.7183351516723633, -3.571769952774048, -3.4252047538757324, -3.278639793395996, -3.1320745944976807, -2.9855093955993652, -2.838944435119629, -2.6923792362213135, -2.545814037322998, -2.3992490768432617, -2.2526838779449463, -2.106118679046631, -1.9595537185668945, -1.8129886388778687, -1.6664235591888428, -1.5198583602905273, -1.3732932806015015, -1.2267282009124756, -1.0801630020141602, -0.9335979223251343, -0.7870328426361084, -0.6404677629470825, -0.49390262365341187, -0.3473375141620636, -0.20077240467071533, -0.05420732498168945, 0.0923578143119812, 0.23892295360565186, 0.38548755645751953, 0.5320526361465454, 0.6786177754402161, 0.8251829147338867, 0.9717479944229126, 1.1183130741119385, 1.264878273010254, 1.4114433526992798, 1.5580084323883057, 1.7045735120773315, 1.8511385917663574, 1.9977037906646729, 2.1442689895629883, 2.2908339500427246, 2.43739914894104, 2.5839643478393555, 2.730529308319092, 2.8770945072174072, 3.0236594676971436, 3.170224666595459, 3.3167896270751953, 3.4633548259735107, 3.609920024871826, 3.7564849853515625, 3.903050184249878, 4.049615383148193, 4.19618034362793, 4.342745304107666, 4.4893107414245605, 4.635875701904297, 4.782440662384033, 4.929006099700928, 5.075571060180664]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 16.0, 19.0, 31.0, 39.0, 76.0, 99.0, 154.0, 227.0, 352.0, 539.0, 796.0, 1295.0, 1919.0, 2953.0, 4726.0, 7163.0, 11233.0, 17176.0, 26680.0, 40126.0, 58488.0, 82887.0, 108401.0, 127656.0, 131114.0, 118378.0, 94883.0, 69800.0, 48561.0, 32503.0, 21137.0, 13791.0, 8782.0, 5722.0, 3807.0, 2408.0, 1656.0, 1032.0, 687.0, 424.0, 285.0, 173.0, 127.0, 77.0, 62.0, 36.0, 19.0, 15.0, 5.0, 10.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.76171875, -3.65185546875, -3.5419921875, -3.43212890625, -3.322265625, -3.21240234375, -3.1025390625, -2.99267578125, -2.8828125, -2.77294921875, -2.6630859375, -2.55322265625, -2.443359375, -2.33349609375, -2.2236328125, -2.11376953125, -2.00390625, -1.89404296875, -1.7841796875, -1.67431640625, -1.564453125, -1.45458984375, -1.3447265625, -1.23486328125, -1.125, -1.01513671875, -0.9052734375, -0.79541015625, -0.685546875, -0.57568359375, -0.4658203125, -0.35595703125, -0.24609375, -0.13623046875, -0.0263671875, 0.08349609375, 0.193359375, 0.30322265625, 0.4130859375, 0.52294921875, 0.6328125, 0.74267578125, 0.8525390625, 0.96240234375, 1.072265625, 1.18212890625, 1.2919921875, 1.40185546875, 1.51171875, 1.62158203125, 1.7314453125, 1.84130859375, 1.951171875, 2.06103515625, 2.1708984375, 2.28076171875, 2.390625, 2.50048828125, 2.6103515625, 2.72021484375, 2.830078125, 2.93994140625, 3.0498046875, 3.15966796875, 3.26953125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 10.0, 9.0, 17.0, 21.0, 18.0, 25.0, 48.0, 39.0, 34.0, 35.0, 36.0, 42.0, 35.0, 51.0, 53.0, 50.0, 41.0, 45.0, 32.0, 42.0, 32.0, 24.0, 33.0, 39.0, 23.0, 20.0, 19.0, 16.0, 13.0, 12.0, 17.0, 9.0, 7.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.2835693359375, -4.137451171875, -3.9913330078125, -3.84521484375, -3.6990966796875, -3.552978515625, -3.4068603515625, -3.2607421875, -3.1146240234375, -2.968505859375, -2.8223876953125, -2.67626953125, -2.5301513671875, -2.384033203125, -2.2379150390625, -2.091796875, -1.9456787109375, -1.799560546875, -1.6534423828125, -1.50732421875, -1.3612060546875, -1.215087890625, -1.0689697265625, -0.9228515625, -0.7767333984375, -0.630615234375, -0.4844970703125, -0.33837890625, -0.1922607421875, -0.046142578125, 0.0999755859375, 0.24609375, 0.3922119140625, 0.538330078125, 0.6844482421875, 0.83056640625, 0.9766845703125, 1.122802734375, 1.2689208984375, 1.4150390625, 1.5611572265625, 1.707275390625, 1.8533935546875, 1.99951171875, 2.1456298828125, 2.291748046875, 2.4378662109375, 2.583984375, 2.7301025390625, 2.876220703125, 3.0223388671875, 3.16845703125, 3.3145751953125, 3.460693359375, 3.6068115234375, 3.7529296875, 3.8990478515625, 4.045166015625, 4.1912841796875, 4.33740234375, 4.4835205078125, 4.629638671875, 4.7757568359375, 4.921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 7.0, 8.0, 18.0, 26.0, 33.0, 77.0, 99.0, 142.0, 220.0, 307.0, 549.0, 767.0, 1168.0, 2005.0, 3197.0, 5069.0, 8030.0, 13053.0, 21199.0, 34063.0, 54207.0, 80869.0, 113051.0, 140179.0, 147682.0, 131324.0, 100960.0, 69943.0, 45153.0, 28328.0, 17684.0, 11034.0, 6712.0, 4079.0, 2599.0, 1741.0, 1037.0, 676.0, 406.0, 306.0, 176.0, 129.0, 73.0, 54.0, 49.0, 15.0, 14.0, 12.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.83203125, -3.7203369140625, -3.608642578125, -3.4969482421875, -3.38525390625, -3.2735595703125, -3.161865234375, -3.0501708984375, -2.9384765625, -2.8267822265625, -2.715087890625, -2.6033935546875, -2.49169921875, -2.3800048828125, -2.268310546875, -2.1566162109375, -2.044921875, -1.9332275390625, -1.821533203125, -1.7098388671875, -1.59814453125, -1.4864501953125, -1.374755859375, -1.2630615234375, -1.1513671875, -1.0396728515625, -0.927978515625, -0.8162841796875, -0.70458984375, -0.5928955078125, -0.481201171875, -0.3695068359375, -0.2578125, -0.1461181640625, -0.034423828125, 0.0772705078125, 0.18896484375, 0.3006591796875, 0.412353515625, 0.5240478515625, 0.6357421875, 0.7474365234375, 0.859130859375, 0.9708251953125, 1.08251953125, 1.1942138671875, 1.305908203125, 1.4176025390625, 1.529296875, 1.6409912109375, 1.752685546875, 1.8643798828125, 1.97607421875, 2.0877685546875, 2.199462890625, 2.3111572265625, 2.4228515625, 2.5345458984375, 2.646240234375, 2.7579345703125, 2.86962890625, 2.9813232421875, 3.093017578125, 3.2047119140625, 3.31640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 6.0, 5.0, 8.0, 9.0, 17.0, 12.0, 8.0, 18.0, 20.0, 32.0, 28.0, 27.0, 45.0, 33.0, 27.0, 29.0, 35.0, 45.0, 43.0, 50.0, 36.0, 41.0, 55.0, 39.0, 44.0, 32.0, 29.0, 26.0, 31.0, 24.0, 24.0, 23.0, 15.0, 10.0, 15.0, 10.0, 7.0, 9.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.33203125, -4.212890625, -4.09375, -3.974609375, -3.85546875, -3.736328125, -3.6171875, -3.498046875, -3.37890625, -3.259765625, -3.140625, -3.021484375, -2.90234375, -2.783203125, -2.6640625, -2.544921875, -2.42578125, -2.306640625, -2.1875, -2.068359375, -1.94921875, -1.830078125, -1.7109375, -1.591796875, -1.47265625, -1.353515625, -1.234375, -1.115234375, -0.99609375, -0.876953125, -0.7578125, -0.638671875, -0.51953125, -0.400390625, -0.28125, -0.162109375, -0.04296875, 0.076171875, 0.1953125, 0.314453125, 0.43359375, 0.552734375, 0.671875, 0.791015625, 0.91015625, 1.029296875, 1.1484375, 1.267578125, 1.38671875, 1.505859375, 1.625, 1.744140625, 1.86328125, 1.982421875, 2.1015625, 2.220703125, 2.33984375, 2.458984375, 2.578125, 2.697265625, 2.81640625, 2.935546875, 3.0546875, 3.173828125, 3.29296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 17.0, 25.0, 27.0, 45.0, 72.0, 115.0, 161.0, 238.0, 433.0, 642.0, 1093.0, 1968.0, 3548.0, 7078.0, 15768.0, 40082.0, 113649.0, 311182.0, 338553.0, 133093.0, 46091.0, 17663.0, 7941.0, 3892.0, 2098.0, 1194.0, 708.0, 431.0, 267.0, 152.0, 112.0, 55.0, 39.0, 34.0, 25.0, 15.0, 11.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.0390625, -8.78131103515625, -8.5235595703125, -8.26580810546875, -8.008056640625, -7.75030517578125, -7.4925537109375, -7.23480224609375, -6.97705078125, -6.71929931640625, -6.4615478515625, -6.20379638671875, -5.946044921875, -5.68829345703125, -5.4305419921875, -5.17279052734375, -4.9150390625, -4.65728759765625, -4.3995361328125, -4.14178466796875, -3.884033203125, -3.62628173828125, -3.3685302734375, -3.11077880859375, -2.85302734375, -2.59527587890625, -2.3375244140625, -2.07977294921875, -1.822021484375, -1.56427001953125, -1.3065185546875, -1.04876708984375, -0.791015625, -0.53326416015625, -0.2755126953125, -0.01776123046875, 0.239990234375, 0.49774169921875, 0.7554931640625, 1.01324462890625, 1.27099609375, 1.52874755859375, 1.7864990234375, 2.04425048828125, 2.302001953125, 2.55975341796875, 2.8175048828125, 3.07525634765625, 3.3330078125, 3.59075927734375, 3.8485107421875, 4.10626220703125, 4.364013671875, 4.62176513671875, 4.8795166015625, 5.13726806640625, 5.39501953125, 5.65277099609375, 5.9105224609375, 6.16827392578125, 6.426025390625, 6.68377685546875, 6.9415283203125, 7.19927978515625, 7.45703125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 12.0, 8.0, 21.0, 15.0, 26.0, 31.0, 33.0, 47.0, 50.0, 54.0, 61.0, 60.0, 81.0, 68.0, 73.0, 67.0, 71.0, 52.0, 45.0, 28.0, 23.0, 22.0, 14.0, 13.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.000514984130859375, -0.0005029588937759399, -0.0004909336566925049, -0.0004789084196090698, -0.00046688318252563477, -0.0004548579454421997, -0.00044283270835876465, -0.0004308074712753296, -0.00041878223419189453, -0.00040675699710845947, -0.0003947317600250244, -0.00038270652294158936, -0.0003706812858581543, -0.00035865604877471924, -0.0003466308116912842, -0.0003346055746078491, -0.00032258033752441406, -0.000310555100440979, -0.00029852986335754395, -0.0002865046262741089, -0.00027447938919067383, -0.00026245415210723877, -0.0002504289150238037, -0.00023840367794036865, -0.0002263784408569336, -0.00021435320377349854, -0.00020232796669006348, -0.00019030272960662842, -0.00017827749252319336, -0.0001662522554397583, -0.00015422701835632324, -0.00014220178127288818, -0.00013017654418945312, -0.00011815130710601807, -0.00010612607002258301, -9.410083293914795e-05, -8.207559585571289e-05, -7.005035877227783e-05, -5.8025121688842773e-05, -4.5999884605407715e-05, -3.3974647521972656e-05, -2.1949410438537598e-05, -9.924173355102539e-06, 2.1010637283325195e-06, 1.4126300811767578e-05, 2.6151537895202637e-05, 3.8176774978637695e-05, 5.0202012062072754e-05, 6.222724914550781e-05, 7.425248622894287e-05, 8.627772331237793e-05, 9.830296039581299e-05, 0.00011032819747924805, 0.0001223534345626831, 0.00013437867164611816, 0.00014640390872955322, 0.00015842914581298828, 0.00017045438289642334, 0.0001824796199798584, 0.00019450485706329346, 0.00020653009414672852, 0.00021855533123016357, 0.00023058056831359863, 0.0002426058053970337, 0.00025463104248046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 17.0, 18.0, 23.0, 41.0, 62.0, 79.0, 117.0, 153.0, 227.0, 392.0, 591.0, 964.0, 1647.0, 3026.0, 6058.0, 13460.0, 34626.0, 99420.0, 255053.0, 342844.0, 181911.0, 64687.0, 23213.0, 9450.0, 4447.0, 2332.0, 1322.0, 811.0, 507.0, 312.0, 208.0, 149.0, 97.0, 84.0, 55.0, 48.0, 29.0, 18.0, 12.0, 10.0, 7.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0], "bins": [-7.71875, -7.506103515625, -7.29345703125, -7.080810546875, -6.8681640625, -6.655517578125, -6.44287109375, -6.230224609375, -6.017578125, -5.804931640625, -5.59228515625, -5.379638671875, -5.1669921875, -4.954345703125, -4.74169921875, -4.529052734375, -4.31640625, -4.103759765625, -3.89111328125, -3.678466796875, -3.4658203125, -3.253173828125, -3.04052734375, -2.827880859375, -2.615234375, -2.402587890625, -2.18994140625, -1.977294921875, -1.7646484375, -1.552001953125, -1.33935546875, -1.126708984375, -0.9140625, -0.701416015625, -0.48876953125, -0.276123046875, -0.0634765625, 0.149169921875, 0.36181640625, 0.574462890625, 0.787109375, 0.999755859375, 1.21240234375, 1.425048828125, 1.6376953125, 1.850341796875, 2.06298828125, 2.275634765625, 2.48828125, 2.700927734375, 2.91357421875, 3.126220703125, 3.3388671875, 3.551513671875, 3.76416015625, 3.976806640625, 4.189453125, 4.402099609375, 4.61474609375, 4.827392578125, 5.0400390625, 5.252685546875, 5.46533203125, 5.677978515625, 5.890625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 9.0, 4.0, 7.0, 4.0, 11.0, 12.0, 18.0, 25.0, 40.0, 61.0, 76.0, 108.0, 124.0, 110.0, 96.0, 82.0, 52.0, 42.0, 31.0, 18.0, 18.0, 7.0, 5.0, 6.0, 9.0, 2.0, 2.0, 1.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.99114990234375, -3.8533935546875, -3.71563720703125, -3.577880859375, -3.44012451171875, -3.3023681640625, -3.16461181640625, -3.02685546875, -2.88909912109375, -2.7513427734375, -2.61358642578125, -2.475830078125, -2.33807373046875, -2.2003173828125, -2.06256103515625, -1.9248046875, -1.78704833984375, -1.6492919921875, -1.51153564453125, -1.373779296875, -1.23602294921875, -1.0982666015625, -0.96051025390625, -0.82275390625, -0.68499755859375, -0.5472412109375, -0.40948486328125, -0.271728515625, -0.13397216796875, 0.0037841796875, 0.14154052734375, 0.279296875, 0.41705322265625, 0.5548095703125, 0.69256591796875, 0.830322265625, 0.96807861328125, 1.1058349609375, 1.24359130859375, 1.38134765625, 1.51910400390625, 1.6568603515625, 1.79461669921875, 1.932373046875, 2.07012939453125, 2.2078857421875, 2.34564208984375, 2.4833984375, 2.62115478515625, 2.7589111328125, 2.89666748046875, 3.034423828125, 3.17218017578125, 3.3099365234375, 3.44769287109375, 3.58544921875, 3.72320556640625, 3.8609619140625, 3.99871826171875, 4.136474609375, 4.27423095703125, 4.4119873046875, 4.54974365234375, 4.6875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 15.0, 9.0, 20.0, 21.0, 28.0, 22.0, 44.0, 51.0, 61.0, 61.0, 59.0, 61.0, 68.0, 77.0, 71.0, 60.0, 51.0, 47.0, 34.0, 20.0, 29.0, 17.0, 13.0, 14.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9219207763671875, -5.702857494354248, -5.48379373550415, -5.264730453491211, -5.0456671714782715, -4.826603889465332, -4.607540130615234, -4.388476848602295, -4.1694135665893555, -3.950350046157837, -3.7312867641448975, -3.512223243713379, -3.2931599617004395, -3.074096441268921, -2.8550329208374023, -2.635969638824463, -2.4169058799743652, -2.1978423595428467, -1.9787790775299072, -1.7597155570983887, -1.5406521558761597, -1.3215887546539307, -1.102525234222412, -0.8834618330001831, -0.6643984317779541, -0.4453350007534027, -0.22627156972885132, -0.007208108901977539, 0.21185529232025146, 0.43091869354248047, 0.649982213973999, 0.869045615196228, 1.088109016418457, 1.307172417640686, 1.526235818862915, 1.7452993392944336, 1.9643627405166626, 2.1834261417388916, 2.40248966217041, 2.6215529441833496, 2.840616464614868, 3.0596799850463867, 3.278743267059326, 3.4978067874908447, 3.7168703079223633, 3.9359335899353027, 4.154996871948242, 4.37406063079834, 4.593123912811279, 4.812187194824219, 5.031250953674316, 5.250314235687256, 5.469377517700195, 5.688441276550293, 5.907504558563232, 6.126567840576172, 6.3456315994262695, 6.564694881439209, 6.783758640289307, 7.002821922302246, 7.2218852043151855, 7.440948486328125, 7.660012245178223, 7.879075527191162, 8.098138809204102]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 6.0, 14.0, 14.0, 12.0, 23.0, 23.0, 23.0, 27.0, 30.0, 25.0, 29.0, 35.0, 29.0, 48.0, 23.0, 58.0, 35.0, 41.0, 46.0, 43.0, 46.0, 34.0, 32.0, 24.0, 31.0, 22.0, 26.0, 26.0, 26.0, 16.0, 16.0, 21.0, 10.0, 11.0, 12.0, 7.0, 8.0, 7.0, 4.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.201750755310059, -4.0681376457214355, -3.9345247745513916, -3.8009116649627686, -3.6672987937927246, -3.5336856842041016, -3.4000725746154785, -3.2664594650268555, -3.1328465938568115, -2.9992334842681885, -2.8656206130981445, -2.7320075035095215, -2.5983943939208984, -2.4647815227508545, -2.3311684131622314, -2.1975555419921875, -2.0639424324035645, -1.930329442024231, -1.7967164516448975, -1.6631033420562744, -1.529490351676941, -1.3958773612976074, -1.2622642517089844, -1.1286512613296509, -0.9950382709503174, -0.8614252805709839, -0.7278122305870056, -0.5941991806030273, -0.46058619022369385, -0.32697319984436035, -0.19336014986038208, -0.05974709987640381, 0.07386636734008789, 0.20747938752174377, 0.34109240770339966, 0.47470542788505554, 0.6083184480667114, 0.7419314384460449, 0.8755444884300232, 1.0091575384140015, 1.142770528793335, 1.2763835191726685, 1.409996509552002, 1.543609619140625, 1.6772226095199585, 1.810835599899292, 1.944448709487915, 2.078061580657959, 2.211674690246582, 2.345287799835205, 2.478900671005249, 2.612513780593872, 2.746126651763916, 2.879739761352539, 3.013352870941162, 3.146965980529785, 3.280578851699829, 3.414191961288452, 3.547804832458496, 3.681417942047119, 3.815031051635742, 3.948643922805786, 4.08225679397583, 4.215869903564453, 4.349483013153076]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 10.0, 12.0, 16.0, 22.0, 37.0, 59.0, 89.0, 121.0, 167.0, 238.0, 391.0, 587.0, 908.0, 1377.0, 2223.0, 3708.0, 6034.0, 10597.0, 18808.0, 35303.0, 69897.0, 148690.0, 331050.0, 717269.0, 1103106.0, 897387.0, 449642.0, 200628.0, 94093.0, 45803.0, 24388.0, 13014.0, 7266.0, 4379.0, 2643.0, 1582.0, 974.0, 599.0, 412.0, 275.0, 159.0, 113.0, 70.0, 48.0, 30.0, 18.0, 15.0, 13.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.39453125, -5.22430419921875, -5.0540771484375, -4.88385009765625, -4.713623046875, -4.54339599609375, -4.3731689453125, -4.20294189453125, -4.03271484375, -3.86248779296875, -3.6922607421875, -3.52203369140625, -3.351806640625, -3.18157958984375, -3.0113525390625, -2.84112548828125, -2.6708984375, -2.50067138671875, -2.3304443359375, -2.16021728515625, -1.989990234375, -1.81976318359375, -1.6495361328125, -1.47930908203125, -1.30908203125, -1.13885498046875, -0.9686279296875, -0.79840087890625, -0.628173828125, -0.45794677734375, -0.2877197265625, -0.11749267578125, 0.052734375, 0.22296142578125, 0.3931884765625, 0.56341552734375, 0.733642578125, 0.90386962890625, 1.0740966796875, 1.24432373046875, 1.41455078125, 1.58477783203125, 1.7550048828125, 1.92523193359375, 2.095458984375, 2.26568603515625, 2.4359130859375, 2.60614013671875, 2.7763671875, 2.94659423828125, 3.1168212890625, 3.28704833984375, 3.457275390625, 3.62750244140625, 3.7977294921875, 3.96795654296875, 4.13818359375, 4.30841064453125, 4.4786376953125, 4.64886474609375, 4.819091796875, 4.98931884765625, 5.1595458984375, 5.32977294921875, 5.5]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 11.0, 10.0, 13.0, 7.0, 14.0, 14.0, 21.0, 28.0, 27.0, 26.0, 31.0, 29.0, 35.0, 36.0, 28.0, 46.0, 29.0, 33.0, 40.0, 37.0, 36.0, 40.0, 33.0, 36.0, 29.0, 22.0, 29.0, 28.0, 30.0, 18.0, 16.0, 20.0, 16.0, 15.0, 23.0, 11.0, 14.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.49609375, -2.417938232421875, -2.33978271484375, -2.261627197265625, -2.1834716796875, -2.105316162109375, -2.02716064453125, -1.949005126953125, -1.870849609375, -1.792694091796875, -1.71453857421875, -1.636383056640625, -1.5582275390625, -1.480072021484375, -1.40191650390625, -1.323760986328125, -1.24560546875, -1.167449951171875, -1.08929443359375, -1.011138916015625, -0.9329833984375, -0.854827880859375, -0.77667236328125, -0.698516845703125, -0.620361328125, -0.542205810546875, -0.46405029296875, -0.385894775390625, -0.3077392578125, -0.229583740234375, -0.15142822265625, -0.073272705078125, 0.0048828125, 0.083038330078125, 0.16119384765625, 0.239349365234375, 0.3175048828125, 0.395660400390625, 0.47381591796875, 0.551971435546875, 0.630126953125, 0.708282470703125, 0.78643798828125, 0.864593505859375, 0.9427490234375, 1.020904541015625, 1.09906005859375, 1.177215576171875, 1.25537109375, 1.333526611328125, 1.41168212890625, 1.489837646484375, 1.5679931640625, 1.646148681640625, 1.72430419921875, 1.802459716796875, 1.880615234375, 1.958770751953125, 2.03692626953125, 2.115081787109375, 2.1932373046875, 2.271392822265625, 2.34954833984375, 2.427703857421875, 2.505859375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 12.0, 9.0, 20.0, 22.0, 38.0, 46.0, 54.0, 99.0, 161.0, 229.0, 346.0, 554.0, 899.0, 1479.0, 2338.0, 3986.0, 6904.0, 11790.0, 20967.0, 37055.0, 67625.0, 127072.0, 240662.0, 446529.0, 745203.0, 907245.0, 695983.0, 405284.0, 215979.0, 114646.0, 61573.0, 33689.0, 18992.0, 10794.0, 6277.0, 3759.0, 2219.0, 1406.0, 789.0, 553.0, 343.0, 220.0, 113.0, 98.0, 77.0, 48.0, 21.0, 14.0, 16.0, 11.0, 8.0, 9.0, 6.0, 7.0, 1.0, 4.0], "bins": [-5.015625, -4.86553955078125, -4.7154541015625, -4.56536865234375, -4.415283203125, -4.26519775390625, -4.1151123046875, -3.96502685546875, -3.81494140625, -3.66485595703125, -3.5147705078125, -3.36468505859375, -3.214599609375, -3.06451416015625, -2.9144287109375, -2.76434326171875, -2.6142578125, -2.46417236328125, -2.3140869140625, -2.16400146484375, -2.013916015625, -1.86383056640625, -1.7137451171875, -1.56365966796875, -1.41357421875, -1.26348876953125, -1.1134033203125, -0.96331787109375, -0.813232421875, -0.66314697265625, -0.5130615234375, -0.36297607421875, -0.212890625, -0.06280517578125, 0.0872802734375, 0.23736572265625, 0.387451171875, 0.53753662109375, 0.6876220703125, 0.83770751953125, 0.98779296875, 1.13787841796875, 1.2879638671875, 1.43804931640625, 1.588134765625, 1.73822021484375, 1.8883056640625, 2.03839111328125, 2.1884765625, 2.33856201171875, 2.4886474609375, 2.63873291015625, 2.788818359375, 2.93890380859375, 3.0889892578125, 3.23907470703125, 3.38916015625, 3.53924560546875, 3.6893310546875, 3.83941650390625, 3.989501953125, 4.13958740234375, 4.2896728515625, 4.43975830078125, 4.58984375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 8.0, 6.0, 4.0, 8.0, 15.0, 18.0, 18.0, 27.0, 50.0, 43.0, 51.0, 65.0, 76.0, 93.0, 90.0, 140.0, 177.0, 189.0, 201.0, 259.0, 242.0, 290.0, 265.0, 240.0, 219.0, 193.0, 201.0, 164.0, 132.0, 123.0, 101.0, 73.0, 74.0, 56.0, 44.0, 31.0, 27.0, 17.0, 18.0, 10.0, 4.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4921875, -1.444854736328125, -1.39752197265625, -1.350189208984375, -1.3028564453125, -1.255523681640625, -1.20819091796875, -1.160858154296875, -1.113525390625, -1.066192626953125, -1.01885986328125, -0.971527099609375, -0.9241943359375, -0.876861572265625, -0.82952880859375, -0.782196044921875, -0.73486328125, -0.687530517578125, -0.64019775390625, -0.592864990234375, -0.5455322265625, -0.498199462890625, -0.45086669921875, -0.403533935546875, -0.356201171875, -0.308868408203125, -0.26153564453125, -0.214202880859375, -0.1668701171875, -0.119537353515625, -0.07220458984375, -0.024871826171875, 0.0224609375, 0.069793701171875, 0.11712646484375, 0.164459228515625, 0.2117919921875, 0.259124755859375, 0.30645751953125, 0.353790283203125, 0.401123046875, 0.448455810546875, 0.49578857421875, 0.543121337890625, 0.5904541015625, 0.637786865234375, 0.68511962890625, 0.732452392578125, 0.77978515625, 0.827117919921875, 0.87445068359375, 0.921783447265625, 0.9691162109375, 1.016448974609375, 1.06378173828125, 1.111114501953125, 1.158447265625, 1.205780029296875, 1.25311279296875, 1.300445556640625, 1.3477783203125, 1.395111083984375, 1.44244384765625, 1.489776611328125, 1.537109375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 8.0, 14.0, 15.0, 27.0, 36.0, 30.0, 42.0, 55.0, 63.0, 65.0, 84.0, 81.0, 68.0, 54.0, 62.0, 52.0, 38.0, 35.0, 31.0, 29.0, 21.0, 15.0, 16.0, 15.0, 11.0, 3.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.318307876586914, -5.1266021728515625, -4.934896469116211, -4.743190765380859, -4.55148458480835, -4.359778881072998, -4.1680731773376465, -3.976367473602295, -3.7846615314483643, -3.5929558277130127, -3.401249885559082, -3.2095441818237305, -3.017838478088379, -2.8261325359344482, -2.6344268321990967, -2.442720890045166, -2.2510151863098145, -2.059309482574463, -1.8676035404205322, -1.6758978366851807, -1.4841920137405396, -1.2924861907958984, -1.1007804870605469, -0.9090746641159058, -0.7173688411712646, -0.5256630182266235, -0.3339572548866272, -0.14225149154663086, 0.049454331398010254, 0.24116015434265137, 0.43286585807800293, 0.624571681022644, 0.8162775039672852, 1.0079833269119263, 1.1996891498565674, 1.391394853591919, 1.58310067653656, 1.7748064994812012, 1.9665122032165527, 2.1582179069519043, 2.349923849105835, 2.5416295528411865, 2.733335494995117, 2.9250411987304688, 3.1167469024658203, 3.308452844619751, 3.5001585483551025, 3.691864490509033, 3.8835701942443848, 4.075275897979736, 4.266981601715088, 4.458687782287598, 4.650393486022949, 4.842099189758301, 5.033804893493652, 5.225510597229004, 5.4172163009643555, 5.608922004699707, 5.800627708435059, 5.99233341217041, 6.18403959274292, 6.3757452964782715, 6.567451000213623, 6.759156703948975, 6.950862884521484]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 2.0, 8.0, 5.0, 7.0, 19.0, 11.0, 18.0, 12.0, 20.0, 17.0, 32.0, 34.0, 19.0, 28.0, 31.0, 32.0, 42.0, 29.0, 37.0, 24.0, 45.0, 36.0, 24.0, 33.0, 36.0, 37.0, 43.0, 32.0, 34.0, 23.0, 28.0, 20.0, 21.0, 15.0, 24.0, 19.0, 11.0, 15.0, 9.0, 10.0, 12.0, 5.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.2040908336639404, -3.1065220832824707, -3.008953332901001, -2.9113845825195312, -2.8138160705566406, -2.716247320175171, -2.618678569793701, -2.5211098194122314, -2.4235410690307617, -2.325972318649292, -2.2284035682678223, -2.1308350563049316, -2.033266305923462, -1.9356975555419922, -1.8381288051605225, -1.7405600547790527, -1.642991542816162, -1.5454227924346924, -1.4478541612625122, -1.3502854108810425, -1.2527167797088623, -1.1551480293273926, -1.0575792789459229, -0.9600105881690979, -0.862441897392273, -0.764873206615448, -0.667304515838623, -0.5697357654571533, -0.47216707468032837, -0.3745983839035034, -0.2770296335220337, -0.17946094274520874, -0.08189201354980469, 0.015676692128181458, 0.1132453978061676, 0.21081411838531494, 0.3083828091621399, 0.40595149993896484, 0.5035202503204346, 0.6010889410972595, 0.6986576318740845, 0.7962263226509094, 0.8937950134277344, 0.9913637638092041, 1.0889325141906738, 1.186501145362854, 1.2840698957443237, 1.381638526916504, 1.4792072772979736, 1.5767760276794434, 1.6743446588516235, 1.7719134092330933, 1.8694820404052734, 1.9670507907867432, 2.064619541168213, 2.1621882915496826, 2.2597570419311523, 2.357325792312622, 2.454894542694092, 2.5524630546569824, 2.650031805038452, 2.747600555419922, 2.8451693058013916, 2.9427380561828613, 3.040306568145752]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 26.0, 19.0, 39.0, 73.0, 119.0, 184.0, 316.0, 499.0, 846.0, 1528.0, 2853.0, 5200.0, 9820.0, 19282.0, 39256.0, 78906.0, 152554.0, 239338.0, 225355.0, 134413.0, 68508.0, 33800.0, 16820.0, 8670.0, 4400.0, 2448.0, 1355.0, 768.0, 458.0, 257.0, 138.0, 92.0, 68.0, 50.0, 24.0, 18.0, 11.0, 13.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8952713012695312, -0.8672027587890625, -0.8391342163085938, -0.811065673828125, -0.7829971313476562, -0.7549285888671875, -0.7268600463867188, -0.69879150390625, -0.6707229614257812, -0.6426544189453125, -0.6145858764648438, -0.586517333984375, -0.5584487915039062, -0.5303802490234375, -0.5023117065429688, -0.4742431640625, -0.44617462158203125, -0.4181060791015625, -0.39003753662109375, -0.361968994140625, -0.33390045166015625, -0.3058319091796875, -0.27776336669921875, -0.24969482421875, -0.22162628173828125, -0.1935577392578125, -0.16548919677734375, -0.137420654296875, -0.10935211181640625, -0.0812835693359375, -0.05321502685546875, -0.025146484375, 0.00292205810546875, 0.0309906005859375, 0.05905914306640625, 0.087127685546875, 0.11519622802734375, 0.1432647705078125, 0.17133331298828125, 0.19940185546875, 0.22747039794921875, 0.2555389404296875, 0.28360748291015625, 0.311676025390625, 0.33974456787109375, 0.3678131103515625, 0.39588165283203125, 0.4239501953125, 0.45201873779296875, 0.4800872802734375, 0.5081558227539062, 0.536224365234375, 0.5642929077148438, 0.5923614501953125, 0.6204299926757812, 0.64849853515625, 0.6765670776367188, 0.7046356201171875, 0.7327041625976562, 0.760772705078125, 0.7888412475585938, 0.8169097900390625, 0.8449783325195312, 0.873046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 9.0, 11.0, 13.0, 17.0, 28.0, 19.0, 10.0, 23.0, 20.0, 20.0, 37.0, 40.0, 31.0, 33.0, 22.0, 32.0, 38.0, 34.0, 34.0, 40.0, 31.0, 40.0, 27.0, 34.0, 36.0, 23.0, 34.0, 23.0, 39.0, 20.0, 30.0, 23.0, 8.0, 14.0, 11.0, 16.0, 5.0, 12.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.197265625, -3.09100341796875, -2.9847412109375, -2.87847900390625, -2.772216796875, -2.66595458984375, -2.5596923828125, -2.45343017578125, -2.34716796875, -2.24090576171875, -2.1346435546875, -2.02838134765625, -1.922119140625, -1.81585693359375, -1.7095947265625, -1.60333251953125, -1.4970703125, -1.39080810546875, -1.2845458984375, -1.17828369140625, -1.072021484375, -0.96575927734375, -0.8594970703125, -0.75323486328125, -0.64697265625, -0.54071044921875, -0.4344482421875, -0.32818603515625, -0.221923828125, -0.11566162109375, -0.0093994140625, 0.09686279296875, 0.203125, 0.30938720703125, 0.4156494140625, 0.52191162109375, 0.628173828125, 0.73443603515625, 0.8406982421875, 0.94696044921875, 1.05322265625, 1.15948486328125, 1.2657470703125, 1.37200927734375, 1.478271484375, 1.58453369140625, 1.6907958984375, 1.79705810546875, 1.9033203125, 2.00958251953125, 2.1158447265625, 2.22210693359375, 2.328369140625, 2.43463134765625, 2.5408935546875, 2.64715576171875, 2.75341796875, 2.85968017578125, 2.9659423828125, 3.07220458984375, 3.178466796875, 3.28472900390625, 3.3909912109375, 3.49725341796875, 3.603515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 11.0, 13.0, 11.0, 27.0, 27.0, 41.0, 62.0, 87.0, 120.0, 204.0, 284.0, 429.0, 727.0, 1165.0, 2045.0, 4039.0, 8765.0, 21462.0, 107276.0, 835929.0, 39045.0, 13580.0, 6064.0, 2930.0, 1614.0, 955.0, 513.0, 345.0, 222.0, 142.0, 117.0, 80.0, 54.0, 32.0, 34.0, 34.0, 16.0, 11.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.708984375, -2.632171630859375, -2.55535888671875, -2.478546142578125, -2.4017333984375, -2.324920654296875, -2.24810791015625, -2.171295166015625, -2.094482421875, -2.017669677734375, -1.94085693359375, -1.864044189453125, -1.7872314453125, -1.710418701171875, -1.63360595703125, -1.556793212890625, -1.47998046875, -1.403167724609375, -1.32635498046875, -1.249542236328125, -1.1727294921875, -1.095916748046875, -1.01910400390625, -0.942291259765625, -0.865478515625, -0.788665771484375, -0.71185302734375, -0.635040283203125, -0.5582275390625, -0.481414794921875, -0.40460205078125, -0.327789306640625, -0.2509765625, -0.174163818359375, -0.09735107421875, -0.020538330078125, 0.0562744140625, 0.133087158203125, 0.20989990234375, 0.286712646484375, 0.363525390625, 0.440338134765625, 0.51715087890625, 0.593963623046875, 0.6707763671875, 0.747589111328125, 0.82440185546875, 0.901214599609375, 0.97802734375, 1.054840087890625, 1.13165283203125, 1.208465576171875, 1.2852783203125, 1.362091064453125, 1.43890380859375, 1.515716552734375, 1.592529296875, 1.669342041015625, 1.74615478515625, 1.822967529296875, 1.8997802734375, 1.976593017578125, 2.05340576171875, 2.130218505859375, 2.20703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 7.0, 6.0, 10.0, 10.0, 8.0, 17.0, 18.0, 20.0, 19.0, 24.0, 32.0, 36.0, 40.0, 42.0, 41.0, 39.0, 55.0, 49.0, 45.0, 47.0, 49.0, 50.0, 40.0, 44.0, 37.0, 36.0, 30.0, 34.0, 13.0, 20.0, 10.0, 16.0, 16.0, 11.0, 4.0, 5.0, 2.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.467315673828125, -4.33306884765625, -4.198822021484375, -4.0645751953125, -3.930328369140625, -3.79608154296875, -3.661834716796875, -3.527587890625, -3.393341064453125, -3.25909423828125, -3.124847412109375, -2.9906005859375, -2.856353759765625, -2.72210693359375, -2.587860107421875, -2.45361328125, -2.319366455078125, -2.18511962890625, -2.050872802734375, -1.9166259765625, -1.782379150390625, -1.64813232421875, -1.513885498046875, -1.379638671875, -1.245391845703125, -1.11114501953125, -0.976898193359375, -0.8426513671875, -0.708404541015625, -0.57415771484375, -0.439910888671875, -0.3056640625, -0.171417236328125, -0.03717041015625, 0.097076416015625, 0.2313232421875, 0.365570068359375, 0.49981689453125, 0.634063720703125, 0.768310546875, 0.902557373046875, 1.03680419921875, 1.171051025390625, 1.3052978515625, 1.439544677734375, 1.57379150390625, 1.708038330078125, 1.84228515625, 1.976531982421875, 2.11077880859375, 2.245025634765625, 2.3792724609375, 2.513519287109375, 2.64776611328125, 2.782012939453125, 2.916259765625, 3.050506591796875, 3.18475341796875, 3.319000244140625, 3.4532470703125, 3.587493896484375, 3.72174072265625, 3.855987548828125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 10.0, 9.0, 15.0, 24.0, 29.0, 34.0, 46.0, 76.0, 119.0, 184.0, 270.0, 432.0, 632.0, 942.0, 1477.0, 2401.0, 3956.0, 6728.0, 12622.0, 28406.0, 787769.0, 152518.0, 22975.0, 10927.0, 5982.0, 3704.0, 2201.0, 1322.0, 894.0, 617.0, 397.0, 280.0, 168.0, 117.0, 87.0, 48.0, 35.0, 32.0, 27.0, 14.0, 9.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03515625, -1.0016326904296875, -0.968109130859375, -0.9345855712890625, -0.90106201171875, -0.8675384521484375, -0.834014892578125, -0.8004913330078125, -0.7669677734375, -0.7334442138671875, -0.699920654296875, -0.6663970947265625, -0.63287353515625, -0.5993499755859375, -0.565826416015625, -0.5323028564453125, -0.498779296875, -0.4652557373046875, -0.431732177734375, -0.3982086181640625, -0.36468505859375, -0.3311614990234375, -0.297637939453125, -0.2641143798828125, -0.2305908203125, -0.1970672607421875, -0.163543701171875, -0.1300201416015625, -0.09649658203125, -0.0629730224609375, -0.029449462890625, 0.0040740966796875, 0.03759765625, 0.0711212158203125, 0.104644775390625, 0.1381683349609375, 0.17169189453125, 0.2052154541015625, 0.238739013671875, 0.2722625732421875, 0.3057861328125, 0.3393096923828125, 0.372833251953125, 0.4063568115234375, 0.43988037109375, 0.4734039306640625, 0.506927490234375, 0.5404510498046875, 0.573974609375, 0.6074981689453125, 0.641021728515625, 0.6745452880859375, 0.70806884765625, 0.7415924072265625, 0.775115966796875, 0.8086395263671875, 0.8421630859375, 0.8756866455078125, 0.909210205078125, 0.9427337646484375, 0.97625732421875, 1.0097808837890625, 1.043304443359375, 1.0768280029296875, 1.1103515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 6.0, 5.0, 6.0, 4.0, 12.0, 15.0, 24.0, 38.0, 66.0, 93.0, 110.0, 115.0, 130.0, 110.0, 95.0, 52.0, 37.0, 24.0, 14.0, 7.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.7738037109375e-05, -8.535012602806091e-05, -8.296221494674683e-05, -8.057430386543274e-05, -7.818639278411865e-05, -7.579848170280457e-05, -7.341057062149048e-05, -7.102265954017639e-05, -6.86347484588623e-05, -6.624683737754822e-05, -6.385892629623413e-05, -6.147101521492004e-05, -5.908310413360596e-05, -5.669519305229187e-05, -5.430728197097778e-05, -5.1919370889663696e-05, -4.953145980834961e-05, -4.714354872703552e-05, -4.4755637645721436e-05, -4.236772656440735e-05, -3.997981548309326e-05, -3.7591904401779175e-05, -3.520399332046509e-05, -3.2816082239151e-05, -3.0428171157836914e-05, -2.8040260076522827e-05, -2.565234899520874e-05, -2.3264437913894653e-05, -2.0876526832580566e-05, -1.848861575126648e-05, -1.6100704669952393e-05, -1.3712793588638306e-05, -1.1324882507324219e-05, -8.936971426010132e-06, -6.549060344696045e-06, -4.161149263381958e-06, -1.773238182067871e-06, 6.146728992462158e-07, 3.0025839805603027e-06, 5.39049506187439e-06, 7.778406143188477e-06, 1.0166317224502563e-05, 1.255422830581665e-05, 1.4942139387130737e-05, 1.7330050468444824e-05, 1.971796154975891e-05, 2.2105872631072998e-05, 2.4493783712387085e-05, 2.6881694793701172e-05, 2.926960587501526e-05, 3.1657516956329346e-05, 3.404542803764343e-05, 3.643333911895752e-05, 3.8821250200271606e-05, 4.120916128158569e-05, 4.359707236289978e-05, 4.598498344421387e-05, 4.8372894525527954e-05, 5.076080560684204e-05, 5.314871668815613e-05, 5.5536627769470215e-05, 5.79245388507843e-05, 6.031244993209839e-05, 6.270036101341248e-05, 6.508827209472656e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 8.0, 9.0, 14.0, 18.0, 19.0, 27.0, 50.0, 61.0, 84.0, 105.0, 184.0, 228.0, 347.0, 530.0, 720.0, 1107.0, 1709.0, 2713.0, 4352.0, 7331.0, 12446.0, 22368.0, 42006.0, 84907.0, 178772.0, 292808.0, 197128.0, 93713.0, 46410.0, 24195.0, 13353.0, 7757.0, 4615.0, 2877.0, 1828.0, 1177.0, 766.0, 532.0, 375.0, 269.0, 177.0, 120.0, 90.0, 74.0, 51.0, 42.0, 28.0, 9.0, 17.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0], "bins": [-0.356689453125, -0.34539031982421875, -0.3340911865234375, -0.32279205322265625, -0.311492919921875, -0.30019378662109375, -0.2888946533203125, -0.27759552001953125, -0.26629638671875, -0.25499725341796875, -0.2436981201171875, -0.23239898681640625, -0.221099853515625, -0.20980072021484375, -0.1985015869140625, -0.18720245361328125, -0.1759033203125, -0.16460418701171875, -0.1533050537109375, -0.14200592041015625, -0.130706787109375, -0.11940765380859375, -0.1081085205078125, -0.09680938720703125, -0.08551025390625, -0.07421112060546875, -0.0629119873046875, -0.05161285400390625, -0.040313720703125, -0.02901458740234375, -0.0177154541015625, -0.00641632080078125, 0.0048828125, 0.01618194580078125, 0.0274810791015625, 0.03878021240234375, 0.050079345703125, 0.06137847900390625, 0.0726776123046875, 0.08397674560546875, 0.09527587890625, 0.10657501220703125, 0.1178741455078125, 0.12917327880859375, 0.140472412109375, 0.15177154541015625, 0.1630706787109375, 0.17436981201171875, 0.1856689453125, 0.19696807861328125, 0.2082672119140625, 0.21956634521484375, 0.230865478515625, 0.24216461181640625, 0.2534637451171875, 0.26476287841796875, 0.27606201171875, 0.28736114501953125, 0.2986602783203125, 0.30995941162109375, 0.321258544921875, 0.33255767822265625, 0.3438568115234375, 0.35515594482421875, 0.366455078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 4.0, 5.0, 9.0, 8.0, 9.0, 7.0, 12.0, 13.0, 32.0, 21.0, 23.0, 38.0, 30.0, 56.0, 76.0, 85.0, 85.0, 89.0, 64.0, 69.0, 43.0, 34.0, 27.0, 28.0, 26.0, 28.0, 17.0, 13.0, 5.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24890899658203125, -0.2402496337890625, -0.23159027099609375, -0.222930908203125, -0.21427154541015625, -0.2056121826171875, -0.19695281982421875, -0.18829345703125, -0.17963409423828125, -0.1709747314453125, -0.16231536865234375, -0.153656005859375, -0.14499664306640625, -0.1363372802734375, -0.12767791748046875, -0.1190185546875, -0.11035919189453125, -0.1016998291015625, -0.09304046630859375, -0.084381103515625, -0.07572174072265625, -0.0670623779296875, -0.05840301513671875, -0.04974365234375, -0.04108428955078125, -0.0324249267578125, -0.02376556396484375, -0.015106201171875, -0.00644683837890625, 0.0022125244140625, 0.01087188720703125, 0.01953125, 0.02819061279296875, 0.0368499755859375, 0.04550933837890625, 0.054168701171875, 0.06282806396484375, 0.0714874267578125, 0.08014678955078125, 0.08880615234375, 0.09746551513671875, 0.1061248779296875, 0.11478424072265625, 0.123443603515625, 0.13210296630859375, 0.1407623291015625, 0.14942169189453125, 0.1580810546875, 0.16674041748046875, 0.1753997802734375, 0.18405914306640625, 0.192718505859375, 0.20137786865234375, 0.2100372314453125, 0.21869659423828125, 0.22735595703125, 0.23601531982421875, 0.2446746826171875, 0.25333404541015625, 0.261993408203125, 0.27065277099609375, 0.2793121337890625, 0.28797149658203125, 0.296630859375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 6.0, 5.0, 16.0, 14.0, 20.0, 28.0, 37.0, 32.0, 55.0, 52.0, 71.0, 84.0, 64.0, 84.0, 53.0, 65.0, 56.0, 40.0, 37.0, 39.0, 27.0, 21.0, 23.0, 10.0, 17.0, 13.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.360625743865967, -5.171506881713867, -4.982387542724609, -4.79326868057251, -4.60414981842041, -4.4150309562683105, -4.225912094116211, -4.036792755126953, -3.8476738929748535, -3.658555030822754, -3.469435930252075, -3.2803168296813965, -3.091197967529297, -2.9020791053771973, -2.7129600048065186, -2.52384090423584, -2.3347220420837402, -2.1456031799316406, -1.956484079360962, -1.7673650979995728, -1.5782461166381836, -1.3891271352767944, -1.2000081539154053, -1.0108891725540161, -0.821770191192627, -0.6326512098312378, -0.44353222846984863, -0.2544132471084595, -0.06529426574707031, 0.12382471561431885, 0.312943696975708, 0.5020626783370972, 0.6911821365356445, 0.8803011178970337, 1.0694200992584229, 1.258539080619812, 1.4476580619812012, 1.6367770433425903, 1.8258960247039795, 2.015015125274658, 2.204133987426758, 2.3932528495788574, 2.582371950149536, 2.771491050720215, 2.9606099128723145, 3.149728775024414, 3.3388478755950928, 3.5279669761657715, 3.717085838317871, 3.9062047004699707, 4.09532356262207, 4.284442901611328, 4.473561763763428, 4.662680625915527, 4.851799964904785, 5.040918827056885, 5.230037689208984, 5.419156551361084, 5.608275413513184, 5.797394752502441, 5.986513614654541, 6.175632476806641, 6.364751815795898, 6.553870677947998, 6.742989540100098]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 2.0, 8.0, 5.0, 7.0, 10.0, 12.0, 16.0, 11.0, 24.0, 20.0, 27.0, 23.0, 33.0, 31.0, 21.0, 35.0, 31.0, 31.0, 25.0, 35.0, 44.0, 32.0, 35.0, 34.0, 28.0, 37.0, 38.0, 36.0, 36.0, 34.0, 19.0, 24.0, 28.0, 19.0, 21.0, 16.0, 18.0, 12.0, 14.0, 6.0, 14.0, 10.0, 3.0, 7.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-3.0880866050720215, -2.992785692214966, -2.8974850177764893, -2.8021841049194336, -2.706883192062378, -2.6115822792053223, -2.5162816047668457, -2.42098069190979, -2.3256797790527344, -2.2303788661956787, -2.135078191757202, -2.0397772789001465, -1.9444763660430908, -1.8491755723953247, -1.7538747787475586, -1.658573865890503, -1.5632731914520264, -1.4679723978042603, -1.3726714849472046, -1.2773706912994385, -1.1820697784423828, -1.0867689847946167, -0.9914681911468506, -0.8961673378944397, -0.8008664846420288, -0.7055656313896179, -0.610264778137207, -0.5149639844894409, -0.41966313123703003, -0.32436227798461914, -0.22906148433685303, -0.13376063108444214, -0.03845977783203125, 0.056841060519218445, 0.15214189887046814, 0.24744272232055664, 0.34274357557296753, 0.4380444288253784, 0.5333452224731445, 0.6286460757255554, 0.7239469289779663, 0.8192477822303772, 0.9145486354827881, 1.0098494291305542, 1.1051502227783203, 1.200451135635376, 1.295751929283142, 1.3910527229309082, 1.4863536357879639, 1.58165442943573, 1.6769553422927856, 1.7722561359405518, 1.8675570487976074, 1.9628578424453735, 2.0581586360931396, 2.1534595489501953, 2.248760223388672, 2.3440611362457275, 2.439361810684204, 2.5346627235412598, 2.6299636363983154, 2.725264549255371, 2.8205652236938477, 2.9158661365509033, 3.011167049407959]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 0.0, 6.0, 11.0, 13.0, 22.0, 22.0, 47.0, 81.0, 110.0, 171.0, 302.0, 524.0, 936.0, 1580.0, 3029.0, 5480.0, 10103.0, 19143.0, 35976.0, 65418.0, 112024.0, 165511.0, 192244.0, 169839.0, 116472.0, 68522.0, 37525.0, 19848.0, 10635.0, 5743.0, 3177.0, 1670.0, 959.0, 541.0, 312.0, 188.0, 136.0, 87.0, 47.0, 32.0, 23.0, 13.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.2421875, -4.09857177734375, -3.9549560546875, -3.81134033203125, -3.667724609375, -3.52410888671875, -3.3804931640625, -3.23687744140625, -3.09326171875, -2.94964599609375, -2.8060302734375, -2.66241455078125, -2.518798828125, -2.37518310546875, -2.2315673828125, -2.08795166015625, -1.9443359375, -1.80072021484375, -1.6571044921875, -1.51348876953125, -1.369873046875, -1.22625732421875, -1.0826416015625, -0.93902587890625, -0.79541015625, -0.65179443359375, -0.5081787109375, -0.36456298828125, -0.220947265625, -0.07733154296875, 0.0662841796875, 0.20989990234375, 0.353515625, 0.49713134765625, 0.6407470703125, 0.78436279296875, 0.927978515625, 1.07159423828125, 1.2152099609375, 1.35882568359375, 1.50244140625, 1.64605712890625, 1.7896728515625, 1.93328857421875, 2.076904296875, 2.22052001953125, 2.3641357421875, 2.50775146484375, 2.6513671875, 2.79498291015625, 2.9385986328125, 3.08221435546875, 3.225830078125, 3.36944580078125, 3.5130615234375, 3.65667724609375, 3.80029296875, 3.94390869140625, 4.0875244140625, 4.23114013671875, 4.374755859375, 4.51837158203125, 4.6619873046875, 4.80560302734375, 4.94921875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 12.0, 7.0, 17.0, 12.0, 22.0, 19.0, 22.0, 19.0, 28.0, 37.0, 29.0, 34.0, 47.0, 46.0, 32.0, 40.0, 34.0, 34.0, 40.0, 48.0, 40.0, 42.0, 46.0, 37.0, 41.0, 24.0, 25.0, 22.0, 20.0, 20.0, 19.0, 12.0, 15.0, 9.0, 6.0, 10.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.125, -3.00823974609375, -2.8914794921875, -2.77471923828125, -2.657958984375, -2.54119873046875, -2.4244384765625, -2.30767822265625, -2.19091796875, -2.07415771484375, -1.9573974609375, -1.84063720703125, -1.723876953125, -1.60711669921875, -1.4903564453125, -1.37359619140625, -1.2568359375, -1.14007568359375, -1.0233154296875, -0.90655517578125, -0.789794921875, -0.67303466796875, -0.5562744140625, -0.43951416015625, -0.32275390625, -0.20599365234375, -0.0892333984375, 0.02752685546875, 0.144287109375, 0.26104736328125, 0.3778076171875, 0.49456787109375, 0.611328125, 0.72808837890625, 0.8448486328125, 0.96160888671875, 1.078369140625, 1.19512939453125, 1.3118896484375, 1.42864990234375, 1.54541015625, 1.66217041015625, 1.7789306640625, 1.89569091796875, 2.012451171875, 2.12921142578125, 2.2459716796875, 2.36273193359375, 2.4794921875, 2.59625244140625, 2.7130126953125, 2.82977294921875, 2.946533203125, 3.06329345703125, 3.1800537109375, 3.29681396484375, 3.41357421875, 3.53033447265625, 3.6470947265625, 3.76385498046875, 3.880615234375, 3.99737548828125, 4.1141357421875, 4.23089599609375, 4.34765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 12.0, 13.0, 22.0, 35.0, 35.0, 68.0, 101.0, 170.0, 219.0, 366.0, 573.0, 858.0, 1310.0, 2150.0, 3342.0, 5456.0, 8890.0, 15337.0, 26202.0, 44065.0, 72350.0, 110534.0, 149037.0, 166005.0, 149346.0, 110605.0, 72066.0, 43999.0, 26066.0, 15193.0, 9332.0, 5405.0, 3574.0, 2133.0, 1273.0, 851.0, 529.0, 320.0, 246.0, 146.0, 91.0, 65.0, 40.0, 43.0, 24.0, 15.0, 15.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.521270751953125, -3.40582275390625, -3.290374755859375, -3.1749267578125, -3.059478759765625, -2.94403076171875, -2.828582763671875, -2.713134765625, -2.597686767578125, -2.48223876953125, -2.366790771484375, -2.2513427734375, -2.135894775390625, -2.02044677734375, -1.904998779296875, -1.78955078125, -1.674102783203125, -1.55865478515625, -1.443206787109375, -1.3277587890625, -1.212310791015625, -1.09686279296875, -0.981414794921875, -0.865966796875, -0.750518798828125, -0.63507080078125, -0.519622802734375, -0.4041748046875, -0.288726806640625, -0.17327880859375, -0.057830810546875, 0.0576171875, 0.173065185546875, 0.28851318359375, 0.403961181640625, 0.5194091796875, 0.634857177734375, 0.75030517578125, 0.865753173828125, 0.981201171875, 1.096649169921875, 1.21209716796875, 1.327545166015625, 1.4429931640625, 1.558441162109375, 1.67388916015625, 1.789337158203125, 1.90478515625, 2.020233154296875, 2.13568115234375, 2.251129150390625, 2.3665771484375, 2.482025146484375, 2.59747314453125, 2.712921142578125, 2.828369140625, 2.943817138671875, 3.05926513671875, 3.174713134765625, 3.2901611328125, 3.405609130859375, 3.52105712890625, 3.636505126953125, 3.751953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 14.0, 13.0, 8.0, 15.0, 16.0, 24.0, 13.0, 26.0, 29.0, 23.0, 25.0, 31.0, 26.0, 36.0, 41.0, 41.0, 37.0, 35.0, 36.0, 47.0, 37.0, 37.0, 38.0, 35.0, 37.0, 37.0, 34.0, 27.0, 26.0, 31.0, 20.0, 16.0, 15.0, 7.0, 16.0, 13.0, 10.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.383148193359375, -2.30340576171875, -2.223663330078125, -2.1439208984375, -2.064178466796875, -1.98443603515625, -1.904693603515625, -1.824951171875, -1.745208740234375, -1.66546630859375, -1.585723876953125, -1.5059814453125, -1.426239013671875, -1.34649658203125, -1.266754150390625, -1.18701171875, -1.107269287109375, -1.02752685546875, -0.947784423828125, -0.8680419921875, -0.788299560546875, -0.70855712890625, -0.628814697265625, -0.549072265625, -0.469329833984375, -0.38958740234375, -0.309844970703125, -0.2301025390625, -0.150360107421875, -0.07061767578125, 0.009124755859375, 0.0888671875, 0.168609619140625, 0.24835205078125, 0.328094482421875, 0.4078369140625, 0.487579345703125, 0.56732177734375, 0.647064208984375, 0.726806640625, 0.806549072265625, 0.88629150390625, 0.966033935546875, 1.0457763671875, 1.125518798828125, 1.20526123046875, 1.285003662109375, 1.36474609375, 1.444488525390625, 1.52423095703125, 1.603973388671875, 1.6837158203125, 1.763458251953125, 1.84320068359375, 1.922943115234375, 2.002685546875, 2.082427978515625, 2.16217041015625, 2.241912841796875, 2.3216552734375, 2.401397705078125, 2.48114013671875, 2.560882568359375, 2.640625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 10.0, 12.0, 5.0, 16.0, 27.0, 38.0, 49.0, 108.0, 120.0, 193.0, 252.0, 409.0, 656.0, 1085.0, 1909.0, 3168.0, 5830.0, 11121.0, 23458.0, 49758.0, 105314.0, 203392.0, 265370.0, 190279.0, 96457.0, 44835.0, 21162.0, 10466.0, 5481.0, 3107.0, 1652.0, 998.0, 633.0, 388.0, 275.0, 169.0, 120.0, 71.0, 42.0, 33.0, 23.0, 16.0, 12.0, 16.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.748046875, -3.624908447265625, -3.50177001953125, -3.378631591796875, -3.2554931640625, -3.132354736328125, -3.00921630859375, -2.886077880859375, -2.762939453125, -2.639801025390625, -2.51666259765625, -2.393524169921875, -2.2703857421875, -2.147247314453125, -2.02410888671875, -1.900970458984375, -1.77783203125, -1.654693603515625, -1.53155517578125, -1.408416748046875, -1.2852783203125, -1.162139892578125, -1.03900146484375, -0.915863037109375, -0.792724609375, -0.669586181640625, -0.54644775390625, -0.423309326171875, -0.3001708984375, -0.177032470703125, -0.05389404296875, 0.069244384765625, 0.1923828125, 0.315521240234375, 0.43865966796875, 0.561798095703125, 0.6849365234375, 0.808074951171875, 0.93121337890625, 1.054351806640625, 1.177490234375, 1.300628662109375, 1.42376708984375, 1.546905517578125, 1.6700439453125, 1.793182373046875, 1.91632080078125, 2.039459228515625, 2.16259765625, 2.285736083984375, 2.40887451171875, 2.532012939453125, 2.6551513671875, 2.778289794921875, 2.90142822265625, 3.024566650390625, 3.147705078125, 3.270843505859375, 3.39398193359375, 3.517120361328125, 3.6402587890625, 3.763397216796875, 3.88653564453125, 4.009674072265625, 4.1328125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 4.0, 12.0, 13.0, 12.0, 17.0, 15.0, 26.0, 22.0, 25.0, 34.0, 35.0, 47.0, 36.0, 57.0, 58.0, 52.0, 47.0, 72.0, 48.0, 60.0, 47.0, 33.0, 46.0, 34.0, 23.0, 23.0, 22.0, 12.0, 16.0, 5.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.000209808349609375, -0.00020260736346244812, -0.00019540637731552124, -0.00018820539116859436, -0.00018100440502166748, -0.0001738034188747406, -0.00016660243272781372, -0.00015940144658088684, -0.00015220046043395996, -0.00014499947428703308, -0.0001377984881401062, -0.00013059750199317932, -0.00012339651584625244, -0.00011619552969932556, -0.00010899454355239868, -0.0001017935574054718, -9.459257125854492e-05, -8.739158511161804e-05, -8.019059896469116e-05, -7.298961281776428e-05, -6.57886266708374e-05, -5.858764052391052e-05, -5.138665437698364e-05, -4.418566823005676e-05, -3.698468208312988e-05, -2.9783695936203003e-05, -2.2582709789276123e-05, -1.5381723642349243e-05, -8.180737495422363e-06, -9.797513484954834e-07, 6.2212347984313965e-06, 1.3422220945358276e-05, 2.0623207092285156e-05, 2.7824193239212036e-05, 3.5025179386138916e-05, 4.2226165533065796e-05, 4.9427151679992676e-05, 5.6628137826919556e-05, 6.382912397384644e-05, 7.103011012077332e-05, 7.82310962677002e-05, 8.543208241462708e-05, 9.263306856155396e-05, 9.983405470848083e-05, 0.00010703504085540771, 0.0001142360270023346, 0.00012143701314926147, 0.00012863799929618835, 0.00013583898544311523, 0.00014303997159004211, 0.000150240957736969, 0.00015744194388389587, 0.00016464293003082275, 0.00017184391617774963, 0.00017904490232467651, 0.0001862458884716034, 0.00019344687461853027, 0.00020064786076545715, 0.00020784884691238403, 0.0002150498330593109, 0.0002222508192062378, 0.00022945180535316467, 0.00023665279150009155, 0.00024385377764701843, 0.0002510547637939453]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 14.0, 23.0, 34.0, 46.0, 46.0, 68.0, 98.0, 123.0, 197.0, 267.0, 379.0, 616.0, 872.0, 1345.0, 2105.0, 3591.0, 6139.0, 10970.0, 20373.0, 39507.0, 76686.0, 140605.0, 213647.0, 216364.0, 145298.0, 79573.0, 40885.0, 21268.0, 11206.0, 6129.0, 3663.0, 2136.0, 1379.0, 905.0, 598.0, 435.0, 286.0, 173.0, 127.0, 98.0, 69.0, 56.0, 38.0, 34.0, 20.0, 15.0, 11.0, 12.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.771697998046875, -2.67620849609375, -2.580718994140625, -2.4852294921875, -2.389739990234375, -2.29425048828125, -2.198760986328125, -2.103271484375, -2.007781982421875, -1.91229248046875, -1.816802978515625, -1.7213134765625, -1.625823974609375, -1.53033447265625, -1.434844970703125, -1.33935546875, -1.243865966796875, -1.14837646484375, -1.052886962890625, -0.9573974609375, -0.861907958984375, -0.76641845703125, -0.670928955078125, -0.575439453125, -0.479949951171875, -0.38446044921875, -0.288970947265625, -0.1934814453125, -0.097991943359375, -0.00250244140625, 0.092987060546875, 0.1884765625, 0.283966064453125, 0.37945556640625, 0.474945068359375, 0.5704345703125, 0.665924072265625, 0.76141357421875, 0.856903076171875, 0.952392578125, 1.047882080078125, 1.14337158203125, 1.238861083984375, 1.3343505859375, 1.429840087890625, 1.52532958984375, 1.620819091796875, 1.71630859375, 1.811798095703125, 1.90728759765625, 2.002777099609375, 2.0982666015625, 2.193756103515625, 2.28924560546875, 2.384735107421875, 2.480224609375, 2.575714111328125, 2.67120361328125, 2.766693115234375, 2.8621826171875, 2.957672119140625, 3.05316162109375, 3.148651123046875, 3.244140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 17.0, 16.0, 25.0, 43.0, 41.0, 50.0, 74.0, 85.0, 90.0, 99.0, 94.0, 75.0, 64.0, 61.0, 45.0, 25.0, 18.0, 16.0, 8.0, 9.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8076171875, -1.753326416015625, -1.69903564453125, -1.644744873046875, -1.5904541015625, -1.536163330078125, -1.48187255859375, -1.427581787109375, -1.373291015625, -1.319000244140625, -1.26470947265625, -1.210418701171875, -1.1561279296875, -1.101837158203125, -1.04754638671875, -0.993255615234375, -0.93896484375, -0.884674072265625, -0.83038330078125, -0.776092529296875, -0.7218017578125, -0.667510986328125, -0.61322021484375, -0.558929443359375, -0.504638671875, -0.450347900390625, -0.39605712890625, -0.341766357421875, -0.2874755859375, -0.233184814453125, -0.17889404296875, -0.124603271484375, -0.0703125, -0.016021728515625, 0.03826904296875, 0.092559814453125, 0.1468505859375, 0.201141357421875, 0.25543212890625, 0.309722900390625, 0.364013671875, 0.418304443359375, 0.47259521484375, 0.526885986328125, 0.5811767578125, 0.635467529296875, 0.68975830078125, 0.744049072265625, 0.79833984375, 0.852630615234375, 0.90692138671875, 0.961212158203125, 1.0155029296875, 1.069793701171875, 1.12408447265625, 1.178375244140625, 1.232666015625, 1.286956787109375, 1.34124755859375, 1.395538330078125, 1.4498291015625, 1.504119873046875, 1.55841064453125, 1.612701416015625, 1.6669921875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 14.0, 14.0, 21.0, 27.0, 34.0, 46.0, 47.0, 60.0, 64.0, 66.0, 64.0, 76.0, 76.0, 72.0, 48.0, 38.0, 39.0, 39.0, 21.0, 20.0, 18.0, 15.0, 12.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.441328048706055, -5.262688636779785, -5.084048748016357, -4.905409336090088, -4.72676944732666, -4.548130035400391, -4.369490623474121, -4.190850734710693, -4.012210845947266, -3.833571195602417, -3.6549315452575684, -3.476292133331299, -3.297652244567871, -3.1190128326416016, -2.940373182296753, -2.7617335319519043, -2.5830941200256348, -2.404454469680786, -2.2258148193359375, -2.047175407409668, -1.8685356378555298, -1.6898959875106812, -1.511256456375122, -1.3326168060302734, -1.1539771556854248, -0.9753375053405762, -0.7966979146003723, -0.6180583238601685, -0.4394186735153198, -0.2607790231704712, -0.08213949203491211, 0.09650015830993652, 0.27513980865478516, 0.4537794291973114, 0.6324190497398376, 0.8110586404800415, 0.9896982908248901, 1.1683379411697388, 1.3469774723052979, 1.5256171226501465, 1.7042567729949951, 1.8828964233398438, 2.0615360736846924, 2.240175724029541, 2.4188151359558105, 2.5974550247192383, 2.776094436645508, 2.9547340869903564, 3.133373737335205, 3.3120133876800537, 3.4906530380249023, 3.669292449951172, 3.8479323387145996, 4.026571750640869, 4.205211639404297, 4.383851051330566, 4.562490463256836, 4.7411298751831055, 4.919769763946533, 5.098409175872803, 5.2770490646362305, 5.4556884765625, 5.6343278884887695, 5.812967777252197, 5.991607666015625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 10.0, 8.0, 15.0, 12.0, 11.0, 20.0, 23.0, 22.0, 17.0, 26.0, 35.0, 29.0, 32.0, 32.0, 40.0, 42.0, 36.0, 40.0, 39.0, 37.0, 45.0, 35.0, 53.0, 26.0, 33.0, 35.0, 27.0, 31.0, 20.0, 21.0, 23.0, 20.0, 12.0, 9.0, 10.0, 14.0, 14.0, 10.0, 3.0, 0.0, 8.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904827833175659, -2.800170660018921, -2.6955134868621826, -2.5908563137054443, -2.486199378967285, -2.381542205810547, -2.2768850326538086, -2.1722278594970703, -2.067570686340332, -1.9629135131835938, -1.8582563400268555, -1.7535992860794067, -1.6489421129226685, -1.5442849397659302, -1.4396278858184814, -1.3349707126617432, -1.2303135395050049, -1.1256563663482666, -1.0209991931915283, -0.9163421392440796, -0.8116849660873413, -0.707027792930603, -0.6023706793785095, -0.497713565826416, -0.39305639266967773, -0.28839924931526184, -0.18374210596084595, -0.07908496260643005, 0.02557218074798584, 0.13022935390472412, 0.23488646745681763, 0.33954358100891113, 0.4442005157470703, 0.5488576889038086, 0.6535148024559021, 0.7581719160079956, 0.8628290891647339, 0.9674862623214722, 1.072143316268921, 1.1768004894256592, 1.2814576625823975, 1.3861148357391357, 1.490772008895874, 1.5954290628433228, 1.700086236000061, 1.8047434091567993, 1.909400463104248, 2.0140576362609863, 2.1187148094177246, 2.223371982574463, 2.328029155731201, 2.4326863288879395, 2.5373435020446777, 2.642000675201416, 2.746657609939575, 2.8513147830963135, 2.9559719562530518, 3.06062912940979, 3.1652863025665283, 3.2699434757232666, 3.374600410461426, 3.479257583618164, 3.5839147567749023, 3.6885719299316406, 3.793229103088379]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 9.0, 6.0, 11.0, 21.0, 31.0, 40.0, 62.0, 97.0, 137.0, 206.0, 341.0, 536.0, 857.0, 1391.0, 2189.0, 3936.0, 6655.0, 11866.0, 21978.0, 42679.0, 89275.0, 207019.0, 517130.0, 1103335.0, 1172823.0, 581934.0, 230019.0, 99202.0, 46537.0, 23532.0, 12924.0, 6989.0, 4121.0, 2376.0, 1473.0, 943.0, 556.0, 351.0, 249.0, 146.0, 94.0, 69.0, 46.0, 36.0, 25.0, 12.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.3203125, -5.1490478515625, -4.977783203125, -4.8065185546875, -4.63525390625, -4.4639892578125, -4.292724609375, -4.1214599609375, -3.9501953125, -3.7789306640625, -3.607666015625, -3.4364013671875, -3.26513671875, -3.0938720703125, -2.922607421875, -2.7513427734375, -2.580078125, -2.4088134765625, -2.237548828125, -2.0662841796875, -1.89501953125, -1.7237548828125, -1.552490234375, -1.3812255859375, -1.2099609375, -1.0386962890625, -0.867431640625, -0.6961669921875, -0.52490234375, -0.3536376953125, -0.182373046875, -0.0111083984375, 0.16015625, 0.3314208984375, 0.502685546875, 0.6739501953125, 0.84521484375, 1.0164794921875, 1.187744140625, 1.3590087890625, 1.5302734375, 1.7015380859375, 1.872802734375, 2.0440673828125, 2.21533203125, 2.3865966796875, 2.557861328125, 2.7291259765625, 2.900390625, 3.0716552734375, 3.242919921875, 3.4141845703125, 3.58544921875, 3.7567138671875, 3.927978515625, 4.0992431640625, 4.2705078125, 4.4417724609375, 4.613037109375, 4.7843017578125, 4.95556640625, 5.1268310546875, 5.298095703125, 5.4693603515625, 5.640625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 11.0, 9.0, 7.0, 5.0, 14.0, 10.0, 14.0, 15.0, 16.0, 23.0, 20.0, 22.0, 24.0, 21.0, 37.0, 40.0, 40.0, 40.0, 41.0, 38.0, 30.0, 47.0, 33.0, 39.0, 37.0, 28.0, 32.0, 31.0, 36.0, 36.0, 29.0, 22.0, 20.0, 10.0, 15.0, 21.0, 8.0, 15.0, 13.0, 14.0, 7.0, 7.0, 5.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-2.22265625, -2.15447998046875, -2.0863037109375, -2.01812744140625, -1.949951171875, -1.88177490234375, -1.8135986328125, -1.74542236328125, -1.67724609375, -1.60906982421875, -1.5408935546875, -1.47271728515625, -1.404541015625, -1.33636474609375, -1.2681884765625, -1.20001220703125, -1.1318359375, -1.06365966796875, -0.9954833984375, -0.92730712890625, -0.859130859375, -0.79095458984375, -0.7227783203125, -0.65460205078125, -0.58642578125, -0.51824951171875, -0.4500732421875, -0.38189697265625, -0.313720703125, -0.24554443359375, -0.1773681640625, -0.10919189453125, -0.041015625, 0.02716064453125, 0.0953369140625, 0.16351318359375, 0.231689453125, 0.29986572265625, 0.3680419921875, 0.43621826171875, 0.50439453125, 0.57257080078125, 0.6407470703125, 0.70892333984375, 0.777099609375, 0.84527587890625, 0.9134521484375, 0.98162841796875, 1.0498046875, 1.11798095703125, 1.1861572265625, 1.25433349609375, 1.322509765625, 1.39068603515625, 1.4588623046875, 1.52703857421875, 1.59521484375, 1.66339111328125, 1.7315673828125, 1.79974365234375, 1.867919921875, 1.93609619140625, 2.0042724609375, 2.07244873046875, 2.140625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 8.0, 18.0, 20.0, 32.0, 51.0, 79.0, 128.0, 211.0, 337.0, 564.0, 1051.0, 1738.0, 3279.0, 5726.0, 10712.0, 20277.0, 39524.0, 79682.0, 166347.0, 351410.0, 713747.0, 1077336.0, 858196.0, 446810.0, 211612.0, 100617.0, 50009.0, 25007.0, 13425.0, 7092.0, 3897.0, 2150.0, 1273.0, 757.0, 438.0, 259.0, 170.0, 112.0, 60.0, 45.0, 24.0, 14.0, 11.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.734375, -4.57476806640625, -4.4151611328125, -4.25555419921875, -4.095947265625, -3.93634033203125, -3.7767333984375, -3.61712646484375, -3.45751953125, -3.29791259765625, -3.1383056640625, -2.97869873046875, -2.819091796875, -2.65948486328125, -2.4998779296875, -2.34027099609375, -2.1806640625, -2.02105712890625, -1.8614501953125, -1.70184326171875, -1.542236328125, -1.38262939453125, -1.2230224609375, -1.06341552734375, -0.90380859375, -0.74420166015625, -0.5845947265625, -0.42498779296875, -0.265380859375, -0.10577392578125, 0.0538330078125, 0.21343994140625, 0.373046875, 0.53265380859375, 0.6922607421875, 0.85186767578125, 1.011474609375, 1.17108154296875, 1.3306884765625, 1.49029541015625, 1.64990234375, 1.80950927734375, 1.9691162109375, 2.12872314453125, 2.288330078125, 2.44793701171875, 2.6075439453125, 2.76715087890625, 2.9267578125, 3.08636474609375, 3.2459716796875, 3.40557861328125, 3.565185546875, 3.72479248046875, 3.8843994140625, 4.04400634765625, 4.20361328125, 4.36322021484375, 4.5228271484375, 4.68243408203125, 4.842041015625, 5.00164794921875, 5.1612548828125, 5.32086181640625, 5.48046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 1.0, 4.0, 9.0, 12.0, 14.0, 18.0, 24.0, 38.0, 33.0, 37.0, 61.0, 63.0, 70.0, 79.0, 109.0, 173.0, 156.0, 162.0, 196.0, 217.0, 241.0, 272.0, 247.0, 247.0, 236.0, 214.0, 155.0, 180.0, 138.0, 109.0, 117.0, 91.0, 75.0, 70.0, 49.0, 34.0, 25.0, 28.0, 23.0, 11.0, 9.0, 5.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2294921875, -1.189666748046875, -1.14984130859375, -1.110015869140625, -1.0701904296875, -1.030364990234375, -0.99053955078125, -0.950714111328125, -0.910888671875, -0.871063232421875, -0.83123779296875, -0.791412353515625, -0.7515869140625, -0.711761474609375, -0.67193603515625, -0.632110595703125, -0.59228515625, -0.552459716796875, -0.51263427734375, -0.472808837890625, -0.4329833984375, -0.393157958984375, -0.35333251953125, -0.313507080078125, -0.273681640625, -0.233856201171875, -0.19403076171875, -0.154205322265625, -0.1143798828125, -0.074554443359375, -0.03472900390625, 0.005096435546875, 0.044921875, 0.084747314453125, 0.12457275390625, 0.164398193359375, 0.2042236328125, 0.244049072265625, 0.28387451171875, 0.323699951171875, 0.363525390625, 0.403350830078125, 0.44317626953125, 0.483001708984375, 0.5228271484375, 0.562652587890625, 0.60247802734375, 0.642303466796875, 0.68212890625, 0.721954345703125, 0.76177978515625, 0.801605224609375, 0.8414306640625, 0.881256103515625, 0.92108154296875, 0.960906982421875, 1.000732421875, 1.040557861328125, 1.08038330078125, 1.120208740234375, 1.1600341796875, 1.199859619140625, 1.23968505859375, 1.279510498046875, 1.3193359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 11.0, 3.0, 7.0, 9.0, 13.0, 20.0, 10.0, 20.0, 25.0, 37.0, 51.0, 57.0, 63.0, 54.0, 68.0, 65.0, 71.0, 57.0, 64.0, 60.0, 51.0, 33.0, 37.0, 24.0, 23.0, 16.0, 13.0, 7.0, 14.0, 5.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.061370372772217, -4.901939868927002, -4.742508888244629, -4.583078384399414, -4.423647880554199, -4.264216899871826, -4.104786396026611, -3.9453556537628174, -3.7859249114990234, -3.6264941692352295, -3.4670634269714355, -3.3076329231262207, -3.1482021808624268, -2.988771438598633, -2.829340934753418, -2.669910192489624, -2.51047945022583, -2.351048707962036, -2.191617965698242, -2.0321874618530273, -1.8727567195892334, -1.7133259773254395, -1.553895354270935, -1.3944647312164307, -1.2350339889526367, -1.0756032466888428, -0.9161726236343384, -0.7567419409751892, -0.59731125831604, -0.43788057565689087, -0.2784498929977417, -0.1190192699432373, 0.040411949157714844, 0.199842631816864, 0.3592733144760132, 0.5187039971351624, 0.6781346797943115, 0.8375653624534607, 0.9969960451126099, 1.1564266681671143, 1.3158574104309082, 1.4752881526947021, 1.6347187757492065, 1.794149398803711, 1.9535801410675049, 2.113010883331299, 2.2724413871765137, 2.4318721294403076, 2.5913028717041016, 2.7507336139678955, 2.9101643562316895, 3.0695948600769043, 3.2290256023406982, 3.388456344604492, 3.547886848449707, 3.707317590713501, 3.866748332977295, 4.02617883682251, 4.185609817504883, 4.345040321350098, 4.5044708251953125, 4.6639018058776855, 4.8233323097229, 4.982763290405273, 5.142193794250488]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 3.0, 7.0, 10.0, 7.0, 9.0, 12.0, 10.0, 16.0, 16.0, 26.0, 21.0, 22.0, 37.0, 30.0, 38.0, 39.0, 40.0, 37.0, 42.0, 53.0, 47.0, 44.0, 35.0, 43.0, 34.0, 36.0, 27.0, 25.0, 29.0, 24.0, 29.0, 31.0, 18.0, 23.0, 10.0, 11.0, 12.0, 11.0, 5.0, 10.0, 6.0, 1.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.797964096069336, -2.7095541954040527, -2.6211440563201904, -2.5327341556549072, -2.444324254989624, -2.3559141159057617, -2.2675042152404785, -2.1790943145751953, -2.090684413909912, -2.002274513244629, -1.9138644933700562, -1.8254544734954834, -1.7370445728302002, -1.6486345529556274, -1.5602245330810547, -1.4718146324157715, -1.3834044933319092, -1.2949944734573364, -1.2065845727920532, -1.1181745529174805, -1.0297646522521973, -0.9413546323776245, -0.8529446125030518, -0.7645346522331238, -0.6761246919631958, -0.5877147316932678, -0.49930474162101746, -0.4108947515487671, -0.3224847912788391, -0.23407483100891113, -0.14566481113433838, -0.0572548508644104, 0.031154870986938477, 0.11956484615802765, 0.20797482132911682, 0.2963848114013672, 0.38479477167129517, 0.47320473194122314, 0.5616147518157959, 0.6500247120857239, 0.7384346723556519, 0.8268446326255798, 0.9152545928955078, 1.0036646127700806, 1.0920746326446533, 1.1804845333099365, 1.2688945531845093, 1.357304573059082, 1.4457144737243652, 1.534124493598938, 1.6225343942642212, 1.710944414138794, 1.7993543148040771, 1.88776433467865, 1.9761743545532227, 2.064584255218506, 2.152994155883789, 2.2414040565490723, 2.3298141956329346, 2.4182240962982178, 2.506633996963501, 2.5950441360473633, 2.6834540367126465, 2.7718639373779297, 2.860274076461792]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 6.0, 15.0, 10.0, 24.0, 33.0, 40.0, 66.0, 110.0, 115.0, 186.0, 304.0, 402.0, 661.0, 1115.0, 1875.0, 3256.0, 5748.0, 10559.0, 19136.0, 36249.0, 67235.0, 120252.0, 187913.0, 214364.0, 164789.0, 97413.0, 53224.0, 28442.0, 15235.0, 8216.0, 4639.0, 2619.0, 1650.0, 906.0, 567.0, 341.0, 240.0, 169.0, 126.0, 68.0, 71.0, 50.0, 26.0, 19.0, 12.0, 15.0, 7.0, 5.0, 2.0, 10.0, 5.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.52783203125, -0.5114974975585938, -0.4951629638671875, -0.47882843017578125, -0.462493896484375, -0.44615936279296875, -0.4298248291015625, -0.41349029541015625, -0.39715576171875, -0.38082122802734375, -0.3644866943359375, -0.34815216064453125, -0.331817626953125, -0.31548309326171875, -0.2991485595703125, -0.28281402587890625, -0.2664794921875, -0.25014495849609375, -0.2338104248046875, -0.21747589111328125, -0.201141357421875, -0.18480682373046875, -0.1684722900390625, -0.15213775634765625, -0.13580322265625, -0.11946868896484375, -0.1031341552734375, -0.08679962158203125, -0.070465087890625, -0.05413055419921875, -0.0377960205078125, -0.02146148681640625, -0.005126953125, 0.01120758056640625, 0.0275421142578125, 0.04387664794921875, 0.060211181640625, 0.07654571533203125, 0.0928802490234375, 0.10921478271484375, 0.12554931640625, 0.14188385009765625, 0.1582183837890625, 0.17455291748046875, 0.190887451171875, 0.20722198486328125, 0.2235565185546875, 0.23989105224609375, 0.2562255859375, 0.27256011962890625, 0.2888946533203125, 0.30522918701171875, 0.321563720703125, 0.33789825439453125, 0.3542327880859375, 0.37056732177734375, 0.38690185546875, 0.40323638916015625, 0.4195709228515625, 0.43590545654296875, 0.452239990234375, 0.46857452392578125, 0.4849090576171875, 0.5012435913085938, 0.517578125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 9.0, 9.0, 11.0, 16.0, 13.0, 15.0, 23.0, 23.0, 30.0, 21.0, 35.0, 40.0, 39.0, 41.0, 36.0, 45.0, 54.0, 54.0, 36.0, 42.0, 40.0, 50.0, 29.0, 43.0, 29.0, 39.0, 27.0, 23.0, 16.0, 15.0, 17.0, 16.0, 9.0, 12.0, 11.0, 4.0, 6.0, 5.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.9840087890625, -2.880126953125, -2.7762451171875, -2.67236328125, -2.5684814453125, -2.464599609375, -2.3607177734375, -2.2568359375, -2.1529541015625, -2.049072265625, -1.9451904296875, -1.84130859375, -1.7374267578125, -1.633544921875, -1.5296630859375, -1.42578125, -1.3218994140625, -1.218017578125, -1.1141357421875, -1.01025390625, -0.9063720703125, -0.802490234375, -0.6986083984375, -0.5947265625, -0.4908447265625, -0.386962890625, -0.2830810546875, -0.17919921875, -0.0753173828125, 0.028564453125, 0.1324462890625, 0.236328125, 0.3402099609375, 0.444091796875, 0.5479736328125, 0.65185546875, 0.7557373046875, 0.859619140625, 0.9635009765625, 1.0673828125, 1.1712646484375, 1.275146484375, 1.3790283203125, 1.48291015625, 1.5867919921875, 1.690673828125, 1.7945556640625, 1.8984375, 2.0023193359375, 2.106201171875, 2.2100830078125, 2.31396484375, 2.4178466796875, 2.521728515625, 2.6256103515625, 2.7294921875, 2.8333740234375, 2.937255859375, 3.0411376953125, 3.14501953125, 3.2489013671875, 3.352783203125, 3.4566650390625, 3.560546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 12.0, 16.0, 24.0, 16.0, 28.0, 40.0, 43.0, 54.0, 82.0, 113.0, 166.0, 216.0, 278.0, 469.0, 607.0, 1061.0, 1622.0, 2751.0, 5235.0, 10357.0, 24288.0, 158943.0, 773983.0, 37615.0, 14354.0, 6792.0, 3570.0, 1983.0, 1236.0, 792.0, 518.0, 362.0, 243.0, 185.0, 115.0, 79.0, 61.0, 58.0, 44.0, 31.0, 23.0, 19.0, 8.0, 9.0, 7.0, 7.0, 14.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.6416015625, -1.5921478271484375, -1.542694091796875, -1.4932403564453125, -1.44378662109375, -1.3943328857421875, -1.344879150390625, -1.2954254150390625, -1.2459716796875, -1.1965179443359375, -1.147064208984375, -1.0976104736328125, -1.04815673828125, -0.9987030029296875, -0.949249267578125, -0.8997955322265625, -0.850341796875, -0.8008880615234375, -0.751434326171875, -0.7019805908203125, -0.65252685546875, -0.6030731201171875, -0.553619384765625, -0.5041656494140625, -0.4547119140625, -0.4052581787109375, -0.355804443359375, -0.3063507080078125, -0.25689697265625, -0.2074432373046875, -0.157989501953125, -0.1085357666015625, -0.05908203125, -0.0096282958984375, 0.039825439453125, 0.0892791748046875, 0.13873291015625, 0.1881866455078125, 0.237640380859375, 0.2870941162109375, 0.3365478515625, 0.3860015869140625, 0.435455322265625, 0.4849090576171875, 0.53436279296875, 0.5838165283203125, 0.633270263671875, 0.6827239990234375, 0.732177734375, 0.7816314697265625, 0.831085205078125, 0.8805389404296875, 0.92999267578125, 0.9794464111328125, 1.028900146484375, 1.0783538818359375, 1.1278076171875, 1.1772613525390625, 1.226715087890625, 1.2761688232421875, 1.32562255859375, 1.3750762939453125, 1.424530029296875, 1.4739837646484375, 1.5234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 4.0, 8.0, 7.0, 13.0, 9.0, 14.0, 16.0, 18.0, 15.0, 22.0, 23.0, 28.0, 25.0, 34.0, 27.0, 46.0, 30.0, 40.0, 38.0, 39.0, 38.0, 48.0, 40.0, 37.0, 38.0, 32.0, 36.0, 32.0, 30.0, 26.0, 13.0, 20.0, 18.0, 18.0, 19.0, 14.0, 16.0, 9.0, 10.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.541015625, -2.46380615234375, -2.3865966796875, -2.30938720703125, -2.232177734375, -2.15496826171875, -2.0777587890625, -2.00054931640625, -1.92333984375, -1.84613037109375, -1.7689208984375, -1.69171142578125, -1.614501953125, -1.53729248046875, -1.4600830078125, -1.38287353515625, -1.3056640625, -1.22845458984375, -1.1512451171875, -1.07403564453125, -0.996826171875, -0.91961669921875, -0.8424072265625, -0.76519775390625, -0.68798828125, -0.61077880859375, -0.5335693359375, -0.45635986328125, -0.379150390625, -0.30194091796875, -0.2247314453125, -0.14752197265625, -0.0703125, 0.00689697265625, 0.0841064453125, 0.16131591796875, 0.238525390625, 0.31573486328125, 0.3929443359375, 0.47015380859375, 0.54736328125, 0.62457275390625, 0.7017822265625, 0.77899169921875, 0.856201171875, 0.93341064453125, 1.0106201171875, 1.08782958984375, 1.1650390625, 1.24224853515625, 1.3194580078125, 1.39666748046875, 1.473876953125, 1.55108642578125, 1.6282958984375, 1.70550537109375, 1.78271484375, 1.85992431640625, 1.9371337890625, 2.01434326171875, 2.091552734375, 2.16876220703125, 2.2459716796875, 2.32318115234375, 2.400390625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 6.0, 10.0, 15.0, 29.0, 36.0, 71.0, 71.0, 116.0, 200.0, 273.0, 450.0, 724.0, 1085.0, 1743.0, 2834.0, 4658.0, 8174.0, 15437.0, 37109.0, 874691.0, 57488.0, 19200.0, 9753.0, 5526.0, 3318.0, 1974.0, 1226.0, 804.0, 519.0, 318.0, 235.0, 150.0, 83.0, 66.0, 54.0, 29.0, 22.0, 19.0, 15.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51123046875, -0.49204254150390625, -0.4728546142578125, -0.45366668701171875, -0.434478759765625, -0.41529083251953125, -0.3961029052734375, -0.37691497802734375, -0.35772705078125, -0.33853912353515625, -0.3193511962890625, -0.30016326904296875, -0.280975341796875, -0.26178741455078125, -0.2425994873046875, -0.22341156005859375, -0.2042236328125, -0.18503570556640625, -0.1658477783203125, -0.14665985107421875, -0.127471923828125, -0.10828399658203125, -0.0890960693359375, -0.06990814208984375, -0.05072021484375, -0.03153228759765625, -0.0123443603515625, 0.00684356689453125, 0.026031494140625, 0.04521942138671875, 0.0644073486328125, 0.08359527587890625, 0.102783203125, 0.12197113037109375, 0.1411590576171875, 0.16034698486328125, 0.179534912109375, 0.19872283935546875, 0.2179107666015625, 0.23709869384765625, 0.25628662109375, 0.27547454833984375, 0.2946624755859375, 0.31385040283203125, 0.333038330078125, 0.35222625732421875, 0.3714141845703125, 0.39060211181640625, 0.4097900390625, 0.42897796630859375, 0.4481658935546875, 0.46735382080078125, 0.486541748046875, 0.5057296752929688, 0.5249176025390625, 0.5441055297851562, 0.56329345703125, 0.5824813842773438, 0.6016693115234375, 0.6208572387695312, 0.640045166015625, 0.6592330932617188, 0.6784210205078125, 0.6976089477539062, 0.716796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 13.0, 18.0, 20.0, 17.0, 15.0, 25.0, 30.0, 30.0, 49.0, 31.0, 38.0, 36.0, 39.0, 35.0, 59.0, 30.0, 45.0, 33.0, 38.0, 38.0, 34.0, 39.0, 29.0, 33.0, 20.0, 34.0, 22.0, 15.0, 16.0, 11.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.2782554626464844e-05, -3.183819353580475e-05, -3.089383244514465e-05, -2.9949471354484558e-05, -2.9005110263824463e-05, -2.8060749173164368e-05, -2.7116388082504272e-05, -2.6172026991844177e-05, -2.5227665901184082e-05, -2.4283304810523987e-05, -2.333894371986389e-05, -2.2394582629203796e-05, -2.14502215385437e-05, -2.0505860447883606e-05, -1.956149935722351e-05, -1.8617138266563416e-05, -1.767277717590332e-05, -1.6728416085243225e-05, -1.578405499458313e-05, -1.4839693903923035e-05, -1.389533281326294e-05, -1.2950971722602844e-05, -1.2006610631942749e-05, -1.1062249541282654e-05, -1.0117888450622559e-05, -9.173527359962463e-06, -8.229166269302368e-06, -7.284805178642273e-06, -6.340444087982178e-06, -5.3960829973220825e-06, -4.451721906661987e-06, -3.507360816001892e-06, -2.562999725341797e-06, -1.6186386346817017e-06, -6.742775440216064e-07, 2.7008354663848877e-07, 1.214444637298584e-06, 2.158805727958679e-06, 3.1031668186187744e-06, 4.04752790927887e-06, 4.991888999938965e-06, 5.93625009059906e-06, 6.880611181259155e-06, 7.82497227191925e-06, 8.769333362579346e-06, 9.713694453239441e-06, 1.0658055543899536e-05, 1.1602416634559631e-05, 1.2546777725219727e-05, 1.3491138815879822e-05, 1.4435499906539917e-05, 1.5379860997200012e-05, 1.6324222087860107e-05, 1.7268583178520203e-05, 1.8212944269180298e-05, 1.9157305359840393e-05, 2.0101666450500488e-05, 2.1046027541160583e-05, 2.199038863182068e-05, 2.2934749722480774e-05, 2.387911081314087e-05, 2.4823471903800964e-05, 2.576783299446106e-05, 2.6712194085121155e-05, 2.765655517578125e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 7.0, 10.0, 19.0, 19.0, 24.0, 28.0, 48.0, 75.0, 106.0, 141.0, 210.0, 332.0, 486.0, 677.0, 1165.0, 1786.0, 2986.0, 5145.0, 9292.0, 17908.0, 36776.0, 80510.0, 183817.0, 312423.0, 211974.0, 94592.0, 42331.0, 20490.0, 10426.0, 5775.0, 3292.0, 2000.0, 1243.0, 827.0, 511.0, 347.0, 235.0, 158.0, 102.0, 77.0, 48.0, 39.0, 24.0, 21.0, 10.0, 12.0, 7.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2139892578125, -0.20699501037597656, -0.20000076293945312, -0.1930065155029297, -0.18601226806640625, -0.1790180206298828, -0.17202377319335938, -0.16502952575683594, -0.1580352783203125, -0.15104103088378906, -0.14404678344726562, -0.1370525360107422, -0.13005828857421875, -0.12306404113769531, -0.11606979370117188, -0.10907554626464844, -0.102081298828125, -0.09508705139160156, -0.08809280395507812, -0.08109855651855469, -0.07410430908203125, -0.06711006164550781, -0.060115814208984375, -0.05312156677246094, -0.0461273193359375, -0.03913307189941406, -0.032138824462890625, -0.025144577026367188, -0.01815032958984375, -0.011156082153320312, -0.004161834716796875, 0.0028324127197265625, 0.00982666015625, 0.016820907592773438, 0.023815155029296875, 0.030809402465820312, 0.03780364990234375, 0.04479789733886719, 0.051792144775390625, 0.05878639221191406, 0.0657806396484375, 0.07277488708496094, 0.07976913452148438, 0.08676338195800781, 0.09375762939453125, 0.10075187683105469, 0.10774612426757812, 0.11474037170410156, 0.121734619140625, 0.12872886657714844, 0.13572311401367188, 0.1427173614501953, 0.14971160888671875, 0.1567058563232422, 0.16370010375976562, 0.17069435119628906, 0.1776885986328125, 0.18468284606933594, 0.19167709350585938, 0.1986713409423828, 0.20566558837890625, 0.2126598358154297, 0.21965408325195312, 0.22664833068847656, 0.233642578125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 10.0, 12.0, 12.0, 13.0, 22.0, 21.0, 30.0, 49.0, 43.0, 61.0, 85.0, 81.0, 93.0, 85.0, 70.0, 62.0, 47.0, 36.0, 15.0, 17.0, 20.0, 22.0, 12.0, 11.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1292724609375, -0.12485885620117188, -0.12044525146484375, -0.11603164672851562, -0.1116180419921875, -0.10720443725585938, -0.10279083251953125, -0.09837722778320312, -0.093963623046875, -0.08955001831054688, -0.08513641357421875, -0.08072280883789062, -0.0763092041015625, -0.07189559936523438, -0.06748199462890625, -0.06306838989257812, -0.05865478515625, -0.054241180419921875, -0.04982757568359375, -0.045413970947265625, -0.0410003662109375, -0.036586761474609375, -0.03217315673828125, -0.027759552001953125, -0.023345947265625, -0.018932342529296875, -0.01451873779296875, -0.010105133056640625, -0.0056915283203125, -0.001277923583984375, 0.00313568115234375, 0.007549285888671875, 0.011962890625, 0.016376495361328125, 0.02079010009765625, 0.025203704833984375, 0.0296173095703125, 0.034030914306640625, 0.03844451904296875, 0.042858123779296875, 0.047271728515625, 0.051685333251953125, 0.05609893798828125, 0.060512542724609375, 0.0649261474609375, 0.06933975219726562, 0.07375335693359375, 0.07816696166992188, 0.08258056640625, 0.08699417114257812, 0.09140777587890625, 0.09582138061523438, 0.1002349853515625, 0.10464859008789062, 0.10906219482421875, 0.11347579956054688, 0.117889404296875, 0.12230300903320312, 0.12671661376953125, 0.13113021850585938, 0.1355438232421875, 0.13995742797851562, 0.14437103271484375, 0.14878463745117188, 0.1531982421875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 11.0, 5.0, 7.0, 7.0, 11.0, 14.0, 19.0, 11.0, 22.0, 31.0, 49.0, 42.0, 59.0, 67.0, 62.0, 58.0, 65.0, 70.0, 48.0, 68.0, 67.0, 36.0, 42.0, 27.0, 25.0, 17.0, 16.0, 14.0, 5.0, 13.0, 6.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.942590713500977, -4.7854461669921875, -4.628301620483398, -4.471157073974609, -4.31401252746582, -4.156867980957031, -3.9997236728668213, -3.8425791263580322, -3.685434579849243, -3.528290033340454, -3.371145486831665, -3.214000940322876, -3.056856632232666, -2.899712085723877, -2.742567539215088, -2.585422992706299, -2.4282784461975098, -2.2711338996887207, -2.1139893531799316, -1.9568449258804321, -1.799700379371643, -1.642555832862854, -1.4854114055633545, -1.3282668590545654, -1.1711223125457764, -1.0139777660369873, -0.856833279132843, -0.6996887922286987, -0.5425442457199097, -0.3853996992111206, -0.22825521230697632, -0.07111072540283203, 0.08603382110595703, 0.2431783378124237, 0.4003228545188904, 0.5574673414230347, 0.7146118879318237, 0.8717564344406128, 1.0289008617401123, 1.1860454082489014, 1.3431899547576904, 1.5003345012664795, 1.6574790477752686, 1.814623475074768, 1.9717680215835571, 2.1289124488830566, 2.2860569953918457, 2.4432015419006348, 2.600346088409424, 2.757490634918213, 2.914635181427002, 3.071779727935791, 3.22892427444458, 3.386068820953369, 3.543213129043579, 3.700357675552368, 3.8575022220611572, 4.014646530151367, 4.171791076660156, 4.328935623168945, 4.486080169677734, 4.643224716186523, 4.8003692626953125, 4.957513809204102, 5.114658355712891]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 5.0, 10.0, 11.0, 12.0, 15.0, 16.0, 15.0, 26.0, 20.0, 36.0, 29.0, 35.0, 40.0, 39.0, 38.0, 36.0, 54.0, 47.0, 48.0, 40.0, 40.0, 39.0, 29.0, 35.0, 20.0, 35.0, 29.0, 19.0, 29.0, 27.0, 18.0, 15.0, 14.0, 10.0, 13.0, 7.0, 6.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.8237361907958984, -2.7358651161193848, -2.647994041442871, -2.5601229667663574, -2.4722518920898438, -2.38438081741333, -2.2965097427368164, -2.2086386680603027, -2.120767593383789, -2.0328965187072754, -1.9450254440307617, -1.857154369354248, -1.7692832946777344, -1.6814122200012207, -1.5935412645339966, -1.505670189857483, -1.4177992343902588, -1.3299281597137451, -1.2420570850372314, -1.1541860103607178, -1.066314935684204, -0.9784439206123352, -0.8905729055404663, -0.8027018308639526, -0.714830756187439, -0.6269596815109253, -0.5390886068344116, -0.4512175917625427, -0.36334651708602905, -0.2754754424095154, -0.18760442733764648, -0.09973335266113281, -0.01186227798461914, 0.07600878179073334, 0.16387984156608582, 0.2517508864402771, 0.33962196111679077, 0.42749303579330444, 0.5153640508651733, 0.603235125541687, 0.6911062002182007, 0.7789772748947144, 0.866848349571228, 0.9547193646430969, 1.0425903797149658, 1.1304614543914795, 1.2183325290679932, 1.3062036037445068, 1.3940746784210205, 1.4819457530975342, 1.5698168277740479, 1.6576879024505615, 1.7455589771270752, 1.8334300518035889, 1.921301007270813, 2.009171962738037, 2.097043037414551, 2.1849141120910645, 2.272785186767578, 2.360656261444092, 2.4485273361206055, 2.536398410797119, 2.624269485473633, 2.7121405601501465, 2.80001163482666]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 12.0, 9.0, 18.0, 24.0, 38.0, 63.0, 97.0, 143.0, 210.0, 364.0, 531.0, 918.0, 1490.0, 2654.0, 4234.0, 6735.0, 11581.0, 18956.0, 31577.0, 50646.0, 79152.0, 113377.0, 144064.0, 155466.0, 137245.0, 103328.0, 70792.0, 44876.0, 27707.0, 16633.0, 10027.0, 5943.0, 3745.0, 2294.0, 1372.0, 815.0, 498.0, 334.0, 206.0, 124.0, 83.0, 66.0, 27.0, 34.0, 11.0, 8.0, 5.0, 2.0, 9.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-3.341796875, -3.238555908203125, -3.13531494140625, -3.032073974609375, -2.9288330078125, -2.825592041015625, -2.72235107421875, -2.619110107421875, -2.515869140625, -2.412628173828125, -2.30938720703125, -2.206146240234375, -2.1029052734375, -1.999664306640625, -1.89642333984375, -1.793182373046875, -1.68994140625, -1.586700439453125, -1.48345947265625, -1.380218505859375, -1.2769775390625, -1.173736572265625, -1.07049560546875, -0.967254638671875, -0.864013671875, -0.760772705078125, -0.65753173828125, -0.554290771484375, -0.4510498046875, -0.347808837890625, -0.24456787109375, -0.141326904296875, -0.0380859375, 0.065155029296875, 0.16839599609375, 0.271636962890625, 0.3748779296875, 0.478118896484375, 0.58135986328125, 0.684600830078125, 0.787841796875, 0.891082763671875, 0.99432373046875, 1.097564697265625, 1.2008056640625, 1.304046630859375, 1.40728759765625, 1.510528564453125, 1.61376953125, 1.717010498046875, 1.82025146484375, 1.923492431640625, 2.0267333984375, 2.129974365234375, 2.23321533203125, 2.336456298828125, 2.439697265625, 2.542938232421875, 2.64617919921875, 2.749420166015625, 2.8526611328125, 2.955902099609375, 3.05914306640625, 3.162384033203125, 3.265625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 7.0, 13.0, 13.0, 13.0, 15.0, 21.0, 25.0, 23.0, 23.0, 40.0, 28.0, 31.0, 35.0, 33.0, 32.0, 43.0, 47.0, 51.0, 41.0, 29.0, 37.0, 24.0, 31.0, 35.0, 44.0, 29.0, 29.0, 26.0, 23.0, 19.0, 23.0, 15.0, 12.0, 14.0, 7.0, 12.0, 7.0, 8.0, 4.0, 3.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.543731689453125, -2.45269775390625, -2.361663818359375, -2.2706298828125, -2.179595947265625, -2.08856201171875, -1.997528076171875, -1.906494140625, -1.815460205078125, -1.72442626953125, -1.633392333984375, -1.5423583984375, -1.451324462890625, -1.36029052734375, -1.269256591796875, -1.17822265625, -1.087188720703125, -0.99615478515625, -0.905120849609375, -0.8140869140625, -0.723052978515625, -0.63201904296875, -0.540985107421875, -0.449951171875, -0.358917236328125, -0.26788330078125, -0.176849365234375, -0.0858154296875, 0.005218505859375, 0.09625244140625, 0.187286376953125, 0.2783203125, 0.369354248046875, 0.46038818359375, 0.551422119140625, 0.6424560546875, 0.733489990234375, 0.82452392578125, 0.915557861328125, 1.006591796875, 1.097625732421875, 1.18865966796875, 1.279693603515625, 1.3707275390625, 1.461761474609375, 1.55279541015625, 1.643829345703125, 1.73486328125, 1.825897216796875, 1.91693115234375, 2.007965087890625, 2.0989990234375, 2.190032958984375, 2.28106689453125, 2.372100830078125, 2.463134765625, 2.554168701171875, 2.64520263671875, 2.736236572265625, 2.8272705078125, 2.918304443359375, 3.00933837890625, 3.100372314453125, 3.19140625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 16.0, 19.0, 24.0, 40.0, 67.0, 96.0, 128.0, 195.0, 328.0, 466.0, 806.0, 1352.0, 2200.0, 3675.0, 6014.0, 10167.0, 17248.0, 28438.0, 46243.0, 73195.0, 108372.0, 142850.0, 158204.0, 143943.0, 109824.0, 74986.0, 47144.0, 29193.0, 17271.0, 10243.0, 6267.0, 3635.0, 2197.0, 1341.0, 858.0, 545.0, 355.0, 197.0, 140.0, 95.0, 58.0, 39.0, 23.0, 18.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-3.42578125, -3.323577880859375, -3.22137451171875, -3.119171142578125, -3.0169677734375, -2.914764404296875, -2.81256103515625, -2.710357666015625, -2.608154296875, -2.505950927734375, -2.40374755859375, -2.301544189453125, -2.1993408203125, -2.097137451171875, -1.99493408203125, -1.892730712890625, -1.79052734375, -1.688323974609375, -1.58612060546875, -1.483917236328125, -1.3817138671875, -1.279510498046875, -1.17730712890625, -1.075103759765625, -0.972900390625, -0.870697021484375, -0.76849365234375, -0.666290283203125, -0.5640869140625, -0.461883544921875, -0.35968017578125, -0.257476806640625, -0.1552734375, -0.053070068359375, 0.04913330078125, 0.151336669921875, 0.2535400390625, 0.355743408203125, 0.45794677734375, 0.560150146484375, 0.662353515625, 0.764556884765625, 0.86676025390625, 0.968963623046875, 1.0711669921875, 1.173370361328125, 1.27557373046875, 1.377777099609375, 1.47998046875, 1.582183837890625, 1.68438720703125, 1.786590576171875, 1.8887939453125, 1.990997314453125, 2.09320068359375, 2.195404052734375, 2.297607421875, 2.399810791015625, 2.50201416015625, 2.604217529296875, 2.7064208984375, 2.808624267578125, 2.91082763671875, 3.013031005859375, 3.115234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 14.0, 8.0, 4.0, 9.0, 16.0, 7.0, 13.0, 10.0, 23.0, 17.0, 29.0, 31.0, 39.0, 36.0, 29.0, 37.0, 43.0, 35.0, 40.0, 40.0, 40.0, 45.0, 51.0, 39.0, 32.0, 40.0, 33.0, 36.0, 32.0, 22.0, 29.0, 15.0, 27.0, 15.0, 17.0, 13.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.98492431640625, -1.9210205078125, -1.85711669921875, -1.793212890625, -1.72930908203125, -1.6654052734375, -1.60150146484375, -1.53759765625, -1.47369384765625, -1.4097900390625, -1.34588623046875, -1.281982421875, -1.21807861328125, -1.1541748046875, -1.09027099609375, -1.0263671875, -0.96246337890625, -0.8985595703125, -0.83465576171875, -0.770751953125, -0.70684814453125, -0.6429443359375, -0.57904052734375, -0.51513671875, -0.45123291015625, -0.3873291015625, -0.32342529296875, -0.259521484375, -0.19561767578125, -0.1317138671875, -0.06781005859375, -0.00390625, 0.05999755859375, 0.1239013671875, 0.18780517578125, 0.251708984375, 0.31561279296875, 0.3795166015625, 0.44342041015625, 0.50732421875, 0.57122802734375, 0.6351318359375, 0.69903564453125, 0.762939453125, 0.82684326171875, 0.8907470703125, 0.95465087890625, 1.0185546875, 1.08245849609375, 1.1463623046875, 1.21026611328125, 1.274169921875, 1.33807373046875, 1.4019775390625, 1.46588134765625, 1.52978515625, 1.59368896484375, 1.6575927734375, 1.72149658203125, 1.785400390625, 1.84930419921875, 1.9132080078125, 1.97711181640625, 2.041015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 10.0, 19.0, 22.0, 38.0, 55.0, 109.0, 140.0, 223.0, 351.0, 556.0, 938.0, 1460.0, 2576.0, 4235.0, 7382.0, 12941.0, 22366.0, 39416.0, 68510.0, 111793.0, 161641.0, 185020.0, 159659.0, 110126.0, 67156.0, 39376.0, 22187.0, 12566.0, 7168.0, 4202.0, 2453.0, 1448.0, 899.0, 537.0, 346.0, 236.0, 129.0, 100.0, 52.0, 30.0, 20.0, 18.0, 9.0, 12.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.099609375, -2.03497314453125, -1.9703369140625, -1.90570068359375, -1.841064453125, -1.77642822265625, -1.7117919921875, -1.64715576171875, -1.58251953125, -1.51788330078125, -1.4532470703125, -1.38861083984375, -1.323974609375, -1.25933837890625, -1.1947021484375, -1.13006591796875, -1.0654296875, -1.00079345703125, -0.9361572265625, -0.87152099609375, -0.806884765625, -0.74224853515625, -0.6776123046875, -0.61297607421875, -0.54833984375, -0.48370361328125, -0.4190673828125, -0.35443115234375, -0.289794921875, -0.22515869140625, -0.1605224609375, -0.09588623046875, -0.03125, 0.03338623046875, 0.0980224609375, 0.16265869140625, 0.227294921875, 0.29193115234375, 0.3565673828125, 0.42120361328125, 0.48583984375, 0.55047607421875, 0.6151123046875, 0.67974853515625, 0.744384765625, 0.80902099609375, 0.8736572265625, 0.93829345703125, 1.0029296875, 1.06756591796875, 1.1322021484375, 1.19683837890625, 1.261474609375, 1.32611083984375, 1.3907470703125, 1.45538330078125, 1.52001953125, 1.58465576171875, 1.6492919921875, 1.71392822265625, 1.778564453125, 1.84320068359375, 1.9078369140625, 1.97247314453125, 2.037109375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 14.0, 15.0, 17.0, 16.0, 15.0, 24.0, 38.0, 23.0, 32.0, 42.0, 50.0, 48.0, 54.0, 68.0, 74.0, 49.0, 61.0, 44.0, 43.0, 40.0, 42.0, 24.0, 19.0, 27.0, 20.0, 20.0, 13.0, 10.0, 6.0, 6.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00019216537475585938, -0.0001864079385995865, -0.0001806505024433136, -0.0001748930662870407, -0.00016913563013076782, -0.00016337819397449493, -0.00015762075781822205, -0.00015186332166194916, -0.00014610588550567627, -0.00014034844934940338, -0.0001345910131931305, -0.0001288335770368576, -0.00012307614088058472, -0.00011731870472431183, -0.00011156126856803894, -0.00010580383241176605, -0.00010004639625549316, -9.428896009922028e-05, -8.853152394294739e-05, -8.27740877866745e-05, -7.701665163040161e-05, -7.125921547412872e-05, -6.550177931785583e-05, -5.974434316158295e-05, -5.398690700531006e-05, -4.822947084903717e-05, -4.247203469276428e-05, -3.6714598536491394e-05, -3.0957162380218506e-05, -2.5199726223945618e-05, -1.944229006767273e-05, -1.3684853911399841e-05, -7.927417755126953e-06, -2.169981598854065e-06, 3.5874545574188232e-06, 9.344890713691711e-06, 1.51023268699646e-05, 2.0859763026237488e-05, 2.6617199182510376e-05, 3.2374635338783264e-05, 3.813207149505615e-05, 4.388950765132904e-05, 4.964694380760193e-05, 5.540437996387482e-05, 6.11618161201477e-05, 6.69192522764206e-05, 7.267668843269348e-05, 7.843412458896637e-05, 8.419156074523926e-05, 8.994899690151215e-05, 9.570643305778503e-05, 0.00010146386921405792, 0.00010722130537033081, 0.0001129787415266037, 0.00011873617768287659, 0.00012449361383914948, 0.00013025104999542236, 0.00013600848615169525, 0.00014176592230796814, 0.00014752335846424103, 0.00015328079462051392, 0.0001590382307767868, 0.0001647956669330597, 0.00017055310308933258, 0.00017631053924560547]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 12.0, 11.0, 23.0, 37.0, 64.0, 94.0, 145.0, 251.0, 403.0, 651.0, 999.0, 1673.0, 2590.0, 4236.0, 6953.0, 11467.0, 18383.0, 29972.0, 48292.0, 75297.0, 110361.0, 143914.0, 157109.0, 140144.0, 105672.0, 71318.0, 45015.0, 28284.0, 17416.0, 10746.0, 6507.0, 4049.0, 2429.0, 1523.0, 977.0, 553.0, 371.0, 222.0, 141.0, 90.0, 51.0, 47.0, 25.0, 10.0, 14.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.7412109375, -1.6891326904296875, -1.637054443359375, -1.5849761962890625, -1.53289794921875, -1.4808197021484375, -1.428741455078125, -1.3766632080078125, -1.3245849609375, -1.2725067138671875, -1.220428466796875, -1.1683502197265625, -1.11627197265625, -1.0641937255859375, -1.012115478515625, -0.9600372314453125, -0.907958984375, -0.8558807373046875, -0.803802490234375, -0.7517242431640625, -0.69964599609375, -0.6475677490234375, -0.595489501953125, -0.5434112548828125, -0.4913330078125, -0.4392547607421875, -0.387176513671875, -0.3350982666015625, -0.28302001953125, -0.2309417724609375, -0.178863525390625, -0.1267852783203125, -0.07470703125, -0.0226287841796875, 0.029449462890625, 0.0815277099609375, 0.13360595703125, 0.1856842041015625, 0.237762451171875, 0.2898406982421875, 0.3419189453125, 0.3939971923828125, 0.446075439453125, 0.4981536865234375, 0.55023193359375, 0.6023101806640625, 0.654388427734375, 0.7064666748046875, 0.758544921875, 0.8106231689453125, 0.862701416015625, 0.9147796630859375, 0.96685791015625, 1.0189361572265625, 1.071014404296875, 1.1230926513671875, 1.1751708984375, 1.2272491455078125, 1.279327392578125, 1.3314056396484375, 1.38348388671875, 1.4355621337890625, 1.487640380859375, 1.5397186279296875, 1.591796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 4.0, 9.0, 13.0, 15.0, 12.0, 18.0, 16.0, 23.0, 32.0, 30.0, 39.0, 54.0, 59.0, 59.0, 61.0, 57.0, 72.0, 56.0, 64.0, 54.0, 37.0, 23.0, 34.0, 30.0, 29.0, 22.0, 14.0, 12.0, 12.0, 11.0, 6.0, 4.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66064453125, -0.6390609741210938, -0.6174774169921875, -0.5958938598632812, -0.574310302734375, -0.5527267456054688, -0.5311431884765625, -0.5095596313476562, -0.48797607421875, -0.46639251708984375, -0.4448089599609375, -0.42322540283203125, -0.401641845703125, -0.38005828857421875, -0.3584747314453125, -0.33689117431640625, -0.3153076171875, -0.29372406005859375, -0.2721405029296875, -0.25055694580078125, -0.228973388671875, -0.20738983154296875, -0.1858062744140625, -0.16422271728515625, -0.14263916015625, -0.12105560302734375, -0.0994720458984375, -0.07788848876953125, -0.056304931640625, -0.03472137451171875, -0.0131378173828125, 0.00844573974609375, 0.030029296875, 0.05161285400390625, 0.0731964111328125, 0.09477996826171875, 0.116363525390625, 0.13794708251953125, 0.1595306396484375, 0.18111419677734375, 0.20269775390625, 0.22428131103515625, 0.2458648681640625, 0.26744842529296875, 0.289031982421875, 0.31061553955078125, 0.3321990966796875, 0.35378265380859375, 0.3753662109375, 0.39694976806640625, 0.4185333251953125, 0.44011688232421875, 0.461700439453125, 0.48328399658203125, 0.5048675537109375, 0.5264511108398438, 0.54803466796875, 0.5696182250976562, 0.5912017822265625, 0.6127853393554688, 0.634368896484375, 0.6559524536132812, 0.6775360107421875, 0.6991195678710938, 0.720703125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 9.0, 11.0, 12.0, 11.0, 21.0, 29.0, 48.0, 45.0, 48.0, 62.0, 59.0, 66.0, 60.0, 62.0, 59.0, 56.0, 61.0, 46.0, 44.0, 27.0, 34.0, 26.0, 18.0, 9.0, 7.0, 11.0, 10.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9030683040618896, -3.753147840499878, -3.6032276153564453, -3.4533071517944336, -3.303386926651001, -3.1534664630889893, -3.0035462379455566, -2.853625774383545, -2.703705310821533, -2.5537848472595215, -2.403864622116089, -2.253944158554077, -2.1040239334106445, -1.9541034698486328, -1.8041831254959106, -1.6542627811431885, -1.5043425559997559, -1.3544222116470337, -1.2045018672943115, -1.0545814037322998, -0.9046611189842224, -0.7547407746315002, -0.6048203706741333, -0.45490002632141113, -0.30497968196868896, -0.1550593227148056, -0.005138963460922241, 0.14478141069412231, 0.2947017550468445, 0.44462209939956665, 0.5945425033569336, 0.7444628477096558, 0.894383430480957, 1.0443037748336792, 1.1942241191864014, 1.344144582748413, 1.4940648078918457, 1.6439852714538574, 1.7939056158065796, 1.9438259601593018, 2.0937461853027344, 2.243666648864746, 2.3935868740081787, 2.5435073375701904, 2.693427562713623, 2.8433480262756348, 2.9932684898376465, 3.143188714981079, 3.293109178543091, 3.4430296421051025, 3.592949867248535, 3.742870330810547, 3.8927905559539795, 4.042710781097412, 4.192631244659424, 4.3425517082214355, 4.492472171783447, 4.642392635345459, 4.792313098907471, 4.942233085632324, 5.092153549194336, 5.242074012756348, 5.391994476318359, 5.541914939880371, 5.691834926605225]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 6.0, 1.0, 8.0, 1.0, 3.0, 6.0, 12.0, 13.0, 17.0, 12.0, 8.0, 14.0, 24.0, 21.0, 26.0, 35.0, 24.0, 33.0, 38.0, 38.0, 49.0, 44.0, 36.0, 43.0, 38.0, 34.0, 32.0, 31.0, 23.0, 28.0, 34.0, 26.0, 26.0, 32.0, 20.0, 25.0, 27.0, 16.0, 8.0, 11.0, 21.0, 9.0, 6.0, 4.0, 8.0, 4.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0], "bins": [-2.761392116546631, -2.680264949798584, -2.599137544631958, -2.518010377883911, -2.4368832111358643, -2.3557558059692383, -2.2746286392211914, -2.1935014724731445, -2.1123740673065186, -2.0312469005584717, -1.9501196146011353, -1.8689923286437988, -1.7878650426864624, -1.706737756729126, -1.625610589981079, -1.5444833040237427, -1.4633561372756958, -1.3822288513183594, -1.3011016845703125, -1.219974398612976, -1.1388471126556396, -1.0577199459075928, -0.9765926599502563, -0.8954653739929199, -0.8143381476402283, -0.7332109212875366, -0.6520836353302002, -0.5709564089775085, -0.4898291528224945, -0.40870189666748047, -0.3275746703147888, -0.2464473843574524, -0.16532015800476074, -0.0841929093003273, -0.00306566059589386, 0.07806158065795898, 0.15918883681297302, 0.24031609296798706, 0.3214433193206787, 0.40257060527801514, 0.4836978316307068, 0.5648250579833984, 0.6459523439407349, 0.7270795702934265, 0.8082067966461182, 0.8893340826034546, 0.9704613089561462, 1.051588535308838, 1.1327158212661743, 1.2138431072235107, 1.2949702739715576, 1.376097559928894, 1.4572248458862305, 1.5383520126342773, 1.6194792985916138, 1.7006065845489502, 1.781733751296997, 1.8628610372543335, 1.9439882040023804, 2.025115489959717, 2.1062426567077637, 2.1873700618743896, 2.2684972286224365, 2.3496246337890625, 2.4307518005371094]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 9.0, 11.0, 23.0, 25.0, 38.0, 52.0, 68.0, 117.0, 212.0, 318.0, 446.0, 691.0, 1043.0, 1769.0, 2851.0, 4684.0, 7814.0, 13949.0, 25472.0, 49713.0, 101316.0, 222267.0, 517864.0, 1031953.0, 1113228.0, 602227.0, 257634.0, 115340.0, 56228.0, 28931.0, 15911.0, 8980.0, 5106.0, 3008.0, 1882.0, 1128.0, 747.0, 439.0, 254.0, 203.0, 132.0, 71.0, 45.0, 43.0, 18.0, 13.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-5.203125, -5.0589599609375, -4.914794921875, -4.7706298828125, -4.62646484375, -4.4822998046875, -4.338134765625, -4.1939697265625, -4.0498046875, -3.9056396484375, -3.761474609375, -3.6173095703125, -3.47314453125, -3.3289794921875, -3.184814453125, -3.0406494140625, -2.896484375, -2.7523193359375, -2.608154296875, -2.4639892578125, -2.31982421875, -2.1756591796875, -2.031494140625, -1.8873291015625, -1.7431640625, -1.5989990234375, -1.454833984375, -1.3106689453125, -1.16650390625, -1.0223388671875, -0.878173828125, -0.7340087890625, -0.58984375, -0.4456787109375, -0.301513671875, -0.1573486328125, -0.01318359375, 0.1309814453125, 0.275146484375, 0.4193115234375, 0.5634765625, 0.7076416015625, 0.851806640625, 0.9959716796875, 1.14013671875, 1.2843017578125, 1.428466796875, 1.5726318359375, 1.716796875, 1.8609619140625, 2.005126953125, 2.1492919921875, 2.29345703125, 2.4376220703125, 2.581787109375, 2.7259521484375, 2.8701171875, 3.0142822265625, 3.158447265625, 3.3026123046875, 3.44677734375, 3.5909423828125, 3.735107421875, 3.8792724609375, 4.0234375]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 4.0, 4.0, 5.0, 10.0, 17.0, 14.0, 15.0, 14.0, 17.0, 21.0, 28.0, 19.0, 30.0, 43.0, 29.0, 37.0, 39.0, 40.0, 38.0, 48.0, 47.0, 34.0, 39.0, 32.0, 30.0, 36.0, 41.0, 33.0, 23.0, 21.0, 22.0, 23.0, 25.0, 20.0, 13.0, 10.0, 11.0, 7.0, 14.0, 3.0, 5.0, 4.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8919677734375, -1.831787109375, -1.7716064453125, -1.71142578125, -1.6512451171875, -1.591064453125, -1.5308837890625, -1.470703125, -1.4105224609375, -1.350341796875, -1.2901611328125, -1.22998046875, -1.1697998046875, -1.109619140625, -1.0494384765625, -0.9892578125, -0.9290771484375, -0.868896484375, -0.8087158203125, -0.74853515625, -0.6883544921875, -0.628173828125, -0.5679931640625, -0.5078125, -0.4476318359375, -0.387451171875, -0.3272705078125, -0.26708984375, -0.2069091796875, -0.146728515625, -0.0865478515625, -0.0263671875, 0.0338134765625, 0.093994140625, 0.1541748046875, 0.21435546875, 0.2745361328125, 0.334716796875, 0.3948974609375, 0.455078125, 0.5152587890625, 0.575439453125, 0.6356201171875, 0.69580078125, 0.7559814453125, 0.816162109375, 0.8763427734375, 0.9365234375, 0.9967041015625, 1.056884765625, 1.1170654296875, 1.17724609375, 1.2374267578125, 1.297607421875, 1.3577880859375, 1.41796875, 1.4781494140625, 1.538330078125, 1.5985107421875, 1.65869140625, 1.7188720703125, 1.779052734375, 1.8392333984375, 1.8994140625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 11.0, 7.0, 31.0, 29.0, 50.0, 63.0, 117.0, 179.0, 263.0, 385.0, 651.0, 930.0, 1634.0, 2557.0, 4142.0, 6969.0, 12067.0, 20994.0, 38495.0, 73202.0, 143392.0, 285092.0, 562891.0, 936695.0, 936982.0, 567641.0, 289982.0, 144460.0, 73875.0, 38822.0, 21567.0, 12151.0, 6983.0, 4029.0, 2544.0, 1585.0, 1007.0, 597.0, 406.0, 277.0, 191.0, 100.0, 81.0, 49.0, 34.0, 28.0, 16.0, 6.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.05859375, -3.92333984375, -3.7880859375, -3.65283203125, -3.517578125, -3.38232421875, -3.2470703125, -3.11181640625, -2.9765625, -2.84130859375, -2.7060546875, -2.57080078125, -2.435546875, -2.30029296875, -2.1650390625, -2.02978515625, -1.89453125, -1.75927734375, -1.6240234375, -1.48876953125, -1.353515625, -1.21826171875, -1.0830078125, -0.94775390625, -0.8125, -0.67724609375, -0.5419921875, -0.40673828125, -0.271484375, -0.13623046875, -0.0009765625, 0.13427734375, 0.26953125, 0.40478515625, 0.5400390625, 0.67529296875, 0.810546875, 0.94580078125, 1.0810546875, 1.21630859375, 1.3515625, 1.48681640625, 1.6220703125, 1.75732421875, 1.892578125, 2.02783203125, 2.1630859375, 2.29833984375, 2.43359375, 2.56884765625, 2.7041015625, 2.83935546875, 2.974609375, 3.10986328125, 3.2451171875, 3.38037109375, 3.515625, 3.65087890625, 3.7861328125, 3.92138671875, 4.056640625, 4.19189453125, 4.3271484375, 4.46240234375, 4.59765625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 6.0, 3.0, 10.0, 4.0, 10.0, 17.0, 22.0, 20.0, 27.0, 34.0, 55.0, 61.0, 82.0, 86.0, 113.0, 114.0, 148.0, 191.0, 226.0, 230.0, 246.0, 247.0, 246.0, 264.0, 224.0, 224.0, 200.0, 181.0, 147.0, 119.0, 104.0, 85.0, 67.0, 71.0, 44.0, 32.0, 27.0, 30.0, 14.0, 11.0, 8.0, 10.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.209442138671875, -1.17181396484375, -1.134185791015625, -1.0965576171875, -1.058929443359375, -1.02130126953125, -0.983673095703125, -0.946044921875, -0.908416748046875, -0.87078857421875, -0.833160400390625, -0.7955322265625, -0.757904052734375, -0.72027587890625, -0.682647705078125, -0.64501953125, -0.607391357421875, -0.56976318359375, -0.532135009765625, -0.4945068359375, -0.456878662109375, -0.41925048828125, -0.381622314453125, -0.343994140625, -0.306365966796875, -0.26873779296875, -0.231109619140625, -0.1934814453125, -0.155853271484375, -0.11822509765625, -0.080596923828125, -0.04296875, -0.005340576171875, 0.03228759765625, 0.069915771484375, 0.1075439453125, 0.145172119140625, 0.18280029296875, 0.220428466796875, 0.258056640625, 0.295684814453125, 0.33331298828125, 0.370941162109375, 0.4085693359375, 0.446197509765625, 0.48382568359375, 0.521453857421875, 0.55908203125, 0.596710205078125, 0.63433837890625, 0.671966552734375, 0.7095947265625, 0.747222900390625, 0.78485107421875, 0.822479248046875, 0.860107421875, 0.897735595703125, 0.93536376953125, 0.972991943359375, 1.0106201171875, 1.048248291015625, 1.08587646484375, 1.123504638671875, 1.1611328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 6.0, 7.0, 10.0, 15.0, 16.0, 14.0, 20.0, 28.0, 32.0, 33.0, 51.0, 43.0, 52.0, 56.0, 46.0, 53.0, 56.0, 61.0, 51.0, 45.0, 34.0, 36.0, 35.0, 33.0, 25.0, 24.0, 23.0, 15.0, 6.0, 20.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2587530612945557, -3.1374149322509766, -3.0160770416259766, -2.8947389125823975, -2.7734007835388184, -2.6520628929138184, -2.5307247638702393, -2.40938663482666, -2.28804874420166, -2.166710615158081, -2.045372724533081, -1.924034595489502, -1.8026965856552124, -1.6813585758209229, -1.5600204467773438, -1.4386824369430542, -1.3173444271087646, -1.196006417274475, -1.0746684074401855, -0.9533302783966064, -0.8319922685623169, -0.7106542587280273, -0.589316189289093, -0.4679781198501587, -0.34664011001586914, -0.2253020703792572, -0.10396403074264526, 0.017374008893966675, 0.1387120485305786, 0.26005005836486816, 0.3813881278038025, 0.5027261972427368, 0.6240639686584473, 0.7454019784927368, 0.8667400479316711, 0.9880781173706055, 1.109416127204895, 1.2307541370391846, 1.3520922660827637, 1.4734302759170532, 1.5947682857513428, 1.7161062955856323, 1.8374443054199219, 1.958782434463501, 2.08012056350708, 2.20145845413208, 2.322796583175659, 2.4441347122192383, 2.5654726028442383, 2.6868107318878174, 2.8081486225128174, 2.9294867515563965, 3.0508246421813965, 3.1721627712249756, 3.2935009002685547, 3.4148387908935547, 3.536176919937134, 3.657515048980713, 3.778852939605713, 3.900191068649292, 4.021529197692871, 4.142867088317871, 4.264204978942871, 4.385543346405029, 4.506881237030029]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 7.0, 12.0, 9.0, 6.0, 11.0, 9.0, 14.0, 15.0, 20.0, 23.0, 15.0, 17.0, 29.0, 34.0, 35.0, 29.0, 26.0, 38.0, 30.0, 46.0, 46.0, 50.0, 43.0, 28.0, 27.0, 29.0, 38.0, 36.0, 31.0, 37.0, 20.0, 22.0, 11.0, 20.0, 24.0, 17.0, 22.0, 13.0, 8.0, 13.0, 7.0, 7.0, 4.0, 9.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-2.0733299255371094, -2.0040252208709717, -1.934720516204834, -1.8654159307479858, -1.7961112260818481, -1.7268065214157104, -1.6575019359588623, -1.5881972312927246, -1.518892526626587, -1.4495878219604492, -1.3802831172943115, -1.3109785318374634, -1.2416738271713257, -1.172369122505188, -1.1030645370483398, -1.0337598323822021, -0.9644551277160645, -0.8951504230499268, -0.8258457779884338, -0.7565411329269409, -0.6872364282608032, -0.6179317235946655, -0.5486270785331726, -0.4793224036693573, -0.410017728805542, -0.3407130539417267, -0.2714083790779114, -0.20210370421409607, -0.13279902935028076, -0.06349435448646545, 0.0058103203773498535, 0.07511499524116516, 0.14441990852355957, 0.21372458338737488, 0.2830292582511902, 0.3523339331150055, 0.4216386079788208, 0.4909432828426361, 0.5602479577064514, 0.6295526027679443, 0.698857307434082, 0.7681620121002197, 0.8374666571617126, 0.9067713022232056, 0.9760760068893433, 1.045380711555481, 1.114685297012329, 1.1839900016784668, 1.2532947063446045, 1.3225994110107422, 1.3919041156768799, 1.461208701133728, 1.5305134057998657, 1.5998181104660034, 1.6691226959228516, 1.7384274005889893, 1.807732105255127, 1.8770368099212646, 1.9463415145874023, 2.01564621925354, 2.0849509239196777, 2.1542553901672363, 2.223560094833374, 2.2928647994995117, 2.3621695041656494]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 13.0, 23.0, 32.0, 56.0, 83.0, 115.0, 169.0, 296.0, 415.0, 628.0, 950.0, 1496.0, 2328.0, 3663.0, 5729.0, 9105.0, 14356.0, 22547.0, 35283.0, 54423.0, 82369.0, 117504.0, 148476.0, 153693.0, 128318.0, 93210.0, 62004.0, 40552.0, 25638.0, 16361.0, 10314.0, 6504.0, 4231.0, 2696.0, 1805.0, 1110.0, 681.0, 446.0, 324.0, 204.0, 121.0, 111.0, 48.0, 32.0, 23.0, 10.0, 15.0, 10.0, 7.0, 7.0, 3.0, 6.0, 2.0], "bins": [-0.315673828125, -0.3064308166503906, -0.29718780517578125, -0.2879447937011719, -0.2787017822265625, -0.2694587707519531, -0.26021575927734375, -0.2509727478027344, -0.241729736328125, -0.23248672485351562, -0.22324371337890625, -0.21400070190429688, -0.2047576904296875, -0.19551467895507812, -0.18627166748046875, -0.17702865600585938, -0.16778564453125, -0.15854263305664062, -0.14929962158203125, -0.14005661010742188, -0.1308135986328125, -0.12157058715820312, -0.11232757568359375, -0.10308456420898438, -0.093841552734375, -0.08459854125976562, -0.07535552978515625, -0.06611251831054688, -0.0568695068359375, -0.047626495361328125, -0.03838348388671875, -0.029140472412109375, -0.0198974609375, -0.010654449462890625, -0.00141143798828125, 0.007831573486328125, 0.0170745849609375, 0.026317596435546875, 0.03556060791015625, 0.044803619384765625, 0.054046630859375, 0.06328964233398438, 0.07253265380859375, 0.08177566528320312, 0.0910186767578125, 0.10026168823242188, 0.10950469970703125, 0.11874771118164062, 0.12799072265625, 0.13723373413085938, 0.14647674560546875, 0.15571975708007812, 0.1649627685546875, 0.17420578002929688, 0.18344879150390625, 0.19269180297851562, 0.201934814453125, 0.21117782592773438, 0.22042083740234375, 0.22966384887695312, 0.2389068603515625, 0.24814987182617188, 0.25739288330078125, 0.2666358947753906, 0.27587890625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 12.0, 10.0, 16.0, 15.0, 23.0, 22.0, 18.0, 20.0, 36.0, 20.0, 26.0, 40.0, 25.0, 41.0, 45.0, 40.0, 44.0, 53.0, 40.0, 38.0, 47.0, 33.0, 30.0, 31.0, 34.0, 25.0, 19.0, 27.0, 19.0, 23.0, 11.0, 19.0, 19.0, 20.0, 14.0, 4.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28125, -2.198883056640625, -2.11651611328125, -2.034149169921875, -1.9517822265625, -1.869415283203125, -1.78704833984375, -1.704681396484375, -1.622314453125, -1.539947509765625, -1.45758056640625, -1.375213623046875, -1.2928466796875, -1.210479736328125, -1.12811279296875, -1.045745849609375, -0.96337890625, -0.881011962890625, -0.79864501953125, -0.716278076171875, -0.6339111328125, -0.551544189453125, -0.46917724609375, -0.386810302734375, -0.304443359375, -0.222076416015625, -0.13970947265625, -0.057342529296875, 0.0250244140625, 0.107391357421875, 0.18975830078125, 0.272125244140625, 0.3544921875, 0.436859130859375, 0.51922607421875, 0.601593017578125, 0.6839599609375, 0.766326904296875, 0.84869384765625, 0.931060791015625, 1.013427734375, 1.095794677734375, 1.17816162109375, 1.260528564453125, 1.3428955078125, 1.425262451171875, 1.50762939453125, 1.589996337890625, 1.67236328125, 1.754730224609375, 1.83709716796875, 1.919464111328125, 2.0018310546875, 2.084197998046875, 2.16656494140625, 2.248931884765625, 2.331298828125, 2.413665771484375, 2.49603271484375, 2.578399658203125, 2.6607666015625, 2.743133544921875, 2.82550048828125, 2.907867431640625, 2.990234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 6.0, 7.0, 11.0, 16.0, 19.0, 25.0, 26.0, 59.0, 57.0, 85.0, 108.0, 148.0, 195.0, 308.0, 451.0, 649.0, 1094.0, 1778.0, 3170.0, 5974.0, 11518.0, 24087.0, 118039.0, 796702.0, 46413.0, 17614.0, 8661.0, 4488.0, 2536.0, 1451.0, 931.0, 610.0, 382.0, 260.0, 184.0, 123.0, 104.0, 59.0, 42.0, 34.0, 25.0, 20.0, 24.0, 11.0, 16.0, 10.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.95849609375, -0.92578125, -0.89306640625, -0.8603515625, -0.82763671875, -0.794921875, -0.76220703125, -0.7294921875, -0.69677734375, -0.6640625, -0.63134765625, -0.5986328125, -0.56591796875, -0.533203125, -0.50048828125, -0.4677734375, -0.43505859375, -0.40234375, -0.36962890625, -0.3369140625, -0.30419921875, -0.271484375, -0.23876953125, -0.2060546875, -0.17333984375, -0.140625, -0.10791015625, -0.0751953125, -0.04248046875, -0.009765625, 0.02294921875, 0.0556640625, 0.08837890625, 0.12109375, 0.15380859375, 0.1865234375, 0.21923828125, 0.251953125, 0.28466796875, 0.3173828125, 0.35009765625, 0.3828125, 0.41552734375, 0.4482421875, 0.48095703125, 0.513671875, 0.54638671875, 0.5791015625, 0.61181640625, 0.64453125, 0.67724609375, 0.7099609375, 0.74267578125, 0.775390625, 0.80810546875, 0.8408203125, 0.87353515625, 0.90625, 0.93896484375, 0.9716796875, 1.00439453125, 1.037109375, 1.06982421875, 1.1025390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 4.0, 8.0, 5.0, 14.0, 14.0, 13.0, 22.0, 21.0, 15.0, 24.0, 20.0, 30.0, 34.0, 30.0, 30.0, 42.0, 36.0, 34.0, 29.0, 36.0, 43.0, 30.0, 35.0, 34.0, 29.0, 36.0, 35.0, 31.0, 31.0, 34.0, 25.0, 19.0, 15.0, 20.0, 21.0, 13.0, 14.0, 9.0, 9.0, 10.0, 8.0, 10.0, 8.0, 5.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.6951446533203125, -1.640289306640625, -1.5854339599609375, -1.53057861328125, -1.4757232666015625, -1.420867919921875, -1.3660125732421875, -1.3111572265625, -1.2563018798828125, -1.201446533203125, -1.1465911865234375, -1.09173583984375, -1.0368804931640625, -0.982025146484375, -0.9271697998046875, -0.872314453125, -0.8174591064453125, -0.762603759765625, -0.7077484130859375, -0.65289306640625, -0.5980377197265625, -0.543182373046875, -0.4883270263671875, -0.4334716796875, -0.3786163330078125, -0.323760986328125, -0.2689056396484375, -0.21405029296875, -0.1591949462890625, -0.104339599609375, -0.0494842529296875, 0.00537109375, 0.0602264404296875, 0.115081787109375, 0.1699371337890625, 0.22479248046875, 0.2796478271484375, 0.334503173828125, 0.3893585205078125, 0.4442138671875, 0.4990692138671875, 0.553924560546875, 0.6087799072265625, 0.66363525390625, 0.7184906005859375, 0.773345947265625, 0.8282012939453125, 0.883056640625, 0.9379119873046875, 0.992767333984375, 1.0476226806640625, 1.10247802734375, 1.1573333740234375, 1.212188720703125, 1.2670440673828125, 1.3218994140625, 1.3767547607421875, 1.431610107421875, 1.4864654541015625, 1.54132080078125, 1.5961761474609375, 1.651031494140625, 1.7058868408203125, 1.7607421875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 2.0, 5.0, 13.0, 8.0, 17.0, 27.0, 41.0, 45.0, 52.0, 75.0, 95.0, 166.0, 267.0, 347.0, 566.0, 726.0, 1188.0, 1758.0, 2726.0, 4350.0, 7189.0, 12202.0, 22586.0, 81549.0, 834490.0, 35479.0, 16747.0, 9663.0, 5644.0, 3639.0, 2321.0, 1483.0, 988.0, 660.0, 424.0, 305.0, 211.0, 152.0, 95.0, 65.0, 49.0, 35.0, 32.0, 21.0, 13.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.259033203125, -0.24953460693359375, -0.2400360107421875, -0.23053741455078125, -0.221038818359375, -0.21154022216796875, -0.2020416259765625, -0.19254302978515625, -0.18304443359375, -0.17354583740234375, -0.1640472412109375, -0.15454864501953125, -0.145050048828125, -0.13555145263671875, -0.1260528564453125, -0.11655426025390625, -0.1070556640625, -0.09755706787109375, -0.0880584716796875, -0.07855987548828125, -0.069061279296875, -0.05956268310546875, -0.0500640869140625, -0.04056549072265625, -0.03106689453125, -0.02156829833984375, -0.0120697021484375, -0.00257110595703125, 0.006927490234375, 0.01642608642578125, 0.0259246826171875, 0.03542327880859375, 0.044921875, 0.05442047119140625, 0.0639190673828125, 0.07341766357421875, 0.082916259765625, 0.09241485595703125, 0.1019134521484375, 0.11141204833984375, 0.12091064453125, 0.13040924072265625, 0.1399078369140625, 0.14940643310546875, 0.158905029296875, 0.16840362548828125, 0.1779022216796875, 0.18740081787109375, 0.1968994140625, 0.20639801025390625, 0.2158966064453125, 0.22539520263671875, 0.234893798828125, 0.24439239501953125, 0.2538909912109375, 0.26338958740234375, 0.27288818359375, 0.28238677978515625, 0.2918853759765625, 0.30138397216796875, 0.310882568359375, 0.32038116455078125, 0.3298797607421875, 0.33937835693359375, 0.348876953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 6.0, 11.0, 17.0, 21.0, 19.0, 25.0, 18.0, 26.0, 19.0, 39.0, 32.0, 43.0, 40.0, 43.0, 35.0, 53.0, 37.0, 56.0, 42.0, 55.0, 40.0, 43.0, 45.0, 34.0, 26.0, 26.0, 24.0, 18.0, 17.0, 6.0, 13.0, 13.0, 14.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.562999725341797e-05, -2.470053732395172e-05, -2.3771077394485474e-05, -2.2841617465019226e-05, -2.191215753555298e-05, -2.098269760608673e-05, -2.0053237676620483e-05, -1.9123777747154236e-05, -1.8194317817687988e-05, -1.726485788822174e-05, -1.6335397958755493e-05, -1.5405938029289246e-05, -1.4476478099822998e-05, -1.354701817035675e-05, -1.2617558240890503e-05, -1.1688098311424255e-05, -1.0758638381958008e-05, -9.82917845249176e-06, -8.899718523025513e-06, -7.970258593559265e-06, -7.040798664093018e-06, -6.11133873462677e-06, -5.1818788051605225e-06, -4.252418875694275e-06, -3.3229589462280273e-06, -2.3934990167617798e-06, -1.4640390872955322e-06, -5.345791578292847e-07, 3.948807716369629e-07, 1.3243407011032104e-06, 2.253800630569458e-06, 3.1832605600357056e-06, 4.112720489501953e-06, 5.042180418968201e-06, 5.971640348434448e-06, 6.901100277900696e-06, 7.830560207366943e-06, 8.760020136833191e-06, 9.689480066299438e-06, 1.0618939995765686e-05, 1.1548399925231934e-05, 1.2477859854698181e-05, 1.3407319784164429e-05, 1.4336779713630676e-05, 1.5266239643096924e-05, 1.619569957256317e-05, 1.712515950202942e-05, 1.8054619431495667e-05, 1.8984079360961914e-05, 1.991353929042816e-05, 2.084299921989441e-05, 2.1772459149360657e-05, 2.2701919078826904e-05, 2.3631379008293152e-05, 2.45608389377594e-05, 2.5490298867225647e-05, 2.6419758796691895e-05, 2.7349218726158142e-05, 2.827867865562439e-05, 2.9208138585090637e-05, 3.0137598514556885e-05, 3.106705844402313e-05, 3.199651837348938e-05, 3.292597830295563e-05, 3.3855438232421875e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 23.0, 29.0, 40.0, 61.0, 68.0, 111.0, 172.0, 255.0, 422.0, 757.0, 1277.0, 2200.0, 3683.0, 6939.0, 13388.0, 27587.0, 58850.0, 130249.0, 254678.0, 271229.0, 146350.0, 66656.0, 30960.0, 15126.0, 7651.0, 4123.0, 2271.0, 1280.0, 823.0, 473.0, 291.0, 167.0, 126.0, 78.0, 50.0, 25.0, 15.0, 16.0, 5.0, 7.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.1693115234375, -0.16434288024902344, -0.15937423706054688, -0.1544055938720703, -0.14943695068359375, -0.1444683074951172, -0.13949966430664062, -0.13453102111816406, -0.1295623779296875, -0.12459373474121094, -0.11962509155273438, -0.11465644836425781, -0.10968780517578125, -0.10471916198730469, -0.09975051879882812, -0.09478187561035156, -0.089813232421875, -0.08484458923339844, -0.07987594604492188, -0.07490730285644531, -0.06993865966796875, -0.06497001647949219, -0.060001373291015625, -0.05503273010253906, -0.0500640869140625, -0.04509544372558594, -0.040126800537109375, -0.03515815734863281, -0.03018951416015625, -0.025220870971679688, -0.020252227783203125, -0.015283584594726562, -0.01031494140625, -0.0053462982177734375, -0.000377655029296875, 0.0045909881591796875, 0.00955963134765625, 0.014528274536132812, 0.019496917724609375, 0.024465560913085938, 0.0294342041015625, 0.03440284729003906, 0.039371490478515625, 0.04434013366699219, 0.04930877685546875, 0.05427742004394531, 0.059246063232421875, 0.06421470642089844, 0.069183349609375, 0.07415199279785156, 0.07912063598632812, 0.08408927917480469, 0.08905792236328125, 0.09402656555175781, 0.09899520874023438, 0.10396385192871094, 0.1089324951171875, 0.11390113830566406, 0.11886978149414062, 0.12383842468261719, 0.12880706787109375, 0.1337757110595703, 0.13874435424804688, 0.14371299743652344, 0.148681640625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 7.0, 16.0, 14.0, 10.0, 15.0, 16.0, 24.0, 29.0, 43.0, 62.0, 54.0, 76.0, 69.0, 85.0, 76.0, 56.0, 58.0, 54.0, 45.0, 22.0, 33.0, 18.0, 25.0, 20.0, 17.0, 10.0, 11.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06414794921875, -0.06186485290527344, -0.059581756591796875, -0.05729866027832031, -0.05501556396484375, -0.05273246765136719, -0.050449371337890625, -0.04816627502441406, -0.0458831787109375, -0.04360008239746094, -0.041316986083984375, -0.03903388977050781, -0.03675079345703125, -0.03446769714355469, -0.032184600830078125, -0.029901504516601562, -0.027618408203125, -0.025335311889648438, -0.023052215576171875, -0.020769119262695312, -0.01848602294921875, -0.016202926635742188, -0.013919830322265625, -0.011636734008789062, -0.0093536376953125, -0.0070705413818359375, -0.004787445068359375, -0.0025043487548828125, -0.00022125244140625, 0.0020618438720703125, 0.004344940185546875, 0.0066280364990234375, 0.0089111328125, 0.011194229125976562, 0.013477325439453125, 0.015760421752929688, 0.01804351806640625, 0.020326614379882812, 0.022609710693359375, 0.024892807006835938, 0.0271759033203125, 0.029458999633789062, 0.031742095947265625, 0.03402519226074219, 0.03630828857421875, 0.03859138488769531, 0.040874481201171875, 0.04315757751464844, 0.045440673828125, 0.04772377014160156, 0.050006866455078125, 0.05228996276855469, 0.05457305908203125, 0.05685615539550781, 0.059139251708984375, 0.06142234802246094, 0.0637054443359375, 0.06598854064941406, 0.06827163696289062, 0.07055473327636719, 0.07283782958984375, 0.07512092590332031, 0.07740402221679688, 0.07968711853027344, 0.08197021484375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 9.0, 6.0, 10.0, 10.0, 11.0, 18.0, 15.0, 25.0, 20.0, 39.0, 35.0, 50.0, 44.0, 51.0, 56.0, 46.0, 60.0, 53.0, 61.0, 44.0, 48.0, 34.0, 34.0, 32.0, 39.0, 18.0, 26.0, 22.0, 14.0, 9.0, 18.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2084171772003174, -3.0880517959594727, -2.967686653137207, -2.8473212718963623, -2.7269558906555176, -2.606590747833252, -2.4862253665924072, -2.3658599853515625, -2.245494842529297, -2.125129461288452, -2.0047643184661865, -1.8843989372253418, -1.764033555984497, -1.643668293952942, -1.5233030319213867, -1.402937650680542, -1.2825722694396973, -1.162207007408142, -1.0418416261672974, -0.9214763641357422, -0.8011110424995422, -0.6807457208633423, -0.5603804588317871, -0.44001513719558716, -0.3196498155593872, -0.19928450882434845, -0.07891920208930969, 0.04144608974456787, 0.16181141138076782, 0.2821767330169678, 0.40254199504852295, 0.5229073166847229, 0.643272876739502, 0.7636381983757019, 0.8840035200119019, 1.004368782043457, 1.1247341632843018, 1.245099425315857, 1.365464687347412, 1.4858300685882568, 1.606195330619812, 1.7265605926513672, 1.846925973892212, 1.967291235923767, 2.0876564979553223, 2.208021879196167, 2.3283872604370117, 2.4487524032592773, 2.569117784500122, 2.689483165740967, 2.8098483085632324, 2.930213689804077, 3.050579071044922, 3.1709442138671875, 3.2913095951080322, 3.411674976348877, 3.5320401191711426, 3.6524055004119873, 3.772770643234253, 3.8931360244750977, 4.013501167297363, 4.133866786956787, 4.254231929779053, 4.374597072601318, 4.494962692260742]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 8.0, 9.0, 12.0, 6.0, 8.0, 10.0, 16.0, 17.0, 14.0, 26.0, 14.0, 19.0, 27.0, 40.0, 33.0, 30.0, 30.0, 29.0, 37.0, 40.0, 49.0, 50.0, 42.0, 26.0, 30.0, 31.0, 39.0, 33.0, 31.0, 36.0, 24.0, 17.0, 14.0, 18.0, 23.0, 22.0, 18.0, 10.0, 12.0, 11.0, 7.0, 6.0, 5.0, 10.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-2.064056634902954, -1.9949069023132324, -1.9257571697235107, -1.856607437133789, -1.7874577045440674, -1.7183079719543457, -1.649158239364624, -1.5800085067749023, -1.5108587741851807, -1.441709041595459, -1.3725593090057373, -1.3034095764160156, -1.234259843826294, -1.1651101112365723, -1.0959603786468506, -1.026810646057129, -0.9576607942581177, -0.888511061668396, -0.8193613290786743, -0.7502115964889526, -0.681061863899231, -0.6119121313095093, -0.5427623391151428, -0.47361260652542114, -0.40446287393569946, -0.3353131413459778, -0.2661634087562561, -0.19701364636421204, -0.12786391377449036, -0.05871418118476868, 0.01043558120727539, 0.07958531379699707, 0.14873504638671875, 0.21788477897644043, 0.2870345115661621, 0.3561842739582062, 0.42533400654792786, 0.49448373913764954, 0.5636335015296936, 0.6327832341194153, 0.701932966709137, 0.7710826992988586, 0.8402324318885803, 0.9093822240829468, 0.9785319566726685, 1.0476816892623901, 1.1168314218521118, 1.1859811544418335, 1.2551308870315552, 1.3242806196212769, 1.3934303522109985, 1.4625800848007202, 1.531729817390442, 1.6008795499801636, 1.6700294017791748, 1.7391791343688965, 1.8083288669586182, 1.8774785995483398, 1.9466283321380615, 2.015778064727783, 2.084927797317505, 2.1540775299072266, 2.2232272624969482, 2.29237699508667, 2.3615267276763916]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 14.0, 19.0, 21.0, 34.0, 57.0, 84.0, 104.0, 166.0, 259.0, 423.0, 609.0, 913.0, 1560.0, 2424.0, 4022.0, 6612.0, 11138.0, 18550.0, 31169.0, 49787.0, 76607.0, 108486.0, 137858.0, 150213.0, 137697.0, 108016.0, 76042.0, 48777.0, 30343.0, 18343.0, 11057.0, 6567.0, 3908.0, 2419.0, 1487.0, 921.0, 591.0, 397.0, 284.0, 189.0, 126.0, 65.0, 73.0, 33.0, 27.0, 16.0, 16.0, 11.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.451171875, -2.373321533203125, -2.29547119140625, -2.217620849609375, -2.1397705078125, -2.061920166015625, -1.98406982421875, -1.906219482421875, -1.828369140625, -1.750518798828125, -1.67266845703125, -1.594818115234375, -1.5169677734375, -1.439117431640625, -1.36126708984375, -1.283416748046875, -1.20556640625, -1.127716064453125, -1.04986572265625, -0.972015380859375, -0.8941650390625, -0.816314697265625, -0.73846435546875, -0.660614013671875, -0.582763671875, -0.504913330078125, -0.42706298828125, -0.349212646484375, -0.2713623046875, -0.193511962890625, -0.11566162109375, -0.037811279296875, 0.0400390625, 0.117889404296875, 0.19573974609375, 0.273590087890625, 0.3514404296875, 0.429290771484375, 0.50714111328125, 0.584991455078125, 0.662841796875, 0.740692138671875, 0.81854248046875, 0.896392822265625, 0.9742431640625, 1.052093505859375, 1.12994384765625, 1.207794189453125, 1.28564453125, 1.363494873046875, 1.44134521484375, 1.519195556640625, 1.5970458984375, 1.674896240234375, 1.75274658203125, 1.830596923828125, 1.908447265625, 1.986297607421875, 2.06414794921875, 2.141998291015625, 2.2198486328125, 2.297698974609375, 2.37554931640625, 2.453399658203125, 2.53125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 4.0, 10.0, 11.0, 10.0, 8.0, 17.0, 24.0, 20.0, 24.0, 22.0, 18.0, 33.0, 19.0, 35.0, 39.0, 26.0, 49.0, 46.0, 50.0, 41.0, 39.0, 29.0, 39.0, 43.0, 32.0, 30.0, 29.0, 28.0, 23.0, 28.0, 27.0, 18.0, 14.0, 19.0, 14.0, 13.0, 11.0, 9.0, 11.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-2.333984375, -2.254425048828125, -2.17486572265625, -2.095306396484375, -2.0157470703125, -1.936187744140625, -1.85662841796875, -1.777069091796875, -1.697509765625, -1.617950439453125, -1.53839111328125, -1.458831787109375, -1.3792724609375, -1.299713134765625, -1.22015380859375, -1.140594482421875, -1.06103515625, -0.981475830078125, -0.90191650390625, -0.822357177734375, -0.7427978515625, -0.663238525390625, -0.58367919921875, -0.504119873046875, -0.424560546875, -0.345001220703125, -0.26544189453125, -0.185882568359375, -0.1063232421875, -0.026763916015625, 0.05279541015625, 0.132354736328125, 0.2119140625, 0.291473388671875, 0.37103271484375, 0.450592041015625, 0.5301513671875, 0.609710693359375, 0.68927001953125, 0.768829345703125, 0.848388671875, 0.927947998046875, 1.00750732421875, 1.087066650390625, 1.1666259765625, 1.246185302734375, 1.32574462890625, 1.405303955078125, 1.48486328125, 1.564422607421875, 1.64398193359375, 1.723541259765625, 1.8031005859375, 1.882659912109375, 1.96221923828125, 2.041778564453125, 2.121337890625, 2.200897216796875, 2.28045654296875, 2.360015869140625, 2.4395751953125, 2.519134521484375, 2.59869384765625, 2.678253173828125, 2.7578125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 15.0, 28.0, 41.0, 60.0, 97.0, 127.0, 228.0, 310.0, 407.0, 718.0, 1129.0, 1664.0, 2514.0, 3922.0, 5911.0, 8993.0, 14307.0, 21533.0, 32764.0, 47827.0, 69122.0, 93037.0, 115252.0, 129046.0, 125140.0, 107743.0, 83663.0, 60639.0, 41578.0, 27840.0, 18275.0, 11956.0, 7723.0, 5136.0, 3386.0, 2207.0, 1447.0, 927.0, 562.0, 420.0, 266.0, 175.0, 125.0, 104.0, 63.0, 36.0, 31.0, 13.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0], "bins": [-2.25, -2.181427001953125, -2.11285400390625, -2.044281005859375, -1.9757080078125, -1.907135009765625, -1.83856201171875, -1.769989013671875, -1.701416015625, -1.632843017578125, -1.56427001953125, -1.495697021484375, -1.4271240234375, -1.358551025390625, -1.28997802734375, -1.221405029296875, -1.15283203125, -1.084259033203125, -1.01568603515625, -0.947113037109375, -0.8785400390625, -0.809967041015625, -0.74139404296875, -0.672821044921875, -0.604248046875, -0.535675048828125, -0.46710205078125, -0.398529052734375, -0.3299560546875, -0.261383056640625, -0.19281005859375, -0.124237060546875, -0.0556640625, 0.012908935546875, 0.08148193359375, 0.150054931640625, 0.2186279296875, 0.287200927734375, 0.35577392578125, 0.424346923828125, 0.492919921875, 0.561492919921875, 0.63006591796875, 0.698638916015625, 0.7672119140625, 0.835784912109375, 0.90435791015625, 0.972930908203125, 1.04150390625, 1.110076904296875, 1.17864990234375, 1.247222900390625, 1.3157958984375, 1.384368896484375, 1.45294189453125, 1.521514892578125, 1.590087890625, 1.658660888671875, 1.72723388671875, 1.795806884765625, 1.8643798828125, 1.932952880859375, 2.00152587890625, 2.070098876953125, 2.138671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 3.0, 3.0, 4.0, 6.0, 11.0, 11.0, 13.0, 18.0, 16.0, 20.0, 26.0, 29.0, 18.0, 37.0, 40.0, 50.0, 48.0, 31.0, 43.0, 44.0, 37.0, 47.0, 48.0, 41.0, 42.0, 48.0, 35.0, 33.0, 36.0, 18.0, 25.0, 22.0, 22.0, 16.0, 11.0, 8.0, 9.0, 4.0, 8.0, 12.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.770233154296875, -1.71234130859375, -1.654449462890625, -1.5965576171875, -1.538665771484375, -1.48077392578125, -1.422882080078125, -1.364990234375, -1.307098388671875, -1.24920654296875, -1.191314697265625, -1.1334228515625, -1.075531005859375, -1.01763916015625, -0.959747314453125, -0.90185546875, -0.843963623046875, -0.78607177734375, -0.728179931640625, -0.6702880859375, -0.612396240234375, -0.55450439453125, -0.496612548828125, -0.438720703125, -0.380828857421875, -0.32293701171875, -0.265045166015625, -0.2071533203125, -0.149261474609375, -0.09136962890625, -0.033477783203125, 0.0244140625, 0.082305908203125, 0.14019775390625, 0.198089599609375, 0.2559814453125, 0.313873291015625, 0.37176513671875, 0.429656982421875, 0.487548828125, 0.545440673828125, 0.60333251953125, 0.661224365234375, 0.7191162109375, 0.777008056640625, 0.83489990234375, 0.892791748046875, 0.95068359375, 1.008575439453125, 1.06646728515625, 1.124359130859375, 1.1822509765625, 1.240142822265625, 1.29803466796875, 1.355926513671875, 1.413818359375, 1.471710205078125, 1.52960205078125, 1.587493896484375, 1.6453857421875, 1.703277587890625, 1.76116943359375, 1.819061279296875, 1.876953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 13.0, 14.0, 23.0, 29.0, 43.0, 64.0, 93.0, 154.0, 256.0, 403.0, 656.0, 1166.0, 1897.0, 3336.0, 5876.0, 10222.0, 18268.0, 32339.0, 56490.0, 93837.0, 143808.0, 182255.0, 174814.0, 129306.0, 81618.0, 48177.0, 27264.0, 15309.0, 8828.0, 4834.0, 2949.0, 1652.0, 989.0, 588.0, 362.0, 218.0, 145.0, 81.0, 58.0, 42.0, 19.0, 19.0, 14.0, 3.0, 12.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.5177154541015625, -1.465118408203125, -1.4125213623046875, -1.35992431640625, -1.3073272705078125, -1.254730224609375, -1.2021331787109375, -1.1495361328125, -1.0969390869140625, -1.044342041015625, -0.9917449951171875, -0.93914794921875, -0.8865509033203125, -0.833953857421875, -0.7813568115234375, -0.728759765625, -0.6761627197265625, -0.623565673828125, -0.5709686279296875, -0.51837158203125, -0.4657745361328125, -0.413177490234375, -0.3605804443359375, -0.3079833984375, -0.2553863525390625, -0.202789306640625, -0.1501922607421875, -0.09759521484375, -0.0449981689453125, 0.007598876953125, 0.0601959228515625, 0.11279296875, 0.1653900146484375, 0.217987060546875, 0.2705841064453125, 0.32318115234375, 0.3757781982421875, 0.428375244140625, 0.4809722900390625, 0.5335693359375, 0.5861663818359375, 0.638763427734375, 0.6913604736328125, 0.74395751953125, 0.7965545654296875, 0.849151611328125, 0.9017486572265625, 0.954345703125, 1.0069427490234375, 1.059539794921875, 1.1121368408203125, 1.16473388671875, 1.2173309326171875, 1.269927978515625, 1.3225250244140625, 1.3751220703125, 1.4277191162109375, 1.480316162109375, 1.5329132080078125, 1.58551025390625, 1.6381072998046875, 1.690704345703125, 1.7433013916015625, 1.7958984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 3.0, 6.0, 11.0, 14.0, 15.0, 13.0, 22.0, 31.0, 26.0, 36.0, 40.0, 39.0, 48.0, 39.0, 55.0, 41.0, 59.0, 45.0, 49.0, 54.0, 48.0, 41.0, 35.0, 36.0, 26.0, 25.0, 24.0, 16.0, 17.0, 18.0, 12.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001214146614074707, -0.00011733081191778183, -0.00011324696242809296, -0.00010916311293840408, -0.00010507926344871521, -0.00010099541395902634, -9.691156446933746e-05, -9.282771497964859e-05, -8.874386548995972e-05, -8.466001600027084e-05, -8.057616651058197e-05, -7.64923170208931e-05, -7.240846753120422e-05, -6.832461804151535e-05, -6.424076855182648e-05, -6.0156919062137604e-05, -5.607306957244873e-05, -5.198922008275986e-05, -4.7905370593070984e-05, -4.382152110338211e-05, -3.973767161369324e-05, -3.5653822124004364e-05, -3.156997263431549e-05, -2.7486123144626617e-05, -2.3402273654937744e-05, -1.931842416524887e-05, -1.5234574675559998e-05, -1.1150725185871124e-05, -7.066875696182251e-06, -2.9830262064933777e-06, 1.1008232831954956e-06, 5.184672772884369e-06, 9.268522262573242e-06, 1.3352371752262115e-05, 1.743622124195099e-05, 2.1520070731639862e-05, 2.5603920221328735e-05, 2.968776971101761e-05, 3.377161920070648e-05, 3.7855468690395355e-05, 4.193931818008423e-05, 4.60231676697731e-05, 5.0107017159461975e-05, 5.419086664915085e-05, 5.827471613883972e-05, 6.23585656285286e-05, 6.644241511821747e-05, 7.052626460790634e-05, 7.461011409759521e-05, 7.869396358728409e-05, 8.277781307697296e-05, 8.686166256666183e-05, 9.094551205635071e-05, 9.502936154603958e-05, 9.911321103572845e-05, 0.00010319706052541733, 0.0001072809100151062, 0.00011136475950479507, 0.00011544860899448395, 0.00011953245848417282, 0.0001236163079738617, 0.00012770015746355057, 0.00013178400695323944, 0.00013586785644292831, 0.0001399517059326172]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 14.0, 22.0, 42.0, 46.0, 97.0, 139.0, 205.0, 343.0, 547.0, 880.0, 1436.0, 2382.0, 4010.0, 6724.0, 10976.0, 18127.0, 30230.0, 49581.0, 76893.0, 113280.0, 148222.0, 160438.0, 140719.0, 103589.0, 69046.0, 43475.0, 26562.0, 16209.0, 9600.0, 5827.0, 3471.0, 2056.0, 1290.0, 749.0, 459.0, 303.0, 203.0, 134.0, 83.0, 40.0, 44.0, 15.0, 12.0, 13.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.3618621826171875, -1.318450927734375, -1.2750396728515625, -1.23162841796875, -1.1882171630859375, -1.144805908203125, -1.1013946533203125, -1.0579833984375, -1.0145721435546875, -0.971160888671875, -0.9277496337890625, -0.88433837890625, -0.8409271240234375, -0.797515869140625, -0.7541046142578125, -0.710693359375, -0.6672821044921875, -0.623870849609375, -0.5804595947265625, -0.53704833984375, -0.4936370849609375, -0.450225830078125, -0.4068145751953125, -0.3634033203125, -0.3199920654296875, -0.276580810546875, -0.2331695556640625, -0.18975830078125, -0.1463470458984375, -0.102935791015625, -0.0595245361328125, -0.01611328125, 0.0272979736328125, 0.070709228515625, 0.1141204833984375, 0.15753173828125, 0.2009429931640625, 0.244354248046875, 0.2877655029296875, 0.3311767578125, 0.3745880126953125, 0.417999267578125, 0.4614105224609375, 0.50482177734375, 0.5482330322265625, 0.591644287109375, 0.6350555419921875, 0.678466796875, 0.7218780517578125, 0.765289306640625, 0.8087005615234375, 0.85211181640625, 0.8955230712890625, 0.938934326171875, 0.9823455810546875, 1.0257568359375, 1.0691680908203125, 1.112579345703125, 1.1559906005859375, 1.19940185546875, 1.2428131103515625, 1.286224365234375, 1.3296356201171875, 1.373046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 9.0, 9.0, 5.0, 16.0, 13.0, 17.0, 22.0, 28.0, 23.0, 41.0, 40.0, 33.0, 41.0, 52.0, 41.0, 43.0, 56.0, 47.0, 54.0, 53.0, 47.0, 47.0, 37.0, 34.0, 35.0, 34.0, 22.0, 17.0, 18.0, 9.0, 16.0, 10.0, 9.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.359283447265625, -0.34600830078125, -0.332733154296875, -0.3194580078125, -0.306182861328125, -0.29290771484375, -0.279632568359375, -0.266357421875, -0.253082275390625, -0.23980712890625, -0.226531982421875, -0.2132568359375, -0.199981689453125, -0.18670654296875, -0.173431396484375, -0.16015625, -0.146881103515625, -0.13360595703125, -0.120330810546875, -0.1070556640625, -0.093780517578125, -0.08050537109375, -0.067230224609375, -0.053955078125, -0.040679931640625, -0.02740478515625, -0.014129638671875, -0.0008544921875, 0.012420654296875, 0.02569580078125, 0.038970947265625, 0.05224609375, 0.065521240234375, 0.07879638671875, 0.092071533203125, 0.1053466796875, 0.118621826171875, 0.13189697265625, 0.145172119140625, 0.158447265625, 0.171722412109375, 0.18499755859375, 0.198272705078125, 0.2115478515625, 0.224822998046875, 0.23809814453125, 0.251373291015625, 0.2646484375, 0.277923583984375, 0.29119873046875, 0.304473876953125, 0.3177490234375, 0.331024169921875, 0.34429931640625, 0.357574462890625, 0.370849609375, 0.384124755859375, 0.39739990234375, 0.410675048828125, 0.4239501953125, 0.437225341796875, 0.45050048828125, 0.463775634765625, 0.47705078125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 4.0, 14.0, 11.0, 9.0, 15.0, 18.0, 13.0, 17.0, 31.0, 27.0, 41.0, 43.0, 42.0, 55.0, 63.0, 61.0, 68.0, 61.0, 58.0, 45.0, 61.0, 31.0, 35.0, 25.0, 29.0, 32.0, 27.0, 16.0, 10.0, 7.0, 4.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.737412691116333, -3.605987548828125, -3.474562406539917, -3.343137264251709, -3.211712121963501, -3.080286979675293, -2.948861837387085, -2.817436695098877, -2.686011552810669, -2.554586410522461, -2.423161268234253, -2.291736125946045, -2.160310983657837, -2.028885841369629, -1.897460699081421, -1.766035556793213, -1.6346104145050049, -1.5031852722167969, -1.3717601299285889, -1.2403349876403809, -1.1089098453521729, -0.9774847030639648, -0.8460595607757568, -0.7146344184875488, -0.5832092761993408, -0.4517841339111328, -0.3203589916229248, -0.1889338493347168, -0.05750870704650879, 0.07391643524169922, 0.20534157752990723, 0.33676671981811523, 0.46819162368774414, 0.5996167659759521, 0.7310419082641602, 0.8624670505523682, 0.9938921928405762, 1.1253173351287842, 1.2567424774169922, 1.3881676197052002, 1.5195927619934082, 1.6510179042816162, 1.7824430465698242, 1.9138681888580322, 2.0452933311462402, 2.1767184734344482, 2.3081436157226562, 2.4395687580108643, 2.5709939002990723, 2.7024190425872803, 2.8338441848754883, 2.9652693271636963, 3.0966944694519043, 3.2281196117401123, 3.3595447540283203, 3.4909698963165283, 3.6223950386047363, 3.7538201808929443, 3.8852453231811523, 4.016670227050781, 4.148095607757568, 4.2795209884643555, 4.410945892333984, 4.542370796203613, 4.6737961769104]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 9.0, 9.0, 7.0, 9.0, 9.0, 14.0, 12.0, 24.0, 22.0, 30.0, 31.0, 25.0, 35.0, 35.0, 35.0, 40.0, 36.0, 33.0, 30.0, 39.0, 32.0, 44.0, 47.0, 49.0, 44.0, 37.0, 25.0, 27.0, 27.0, 19.0, 27.0, 15.0, 13.0, 17.0, 20.0, 11.0, 14.0, 6.0, 7.0, 4.0, 9.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0968737602233887, -2.024630546569824, -1.9523870944976807, -1.8801438808441162, -1.8079005479812622, -1.7356572151184082, -1.6634140014648438, -1.5911706686019897, -1.5189273357391357, -1.4466840028762817, -1.3744406700134277, -1.3021974563598633, -1.2299541234970093, -1.1577107906341553, -1.0854675769805908, -1.0132242441177368, -0.9409809112548828, -0.8687375783920288, -0.7964943051338196, -0.7242510318756104, -0.6520076990127563, -0.5797643661499023, -0.5075210928916931, -0.4352778196334839, -0.3630344867706299, -0.29079118371009827, -0.21854788064956665, -0.14630457758903503, -0.07406127452850342, -0.0018179714679718018, 0.07042533159255981, 0.14266860485076904, 0.21491169929504395, 0.28715500235557556, 0.3593983054161072, 0.4316416084766388, 0.5038849115371704, 0.5761282444000244, 0.6483715176582336, 0.7206147909164429, 0.7928581237792969, 0.8651014566421509, 0.9373447299003601, 1.0095880031585693, 1.0818313360214233, 1.1540746688842773, 1.2263178825378418, 1.2985612154006958, 1.3708045482635498, 1.4430478811264038, 1.5152912139892578, 1.5875344276428223, 1.6597777605056763, 1.7320210933685303, 1.8042643070220947, 1.8765076398849487, 1.9487509727478027, 2.020994186401367, 2.0932376384735107, 2.165480852127075, 2.2377243041992188, 2.309967517852783, 2.3822107315063477, 2.454453945159912, 2.5266973972320557]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 15.0, 15.0, 31.0, 53.0, 50.0, 84.0, 107.0, 164.0, 243.0, 360.0, 595.0, 951.0, 1362.0, 2329.0, 3856.0, 6858.0, 12539.0, 23711.0, 47416.0, 100038.0, 229439.0, 552685.0, 1117856.0, 1118593.0, 544901.0, 225033.0, 100026.0, 47521.0, 24514.0, 13433.0, 7620.0, 4376.0, 2776.0, 1663.0, 1092.0, 682.0, 473.0, 284.0, 187.0, 130.0, 73.0, 49.0, 28.0, 19.0, 13.0, 10.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40234375, -4.26031494140625, -4.1182861328125, -3.97625732421875, -3.834228515625, -3.69219970703125, -3.5501708984375, -3.40814208984375, -3.26611328125, -3.12408447265625, -2.9820556640625, -2.84002685546875, -2.697998046875, -2.55596923828125, -2.4139404296875, -2.27191162109375, -2.1298828125, -1.98785400390625, -1.8458251953125, -1.70379638671875, -1.561767578125, -1.41973876953125, -1.2777099609375, -1.13568115234375, -0.99365234375, -0.85162353515625, -0.7095947265625, -0.56756591796875, -0.425537109375, -0.28350830078125, -0.1414794921875, 0.00054931640625, 0.142578125, 0.28460693359375, 0.4266357421875, 0.56866455078125, 0.710693359375, 0.85272216796875, 0.9947509765625, 1.13677978515625, 1.27880859375, 1.42083740234375, 1.5628662109375, 1.70489501953125, 1.846923828125, 1.98895263671875, 2.1309814453125, 2.27301025390625, 2.4150390625, 2.55706787109375, 2.6990966796875, 2.84112548828125, 2.983154296875, 3.12518310546875, 3.2672119140625, 3.40924072265625, 3.55126953125, 3.69329833984375, 3.8353271484375, 3.97735595703125, 4.119384765625, 4.26141357421875, 4.4034423828125, 4.54547119140625, 4.6875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 11.0, 5.0, 7.0, 17.0, 16.0, 10.0, 26.0, 18.0, 17.0, 37.0, 34.0, 29.0, 45.0, 42.0, 34.0, 38.0, 45.0, 40.0, 46.0, 40.0, 46.0, 54.0, 44.0, 22.0, 29.0, 28.0, 27.0, 24.0, 24.0, 25.0, 27.0, 13.0, 16.0, 14.0, 11.0, 10.0, 4.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7919921875, -1.734954833984375, -1.67791748046875, -1.620880126953125, -1.5638427734375, -1.506805419921875, -1.44976806640625, -1.392730712890625, -1.335693359375, -1.278656005859375, -1.22161865234375, -1.164581298828125, -1.1075439453125, -1.050506591796875, -0.99346923828125, -0.936431884765625, -0.87939453125, -0.822357177734375, -0.76531982421875, -0.708282470703125, -0.6512451171875, -0.594207763671875, -0.53717041015625, -0.480133056640625, -0.423095703125, -0.366058349609375, -0.30902099609375, -0.251983642578125, -0.1949462890625, -0.137908935546875, -0.08087158203125, -0.023834228515625, 0.033203125, 0.090240478515625, 0.14727783203125, 0.204315185546875, 0.2613525390625, 0.318389892578125, 0.37542724609375, 0.432464599609375, 0.489501953125, 0.546539306640625, 0.60357666015625, 0.660614013671875, 0.7176513671875, 0.774688720703125, 0.83172607421875, 0.888763427734375, 0.94580078125, 1.002838134765625, 1.05987548828125, 1.116912841796875, 1.1739501953125, 1.230987548828125, 1.28802490234375, 1.345062255859375, 1.402099609375, 1.459136962890625, 1.51617431640625, 1.573211669921875, 1.6302490234375, 1.687286376953125, 1.74432373046875, 1.801361083984375, 1.8583984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 15.0, 20.0, 32.0, 57.0, 74.0, 131.0, 211.0, 321.0, 518.0, 853.0, 1404.0, 2213.0, 3707.0, 6283.0, 10778.0, 19348.0, 36010.0, 67104.0, 131689.0, 264487.0, 532742.0, 931319.0, 981830.0, 592995.0, 297473.0, 147644.0, 74988.0, 39427.0, 21663.0, 11878.0, 6744.0, 3924.0, 2364.0, 1483.0, 884.0, 566.0, 363.0, 256.0, 134.0, 88.0, 70.0, 49.0, 51.0, 21.0, 15.0, 16.0, 5.0, 7.0, 11.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.9658203125, -3.833984375, -3.7021484375, -3.5703125, -3.4384765625, -3.306640625, -3.1748046875, -3.04296875, -2.9111328125, -2.779296875, -2.6474609375, -2.515625, -2.3837890625, -2.251953125, -2.1201171875, -1.98828125, -1.8564453125, -1.724609375, -1.5927734375, -1.4609375, -1.3291015625, -1.197265625, -1.0654296875, -0.93359375, -0.8017578125, -0.669921875, -0.5380859375, -0.40625, -0.2744140625, -0.142578125, -0.0107421875, 0.12109375, 0.2529296875, 0.384765625, 0.5166015625, 0.6484375, 0.7802734375, 0.912109375, 1.0439453125, 1.17578125, 1.3076171875, 1.439453125, 1.5712890625, 1.703125, 1.8349609375, 1.966796875, 2.0986328125, 2.23046875, 2.3623046875, 2.494140625, 2.6259765625, 2.7578125, 2.8896484375, 3.021484375, 3.1533203125, 3.28515625, 3.4169921875, 3.548828125, 3.6806640625, 3.8125, 3.9443359375, 4.076171875, 4.2080078125, 4.33984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 8.0, 13.0, 6.0, 8.0, 21.0, 19.0, 11.0, 22.0, 35.0, 40.0, 39.0, 56.0, 63.0, 78.0, 86.0, 103.0, 143.0, 139.0, 176.0, 192.0, 193.0, 199.0, 215.0, 227.0, 224.0, 231.0, 199.0, 169.0, 151.0, 146.0, 146.0, 113.0, 108.0, 98.0, 80.0, 48.0, 45.0, 44.0, 40.0, 27.0, 26.0, 16.0, 17.0, 8.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.0107421875, -0.9813995361328125, -0.952056884765625, -0.9227142333984375, -0.89337158203125, -0.8640289306640625, -0.834686279296875, -0.8053436279296875, -0.7760009765625, -0.7466583251953125, -0.717315673828125, -0.6879730224609375, -0.65863037109375, -0.6292877197265625, -0.599945068359375, -0.5706024169921875, -0.541259765625, -0.5119171142578125, -0.482574462890625, -0.4532318115234375, -0.42388916015625, -0.3945465087890625, -0.365203857421875, -0.3358612060546875, -0.3065185546875, -0.2771759033203125, -0.247833251953125, -0.2184906005859375, -0.18914794921875, -0.1598052978515625, -0.130462646484375, -0.1011199951171875, -0.07177734375, -0.0424346923828125, -0.013092041015625, 0.0162506103515625, 0.04559326171875, 0.0749359130859375, 0.104278564453125, 0.1336212158203125, 0.1629638671875, 0.1923065185546875, 0.221649169921875, 0.2509918212890625, 0.28033447265625, 0.3096771240234375, 0.339019775390625, 0.3683624267578125, 0.397705078125, 0.4270477294921875, 0.456390380859375, 0.4857330322265625, 0.51507568359375, 0.5444183349609375, 0.573760986328125, 0.6031036376953125, 0.6324462890625, 0.6617889404296875, 0.691131591796875, 0.7204742431640625, 0.74981689453125, 0.7791595458984375, 0.808502197265625, 0.8378448486328125, 0.8671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 2.0, 10.0, 8.0, 12.0, 11.0, 16.0, 22.0, 34.0, 42.0, 42.0, 38.0, 56.0, 70.0, 49.0, 75.0, 72.0, 64.0, 66.0, 53.0, 52.0, 38.0, 35.0, 21.0, 25.0, 21.0, 18.0, 9.0, 8.0, 3.0, 11.0, 2.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.347010850906372, -3.201976776123047, -3.0569427013397217, -2.9119086265563965, -2.766874313354492, -2.621840476989746, -2.476806163787842, -2.3317720890045166, -2.1867380142211914, -2.041703939437866, -1.896669864654541, -1.7516356706619263, -1.606601595878601, -1.4615675210952759, -1.3165333271026611, -1.171499252319336, -1.0264651775360107, -0.8814311027526855, -0.7363969683647156, -0.5913628339767456, -0.4463287591934204, -0.3012946844100952, -0.15626055002212524, -0.011226415634155273, 0.13380765914916992, 0.2788417637348175, 0.4238758683204651, 0.5689100027084351, 0.7139440774917603, 0.8589781522750854, 1.0040123462677002, 1.1490464210510254, 1.2940807342529297, 1.4391148090362549, 1.58414888381958, 1.7291830778121948, 1.87421715259552, 2.0192513465881348, 2.16428542137146, 2.309319496154785, 2.4543535709381104, 2.5993876457214355, 2.7444217205047607, 2.889455795288086, 3.0344901084899902, 3.1795239448547363, 3.3245582580566406, 3.469592332839966, 3.614626407623291, 3.759660482406616, 3.9046945571899414, 4.049728870391846, 4.194762706756592, 4.339797019958496, 4.484830856323242, 4.6298651695251465, 4.774899482727051, 4.919933795928955, 5.064967632293701, 5.2100019454956055, 5.355035781860352, 5.500070095062256, 5.645103931427002, 5.790138244628906, 5.935172080993652]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 14.0, 19.0, 16.0, 16.0, 29.0, 30.0, 28.0, 37.0, 23.0, 40.0, 38.0, 41.0, 53.0, 33.0, 38.0, 45.0, 51.0, 46.0, 43.0, 46.0, 35.0, 33.0, 28.0, 29.0, 25.0, 29.0, 25.0, 17.0, 11.0, 16.0, 9.0, 6.0, 6.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9165393114089966, -1.8452924489974976, -1.7740455865859985, -1.7027987241744995, -1.6315518617630005, -1.5603049993515015, -1.4890581369400024, -1.4178112745285034, -1.3465644121170044, -1.2753175497055054, -1.2040706872940063, -1.1328238248825073, -1.0615769624710083, -0.9903301000595093, -0.9190832376480103, -0.8478363752365112, -0.7765895128250122, -0.7053426504135132, -0.6340957880020142, -0.5628489255905151, -0.4916020631790161, -0.4203552007675171, -0.34910833835601807, -0.27786147594451904, -0.20661461353302002, -0.135367751121521, -0.06412088871002197, 0.007125973701477051, 0.07837283611297607, 0.1496196985244751, 0.22086656093597412, 0.29211342334747314, 0.3633601665496826, 0.43460702896118164, 0.5058538913726807, 0.5771007537841797, 0.6483476161956787, 0.7195944786071777, 0.7908413410186768, 0.8620882034301758, 0.9333350658416748, 1.0045819282531738, 1.0758287906646729, 1.1470756530761719, 1.218322515487671, 1.28956937789917, 1.360816240310669, 1.432063102722168, 1.503309965133667, 1.574556827545166, 1.645803689956665, 1.717050552368164, 1.788297414779663, 1.859544277191162, 1.9307911396026611, 2.00203800201416, 2.073284864425659, 2.144531726837158, 2.2157785892486572, 2.2870254516601562, 2.3582723140716553, 2.4295191764831543, 2.5007660388946533, 2.5720129013061523, 2.6432597637176514]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 14.0, 16.0, 20.0, 28.0, 39.0, 59.0, 66.0, 79.0, 129.0, 180.0, 214.0, 296.0, 422.0, 618.0, 885.0, 1406.0, 2312.0, 3879.0, 6637.0, 11992.0, 23685.0, 47682.0, 98091.0, 186254.0, 254527.0, 195861.0, 104975.0, 51522.0, 25398.0, 13129.0, 6948.0, 4026.0, 2386.0, 1501.0, 923.0, 644.0, 457.0, 336.0, 221.0, 185.0, 120.0, 114.0, 56.0, 60.0, 40.0, 29.0, 31.0, 21.0, 9.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.5419921875, -0.5258369445800781, -0.5096817016601562, -0.4935264587402344, -0.4773712158203125, -0.4612159729003906, -0.44506072998046875, -0.4289054870605469, -0.412750244140625, -0.3965950012207031, -0.38043975830078125, -0.3642845153808594, -0.3481292724609375, -0.3319740295410156, -0.31581878662109375, -0.2996635437011719, -0.28350830078125, -0.2673530578613281, -0.25119781494140625, -0.23504257202148438, -0.2188873291015625, -0.20273208618164062, -0.18657684326171875, -0.17042160034179688, -0.154266357421875, -0.13811111450195312, -0.12195587158203125, -0.10580062866210938, -0.0896453857421875, -0.07349014282226562, -0.05733489990234375, -0.041179656982421875, -0.0250244140625, -0.008869171142578125, 0.00728607177734375, 0.023441314697265625, 0.0395965576171875, 0.055751800537109375, 0.07190704345703125, 0.08806228637695312, 0.104217529296875, 0.12037277221679688, 0.13652801513671875, 0.15268325805664062, 0.1688385009765625, 0.18499374389648438, 0.20114898681640625, 0.21730422973632812, 0.23345947265625, 0.24961471557617188, 0.26576995849609375, 0.2819252014160156, 0.2980804443359375, 0.3142356872558594, 0.33039093017578125, 0.3465461730957031, 0.362701416015625, 0.3788566589355469, 0.39501190185546875, 0.4111671447753906, 0.4273223876953125, 0.4434776306152344, 0.45963287353515625, 0.4757881164550781, 0.491943359375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 13.0, 15.0, 18.0, 10.0, 21.0, 23.0, 27.0, 40.0, 34.0, 35.0, 35.0, 44.0, 42.0, 46.0, 45.0, 52.0, 43.0, 46.0, 42.0, 37.0, 37.0, 29.0, 38.0, 38.0, 25.0, 21.0, 23.0, 21.0, 17.0, 15.0, 10.0, 7.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.348663330078125, -2.26568603515625, -2.182708740234375, -2.0997314453125, -2.016754150390625, -1.93377685546875, -1.850799560546875, -1.767822265625, -1.684844970703125, -1.60186767578125, -1.518890380859375, -1.4359130859375, -1.352935791015625, -1.26995849609375, -1.186981201171875, -1.10400390625, -1.021026611328125, -0.93804931640625, -0.855072021484375, -0.7720947265625, -0.689117431640625, -0.60614013671875, -0.523162841796875, -0.440185546875, -0.357208251953125, -0.27423095703125, -0.191253662109375, -0.1082763671875, -0.025299072265625, 0.05767822265625, 0.140655517578125, 0.2236328125, 0.306610107421875, 0.38958740234375, 0.472564697265625, 0.5555419921875, 0.638519287109375, 0.72149658203125, 0.804473876953125, 0.887451171875, 0.970428466796875, 1.05340576171875, 1.136383056640625, 1.2193603515625, 1.302337646484375, 1.38531494140625, 1.468292236328125, 1.55126953125, 1.634246826171875, 1.71722412109375, 1.800201416015625, 1.8831787109375, 1.966156005859375, 2.04913330078125, 2.132110595703125, 2.215087890625, 2.298065185546875, 2.38104248046875, 2.464019775390625, 2.5469970703125, 2.629974365234375, 2.71295166015625, 2.795928955078125, 2.87890625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 12.0, 16.0, 24.0, 22.0, 29.0, 62.0, 65.0, 116.0, 172.0, 218.0, 388.0, 608.0, 1143.0, 2225.0, 4933.0, 13626.0, 52366.0, 905642.0, 44735.0, 12511.0, 4720.0, 2129.0, 1059.0, 606.0, 347.0, 247.0, 141.0, 113.0, 64.0, 50.0, 43.0, 23.0, 22.0, 7.0, 15.0, 8.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0], "bins": [-1.7724609375, -1.719482421875, -1.66650390625, -1.613525390625, -1.560546875, -1.507568359375, -1.45458984375, -1.401611328125, -1.3486328125, -1.295654296875, -1.24267578125, -1.189697265625, -1.13671875, -1.083740234375, -1.03076171875, -0.977783203125, -0.9248046875, -0.871826171875, -0.81884765625, -0.765869140625, -0.712890625, -0.659912109375, -0.60693359375, -0.553955078125, -0.5009765625, -0.447998046875, -0.39501953125, -0.342041015625, -0.2890625, -0.236083984375, -0.18310546875, -0.130126953125, -0.0771484375, -0.024169921875, 0.02880859375, 0.081787109375, 0.134765625, 0.187744140625, 0.24072265625, 0.293701171875, 0.3466796875, 0.399658203125, 0.45263671875, 0.505615234375, 0.55859375, 0.611572265625, 0.66455078125, 0.717529296875, 0.7705078125, 0.823486328125, 0.87646484375, 0.929443359375, 0.982421875, 1.035400390625, 1.08837890625, 1.141357421875, 1.1943359375, 1.247314453125, 1.30029296875, 1.353271484375, 1.40625, 1.459228515625, 1.51220703125, 1.565185546875, 1.6181640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 8.0, 2.0, 6.0, 15.0, 10.0, 12.0, 14.0, 18.0, 27.0, 18.0, 31.0, 18.0, 35.0, 26.0, 42.0, 30.0, 36.0, 43.0, 49.0, 49.0, 36.0, 38.0, 41.0, 33.0, 47.0, 27.0, 43.0, 32.0, 22.0, 19.0, 29.0, 24.0, 20.0, 19.0, 14.0, 15.0, 8.0, 9.0, 15.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.599609375, -1.5498504638671875, -1.500091552734375, -1.4503326416015625, -1.40057373046875, -1.3508148193359375, -1.301055908203125, -1.2512969970703125, -1.2015380859375, -1.1517791748046875, -1.102020263671875, -1.0522613525390625, -1.00250244140625, -0.9527435302734375, -0.902984619140625, -0.8532257080078125, -0.803466796875, -0.7537078857421875, -0.703948974609375, -0.6541900634765625, -0.60443115234375, -0.5546722412109375, -0.504913330078125, -0.4551544189453125, -0.4053955078125, -0.3556365966796875, -0.305877685546875, -0.2561187744140625, -0.20635986328125, -0.1566009521484375, -0.106842041015625, -0.0570831298828125, -0.00732421875, 0.0424346923828125, 0.092193603515625, 0.1419525146484375, 0.19171142578125, 0.2414703369140625, 0.291229248046875, 0.3409881591796875, 0.3907470703125, 0.4405059814453125, 0.490264892578125, 0.5400238037109375, 0.58978271484375, 0.6395416259765625, 0.689300537109375, 0.7390594482421875, 0.788818359375, 0.8385772705078125, 0.888336181640625, 0.9380950927734375, 0.98785400390625, 1.0376129150390625, 1.087371826171875, 1.1371307373046875, 1.1868896484375, 1.2366485595703125, 1.286407470703125, 1.3361663818359375, 1.38592529296875, 1.4356842041015625, 1.485443115234375, 1.5352020263671875, 1.5849609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 13.0, 10.0, 17.0, 18.0, 25.0, 31.0, 41.0, 46.0, 58.0, 80.0, 108.0, 152.0, 179.0, 247.0, 354.0, 475.0, 742.0, 1176.0, 2197.0, 4414.0, 9417.0, 24542.0, 689032.0, 274530.0, 22142.0, 8808.0, 4041.0, 2069.0, 1163.0, 716.0, 464.0, 307.0, 211.0, 150.0, 99.0, 107.0, 95.0, 52.0, 35.0, 43.0, 22.0, 27.0, 16.0, 21.0, 14.0, 8.0, 12.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.4404296875, -0.4266471862792969, -0.41286468505859375, -0.3990821838378906, -0.3852996826171875, -0.3715171813964844, -0.35773468017578125, -0.3439521789550781, -0.330169677734375, -0.3163871765136719, -0.30260467529296875, -0.2888221740722656, -0.2750396728515625, -0.2612571716308594, -0.24747467041015625, -0.23369216918945312, -0.21990966796875, -0.20612716674804688, -0.19234466552734375, -0.17856216430664062, -0.1647796630859375, -0.15099716186523438, -0.13721466064453125, -0.12343215942382812, -0.109649658203125, -0.09586715698242188, -0.08208465576171875, -0.06830215454101562, -0.0545196533203125, -0.040737152099609375, -0.02695465087890625, -0.013172149658203125, 0.0006103515625, 0.014392852783203125, 0.02817535400390625, 0.041957855224609375, 0.0557403564453125, 0.06952285766601562, 0.08330535888671875, 0.09708786010742188, 0.110870361328125, 0.12465286254882812, 0.13843536376953125, 0.15221786499023438, 0.1660003662109375, 0.17978286743164062, 0.19356536865234375, 0.20734786987304688, 0.22113037109375, 0.23491287231445312, 0.24869537353515625, 0.2624778747558594, 0.2762603759765625, 0.2900428771972656, 0.30382537841796875, 0.3176078796386719, 0.331390380859375, 0.3451728820800781, 0.35895538330078125, 0.3727378845214844, 0.3865203857421875, 0.4003028869628906, 0.41408538818359375, 0.4278678894042969, 0.441650390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 6.0, 15.0, 14.0, 18.0, 28.0, 22.0, 46.0, 38.0, 45.0, 54.0, 52.0, 73.0, 72.0, 53.0, 76.0, 70.0, 61.0, 39.0, 43.0, 43.0, 27.0, 21.0, 12.0, 14.0, 12.0, 8.0, 9.0, 6.0, 0.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0590763092041016e-05, -3.9091333746910095e-05, -3.7591904401779175e-05, -3.6092475056648254e-05, -3.4593045711517334e-05, -3.3093616366386414e-05, -3.159418702125549e-05, -3.0094757676124573e-05, -2.8595328330993652e-05, -2.7095898985862732e-05, -2.559646964073181e-05, -2.409704029560089e-05, -2.259761095046997e-05, -2.109818160533905e-05, -1.959875226020813e-05, -1.809932291507721e-05, -1.659989356994629e-05, -1.5100464224815369e-05, -1.3601034879684448e-05, -1.2101605534553528e-05, -1.0602176189422607e-05, -9.102746844291687e-06, -7.603317499160767e-06, -6.103888154029846e-06, -4.604458808898926e-06, -3.1050294637680054e-06, -1.605600118637085e-06, -1.0617077350616455e-07, 1.3932585716247559e-06, 2.8926879167556763e-06, 4.392117261886597e-06, 5.891546607017517e-06, 7.3909759521484375e-06, 8.890405297279358e-06, 1.0389834642410278e-05, 1.1889263987541199e-05, 1.3388693332672119e-05, 1.488812267780304e-05, 1.638755202293396e-05, 1.788698136806488e-05, 1.93864107131958e-05, 2.088584005832672e-05, 2.238526940345764e-05, 2.3884698748588562e-05, 2.5384128093719482e-05, 2.6883557438850403e-05, 2.8382986783981323e-05, 2.9882416129112244e-05, 3.1381845474243164e-05, 3.2881274819374084e-05, 3.4380704164505005e-05, 3.5880133509635925e-05, 3.7379562854766846e-05, 3.8878992199897766e-05, 4.0378421545028687e-05, 4.187785089015961e-05, 4.337728023529053e-05, 4.487670958042145e-05, 4.637613892555237e-05, 4.787556827068329e-05, 4.937499761581421e-05, 5.087442696094513e-05, 5.237385630607605e-05, 5.387328565120697e-05, 5.537271499633789e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 7.0, 10.0, 24.0, 29.0, 42.0, 61.0, 116.0, 178.0, 306.0, 530.0, 976.0, 1740.0, 3001.0, 5905.0, 11581.0, 24480.0, 56927.0, 144132.0, 315218.0, 277357.0, 117032.0, 47187.0, 20606.0, 9945.0, 4983.0, 2687.0, 1460.0, 807.0, 494.0, 263.0, 145.0, 98.0, 64.0, 43.0, 23.0, 19.0, 15.0, 12.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1649169921875, -0.15990257263183594, -0.15488815307617188, -0.1498737335205078, -0.14485931396484375, -0.1398448944091797, -0.13483047485351562, -0.12981605529785156, -0.1248016357421875, -0.11978721618652344, -0.11477279663085938, -0.10975837707519531, -0.10474395751953125, -0.09972953796386719, -0.09471511840820312, -0.08970069885253906, -0.084686279296875, -0.07967185974121094, -0.07465744018554688, -0.06964302062988281, -0.06462860107421875, -0.05961418151855469, -0.054599761962890625, -0.04958534240722656, -0.0445709228515625, -0.03955650329589844, -0.034542083740234375, -0.029527664184570312, -0.02451324462890625, -0.019498825073242188, -0.014484405517578125, -0.009469985961914062, -0.00445556640625, 0.0005588531494140625, 0.005573272705078125, 0.010587692260742188, 0.01560211181640625, 0.020616531372070312, 0.025630950927734375, 0.030645370483398438, 0.0356597900390625, 0.04067420959472656, 0.045688629150390625, 0.05070304870605469, 0.05571746826171875, 0.06073188781738281, 0.06574630737304688, 0.07076072692871094, 0.075775146484375, 0.08078956604003906, 0.08580398559570312, 0.09081840515136719, 0.09583282470703125, 0.10084724426269531, 0.10586166381835938, 0.11087608337402344, 0.1158905029296875, 0.12090492248535156, 0.12591934204101562, 0.1309337615966797, 0.13594818115234375, 0.1409626007080078, 0.14597702026367188, 0.15099143981933594, 0.156005859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 16.0, 7.0, 11.0, 19.0, 26.0, 22.0, 37.0, 38.0, 52.0, 50.0, 75.0, 74.0, 80.0, 82.0, 57.0, 72.0, 52.0, 44.0, 34.0, 29.0, 25.0, 13.0, 11.0, 10.0, 13.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037933349609375, -0.036604881286621094, -0.03527641296386719, -0.03394794464111328, -0.032619476318359375, -0.03129100799560547, -0.029962539672851562, -0.028634071350097656, -0.02730560302734375, -0.025977134704589844, -0.024648666381835938, -0.02332019805908203, -0.021991729736328125, -0.02066326141357422, -0.019334793090820312, -0.018006324768066406, -0.0166778564453125, -0.015349388122558594, -0.014020919799804688, -0.012692451477050781, -0.011363983154296875, -0.010035514831542969, -0.008707046508789062, -0.007378578186035156, -0.00605010986328125, -0.004721641540527344, -0.0033931732177734375, -0.0020647048950195312, -0.000736236572265625, 0.0005922317504882812, 0.0019207000732421875, 0.0032491683959960938, 0.00457763671875, 0.005906105041503906, 0.0072345733642578125, 0.008563041687011719, 0.009891510009765625, 0.011219978332519531, 0.012548446655273438, 0.013876914978027344, 0.01520538330078125, 0.016533851623535156, 0.017862319946289062, 0.01919078826904297, 0.020519256591796875, 0.02184772491455078, 0.023176193237304688, 0.024504661560058594, 0.0258331298828125, 0.027161598205566406, 0.028490066528320312, 0.02981853485107422, 0.031147003173828125, 0.03247547149658203, 0.03380393981933594, 0.035132408142089844, 0.03646087646484375, 0.037789344787597656, 0.03911781311035156, 0.04044628143310547, 0.041774749755859375, 0.04310321807861328, 0.04443168640136719, 0.045760154724121094, 0.047088623046875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 7.0, 9.0, 8.0, 12.0, 14.0, 20.0, 26.0, 34.0, 44.0, 42.0, 44.0, 54.0, 72.0, 49.0, 91.0, 57.0, 68.0, 59.0, 55.0, 44.0, 36.0, 28.0, 24.0, 26.0, 15.0, 15.0, 10.0, 5.0, 11.0, 3.0, 2.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2583179473876953, -3.1144847869873047, -2.970651626586914, -2.8268184661865234, -2.682985544204712, -2.5391523838043213, -2.3953192234039307, -2.251486301422119, -2.1076531410217285, -1.963819980621338, -1.8199869394302368, -1.6761537790298462, -1.5323207378387451, -1.3884875774383545, -1.2446544170379639, -1.1008213758468628, -0.9569880962371826, -0.8131549954414368, -0.6693218946456909, -0.5254887342453003, -0.38165563344955444, -0.2378225326538086, -0.09398937225341797, 0.049843668937683105, 0.19367682933807373, 0.3375099301338196, 0.4813430607318878, 0.625176191329956, 0.7690092921257019, 0.9128423929214478, 1.0566755533218384, 1.2005085945129395, 1.34434175491333, 1.4881749153137207, 1.6320079565048218, 1.7758411169052124, 1.9196741580963135, 2.063507318496704, 2.2073404788970947, 2.3511734008789062, 2.495006561279297, 2.6388397216796875, 2.782672882080078, 2.9265060424804688, 3.0703389644622803, 3.214172124862671, 3.3580052852630615, 3.501838207244873, 3.6456716060638428, 3.7895047664642334, 3.933337926864624, 4.0771708488464355, 4.221004009246826, 4.364837169647217, 4.508670330047607, 4.652503490447998, 4.796336650848389, 4.940169811248779, 5.08400297164917, 5.2278361320495605, 5.371669292449951, 5.515501976013184, 5.659335136413574, 5.803168296813965, 5.9470014572143555]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 0.0, 5.0, 3.0, 3.0, 6.0, 9.0, 12.0, 17.0, 19.0, 14.0, 30.0, 33.0, 26.0, 37.0, 20.0, 45.0, 44.0, 36.0, 48.0, 37.0, 34.0, 53.0, 43.0, 44.0, 50.0, 45.0, 31.0, 33.0, 31.0, 29.0, 25.0, 26.0, 25.0, 17.0, 12.0, 15.0, 9.0, 6.0, 7.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8723468780517578, -1.8014521598815918, -1.7305575609207153, -1.6596628427505493, -1.5887682437896729, -1.5178735256195068, -1.4469788074493408, -1.3760842084884644, -1.305189609527588, -1.2342948913574219, -1.1634002923965454, -1.0925055742263794, -1.021610975265503, -0.9507162570953369, -0.8798215985298157, -0.8089269399642944, -0.7380322217941284, -0.6671375632286072, -0.5962429046630859, -0.5253481864929199, -0.45445355772972107, -0.38355889916419983, -0.3126642107963562, -0.24176955223083496, -0.17087489366531372, -0.09998022764921188, -0.029085561633110046, 0.04180911183357239, 0.11270377039909363, 0.18359842896461487, 0.2544931173324585, 0.32538777589797974, 0.396282434463501, 0.4671770930290222, 0.5380717515945435, 0.6089664697647095, 0.6798610687255859, 0.750755786895752, 0.8216504454612732, 0.8925451040267944, 0.9634397625923157, 1.034334421157837, 1.105229139328003, 1.1761237382888794, 1.2470184564590454, 1.3179130554199219, 1.388807773590088, 1.459702491760254, 1.5305970907211304, 1.6014918088912964, 1.6723864078521729, 1.7432811260223389, 1.8141757249832153, 1.8850704431533813, 1.9559650421142578, 2.026859760284424, 2.09775447845459, 2.168649196624756, 2.239543914794922, 2.310438394546509, 2.381333112716675, 2.452227830886841, 2.523122549057007, 2.5940170288085938, 2.6649117469787598]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 9.0, 11.0, 18.0, 29.0, 46.0, 80.0, 135.0, 152.0, 243.0, 368.0, 544.0, 781.0, 1198.0, 1843.0, 2801.0, 4347.0, 6658.0, 10642.0, 16859.0, 26331.0, 40831.0, 62197.0, 89107.0, 119286.0, 139780.0, 139628.0, 119168.0, 89375.0, 62131.0, 40817.0, 26163.0, 16846.0, 10651.0, 6846.0, 4386.0, 2808.0, 1831.0, 1201.0, 762.0, 545.0, 384.0, 236.0, 146.0, 107.0, 73.0, 53.0, 28.0, 25.0, 20.0, 10.0, 9.0, 0.0, 8.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.267578125, -2.19671630859375, -2.1258544921875, -2.05499267578125, -1.984130859375, -1.91326904296875, -1.8424072265625, -1.77154541015625, -1.70068359375, -1.62982177734375, -1.5589599609375, -1.48809814453125, -1.417236328125, -1.34637451171875, -1.2755126953125, -1.20465087890625, -1.1337890625, -1.06292724609375, -0.9920654296875, -0.92120361328125, -0.850341796875, -0.77947998046875, -0.7086181640625, -0.63775634765625, -0.56689453125, -0.49603271484375, -0.4251708984375, -0.35430908203125, -0.283447265625, -0.21258544921875, -0.1417236328125, -0.07086181640625, 0.0, 0.07086181640625, 0.1417236328125, 0.21258544921875, 0.283447265625, 0.35430908203125, 0.4251708984375, 0.49603271484375, 0.56689453125, 0.63775634765625, 0.7086181640625, 0.77947998046875, 0.850341796875, 0.92120361328125, 0.9920654296875, 1.06292724609375, 1.1337890625, 1.20465087890625, 1.2755126953125, 1.34637451171875, 1.417236328125, 1.48809814453125, 1.5589599609375, 1.62982177734375, 1.70068359375, 1.77154541015625, 1.8424072265625, 1.91326904296875, 1.984130859375, 2.05499267578125, 2.1258544921875, 2.19671630859375, 2.267578125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 14.0, 18.0, 14.0, 25.0, 32.0, 28.0, 37.0, 39.0, 41.0, 28.0, 43.0, 38.0, 44.0, 41.0, 36.0, 43.0, 50.0, 42.0, 41.0, 43.0, 35.0, 28.0, 38.0, 22.0, 13.0, 32.0, 20.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.638671875, -2.5579833984375, -2.477294921875, -2.3966064453125, -2.31591796875, -2.2352294921875, -2.154541015625, -2.0738525390625, -1.9931640625, -1.9124755859375, -1.831787109375, -1.7510986328125, -1.67041015625, -1.5897216796875, -1.509033203125, -1.4283447265625, -1.34765625, -1.2669677734375, -1.186279296875, -1.1055908203125, -1.02490234375, -0.9442138671875, -0.863525390625, -0.7828369140625, -0.7021484375, -0.6214599609375, -0.540771484375, -0.4600830078125, -0.37939453125, -0.2987060546875, -0.218017578125, -0.1373291015625, -0.056640625, 0.0240478515625, 0.104736328125, 0.1854248046875, 0.26611328125, 0.3468017578125, 0.427490234375, 0.5081787109375, 0.5888671875, 0.6695556640625, 0.750244140625, 0.8309326171875, 0.91162109375, 0.9923095703125, 1.072998046875, 1.1536865234375, 1.234375, 1.3150634765625, 1.395751953125, 1.4764404296875, 1.55712890625, 1.6378173828125, 1.718505859375, 1.7991943359375, 1.8798828125, 1.9605712890625, 2.041259765625, 2.1219482421875, 2.20263671875, 2.2833251953125, 2.364013671875, 2.4447021484375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 9.0, 7.0, 7.0, 10.0, 21.0, 31.0, 44.0, 49.0, 70.0, 112.0, 204.0, 315.0, 462.0, 722.0, 1159.0, 1797.0, 2922.0, 4496.0, 7597.0, 12275.0, 20201.0, 33183.0, 52551.0, 78899.0, 110832.0, 138860.0, 149269.0, 133426.0, 103732.0, 71641.0, 46834.0, 29523.0, 18213.0, 11049.0, 6710.0, 4189.0, 2593.0, 1588.0, 1065.0, 662.0, 422.0, 270.0, 181.0, 124.0, 72.0, 51.0, 46.0, 29.0, 13.0, 12.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.138671875, -2.065887451171875, -1.99310302734375, -1.920318603515625, -1.8475341796875, -1.774749755859375, -1.70196533203125, -1.629180908203125, -1.556396484375, -1.483612060546875, -1.41082763671875, -1.338043212890625, -1.2652587890625, -1.192474365234375, -1.11968994140625, -1.046905517578125, -0.97412109375, -0.901336669921875, -0.82855224609375, -0.755767822265625, -0.6829833984375, -0.610198974609375, -0.53741455078125, -0.464630126953125, -0.391845703125, -0.319061279296875, -0.24627685546875, -0.173492431640625, -0.1007080078125, -0.027923583984375, 0.04486083984375, 0.117645263671875, 0.1904296875, 0.263214111328125, 0.33599853515625, 0.408782958984375, 0.4815673828125, 0.554351806640625, 0.62713623046875, 0.699920654296875, 0.772705078125, 0.845489501953125, 0.91827392578125, 0.991058349609375, 1.0638427734375, 1.136627197265625, 1.20941162109375, 1.282196044921875, 1.35498046875, 1.427764892578125, 1.50054931640625, 1.573333740234375, 1.6461181640625, 1.718902587890625, 1.79168701171875, 1.864471435546875, 1.937255859375, 2.010040283203125, 2.08282470703125, 2.155609130859375, 2.2283935546875, 2.301177978515625, 2.37396240234375, 2.446746826171875, 2.51953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 6.0, 2.0, 7.0, 9.0, 21.0, 11.0, 17.0, 23.0, 15.0, 20.0, 25.0, 28.0, 27.0, 22.0, 42.0, 33.0, 42.0, 35.0, 39.0, 49.0, 33.0, 47.0, 39.0, 37.0, 39.0, 35.0, 28.0, 33.0, 35.0, 26.0, 27.0, 22.0, 13.0, 21.0, 14.0, 12.0, 9.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.5205078125, -1.47528076171875, -1.4300537109375, -1.38482666015625, -1.339599609375, -1.29437255859375, -1.2491455078125, -1.20391845703125, -1.15869140625, -1.11346435546875, -1.0682373046875, -1.02301025390625, -0.977783203125, -0.93255615234375, -0.8873291015625, -0.84210205078125, -0.796875, -0.75164794921875, -0.7064208984375, -0.66119384765625, -0.615966796875, -0.57073974609375, -0.5255126953125, -0.48028564453125, -0.43505859375, -0.38983154296875, -0.3446044921875, -0.29937744140625, -0.254150390625, -0.20892333984375, -0.1636962890625, -0.11846923828125, -0.0732421875, -0.02801513671875, 0.0172119140625, 0.06243896484375, 0.107666015625, 0.15289306640625, 0.1981201171875, 0.24334716796875, 0.28857421875, 0.33380126953125, 0.3790283203125, 0.42425537109375, 0.469482421875, 0.51470947265625, 0.5599365234375, 0.60516357421875, 0.650390625, 0.69561767578125, 0.7408447265625, 0.78607177734375, 0.831298828125, 0.87652587890625, 0.9217529296875, 0.96697998046875, 1.01220703125, 1.05743408203125, 1.1026611328125, 1.14788818359375, 1.193115234375, 1.23834228515625, 1.2835693359375, 1.32879638671875, 1.3740234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 16.0, 15.0, 33.0, 48.0, 85.0, 135.0, 190.0, 282.0, 479.0, 818.0, 1425.0, 2497.0, 4452.0, 8546.0, 17122.0, 34491.0, 70453.0, 136416.0, 218914.0, 232280.0, 154749.0, 82283.0, 40966.0, 19931.0, 9976.0, 5108.0, 2848.0, 1583.0, 935.0, 556.0, 336.0, 226.0, 119.0, 79.0, 45.0, 31.0, 35.0, 18.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.962890625, -1.897705078125, -1.83251953125, -1.767333984375, -1.7021484375, -1.636962890625, -1.57177734375, -1.506591796875, -1.44140625, -1.376220703125, -1.31103515625, -1.245849609375, -1.1806640625, -1.115478515625, -1.05029296875, -0.985107421875, -0.919921875, -0.854736328125, -0.78955078125, -0.724365234375, -0.6591796875, -0.593994140625, -0.52880859375, -0.463623046875, -0.3984375, -0.333251953125, -0.26806640625, -0.202880859375, -0.1376953125, -0.072509765625, -0.00732421875, 0.057861328125, 0.123046875, 0.188232421875, 0.25341796875, 0.318603515625, 0.3837890625, 0.448974609375, 0.51416015625, 0.579345703125, 0.64453125, 0.709716796875, 0.77490234375, 0.840087890625, 0.9052734375, 0.970458984375, 1.03564453125, 1.100830078125, 1.166015625, 1.231201171875, 1.29638671875, 1.361572265625, 1.4267578125, 1.491943359375, 1.55712890625, 1.622314453125, 1.6875, 1.752685546875, 1.81787109375, 1.883056640625, 1.9482421875, 2.013427734375, 2.07861328125, 2.143798828125, 2.208984375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 5.0, 12.0, 14.0, 20.0, 24.0, 33.0, 42.0, 46.0, 50.0, 69.0, 49.0, 76.0, 63.0, 61.0, 55.0, 62.0, 64.0, 44.0, 35.0, 34.0, 31.0, 16.0, 20.0, 10.0, 12.0, 10.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00016999244689941406, -0.00016469135880470276, -0.00015939027070999146, -0.00015408918261528015, -0.00014878809452056885, -0.00014348700642585754, -0.00013818591833114624, -0.00013288483023643494, -0.00012758374214172363, -0.00012228265404701233, -0.00011698156595230103, -0.00011168047785758972, -0.00010637938976287842, -0.00010107830166816711, -9.577721357345581e-05, -9.047612547874451e-05, -8.51750373840332e-05, -7.98739492893219e-05, -7.45728611946106e-05, -6.927177309989929e-05, -6.397068500518799e-05, -5.8669596910476685e-05, -5.336850881576538e-05, -4.806742072105408e-05, -4.2766332626342773e-05, -3.746524453163147e-05, -3.2164156436920166e-05, -2.6863068342208862e-05, -2.156198024749756e-05, -1.6260892152786255e-05, -1.0959804058074951e-05, -5.6587159633636475e-06, -3.5762786865234375e-07, 4.94346022605896e-06, 1.0244548320770264e-05, 1.5545636415481567e-05, 2.084672451019287e-05, 2.6147812604904175e-05, 3.144890069961548e-05, 3.674998879432678e-05, 4.2051076889038086e-05, 4.735216498374939e-05, 5.265325307846069e-05, 5.7954341173172e-05, 6.32554292678833e-05, 6.85565173625946e-05, 7.385760545730591e-05, 7.915869355201721e-05, 8.445978164672852e-05, 8.976086974143982e-05, 9.506195783615112e-05, 0.00010036304593086243, 0.00010566413402557373, 0.00011096522212028503, 0.00011626631021499634, 0.00012156739830970764, 0.00012686848640441895, 0.00013216957449913025, 0.00013747066259384155, 0.00014277175068855286, 0.00014807283878326416, 0.00015337392687797546, 0.00015867501497268677, 0.00016397610306739807, 0.00016927719116210938]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 10.0, 5.0, 8.0, 12.0, 24.0, 34.0, 40.0, 57.0, 81.0, 109.0, 217.0, 322.0, 523.0, 872.0, 1444.0, 2874.0, 5700.0, 12329.0, 27098.0, 61463.0, 130434.0, 228291.0, 254400.0, 167923.0, 83573.0, 37722.0, 16872.0, 7695.0, 3728.0, 1947.0, 1085.0, 576.0, 363.0, 204.0, 172.0, 115.0, 70.0, 44.0, 39.0, 30.0, 16.0, 11.0, 10.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.310546875, -2.24298095703125, -2.1754150390625, -2.10784912109375, -2.040283203125, -1.97271728515625, -1.9051513671875, -1.83758544921875, -1.77001953125, -1.70245361328125, -1.6348876953125, -1.56732177734375, -1.499755859375, -1.43218994140625, -1.3646240234375, -1.29705810546875, -1.2294921875, -1.16192626953125, -1.0943603515625, -1.02679443359375, -0.959228515625, -0.89166259765625, -0.8240966796875, -0.75653076171875, -0.68896484375, -0.62139892578125, -0.5538330078125, -0.48626708984375, -0.418701171875, -0.35113525390625, -0.2835693359375, -0.21600341796875, -0.1484375, -0.08087158203125, -0.0133056640625, 0.05426025390625, 0.121826171875, 0.18939208984375, 0.2569580078125, 0.32452392578125, 0.39208984375, 0.45965576171875, 0.5272216796875, 0.59478759765625, 0.662353515625, 0.72991943359375, 0.7974853515625, 0.86505126953125, 0.9326171875, 1.00018310546875, 1.0677490234375, 1.13531494140625, 1.202880859375, 1.27044677734375, 1.3380126953125, 1.40557861328125, 1.47314453125, 1.54071044921875, 1.6082763671875, 1.67584228515625, 1.743408203125, 1.81097412109375, 1.8785400390625, 1.94610595703125, 2.013671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 12.0, 6.0, 14.0, 5.0, 15.0, 19.0, 18.0, 34.0, 47.0, 50.0, 67.0, 80.0, 78.0, 85.0, 68.0, 63.0, 78.0, 54.0, 37.0, 39.0, 27.0, 20.0, 24.0, 15.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.48282623291015625, -0.4651641845703125, -0.44750213623046875, -0.429840087890625, -0.41217803955078125, -0.3945159912109375, -0.37685394287109375, -0.35919189453125, -0.34152984619140625, -0.3238677978515625, -0.30620574951171875, -0.288543701171875, -0.27088165283203125, -0.2532196044921875, -0.23555755615234375, -0.2178955078125, -0.20023345947265625, -0.1825714111328125, -0.16490936279296875, -0.147247314453125, -0.12958526611328125, -0.1119232177734375, -0.09426116943359375, -0.07659912109375, -0.05893707275390625, -0.0412750244140625, -0.02361297607421875, -0.005950927734375, 0.01171112060546875, 0.0293731689453125, 0.04703521728515625, 0.064697265625, 0.08235931396484375, 0.1000213623046875, 0.11768341064453125, 0.135345458984375, 0.15300750732421875, 0.1706695556640625, 0.18833160400390625, 0.20599365234375, 0.22365570068359375, 0.2413177490234375, 0.25897979736328125, 0.276641845703125, 0.29430389404296875, 0.3119659423828125, 0.32962799072265625, 0.3472900390625, 0.36495208740234375, 0.3826141357421875, 0.40027618408203125, 0.417938232421875, 0.43560028076171875, 0.4532623291015625, 0.47092437744140625, 0.48858642578125, 0.5062484741210938, 0.5239105224609375, 0.5415725708007812, 0.559234619140625, 0.5768966674804688, 0.5945587158203125, 0.6122207641601562, 0.6298828125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 6.0, 6.0, 8.0, 10.0, 25.0, 26.0, 27.0, 30.0, 42.0, 51.0, 36.0, 60.0, 62.0, 66.0, 83.0, 76.0, 68.0, 50.0, 48.0, 51.0, 31.0, 24.0, 29.0, 14.0, 20.0, 11.0, 6.0, 7.0, 6.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1759355068206787, -3.0269339084625244, -2.877932071685791, -2.7289304733276367, -2.5799286365509033, -2.430927038192749, -2.2819252014160156, -2.1329236030578613, -1.9839218854904175, -1.8349201679229736, -1.6859184503555298, -1.536916732788086, -1.3879151344299316, -1.2389132976531982, -1.089911699295044, -0.9409099817276001, -0.7919082641601562, -0.6429065465927124, -0.49390485882759094, -0.3449031710624695, -0.19590145349502563, -0.04689973592758179, 0.10210192203521729, 0.25110363960266113, 0.400105357170105, 0.5491070747375488, 0.6981087923049927, 0.8471104502677917, 0.9961121678352356, 1.1451139450073242, 1.2941155433654785, 1.4431172609329224, 1.592118740081787, 1.741120457649231, 1.8901221752166748, 2.039123773574829, 2.1881256103515625, 2.337127208709717, 2.486128807067871, 2.6351306438446045, 2.784132480621338, 2.933134078979492, 3.0821359157562256, 3.23113751411438, 3.3801393508911133, 3.5291409492492676, 3.678142547607422, 3.8271443843841553, 3.9761459827423096, 4.125147819519043, 4.274149417877197, 4.423151016235352, 4.572152614593506, 4.721154689788818, 4.870156288146973, 5.019157886505127, 5.168159484863281, 5.3171610832214355, 5.46616268157959, 5.615164756774902, 5.764166355133057, 5.913167953491211, 6.062169551849365, 6.2111711502075195, 6.360173225402832]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 7.0, 11.0, 9.0, 7.0, 13.0, 24.0, 21.0, 32.0, 35.0, 19.0, 31.0, 42.0, 33.0, 36.0, 40.0, 40.0, 34.0, 37.0, 48.0, 43.0, 33.0, 37.0, 28.0, 42.0, 34.0, 36.0, 22.0, 24.0, 25.0, 20.0, 19.0, 13.0, 23.0, 19.0, 14.0, 6.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1072566509246826, -2.0383243560791016, -1.96939218044281, -1.900459885597229, -1.8315277099609375, -1.7625954151153564, -1.6936631202697754, -1.6247308254241943, -1.5557986497879028, -1.4868663549423218, -1.4179341793060303, -1.3490018844604492, -1.2800695896148682, -1.2111374139785767, -1.1422051191329956, -1.073272943496704, -1.004340648651123, -0.9354084134101868, -0.8664761781692505, -0.7975438833236694, -0.7286116480827332, -0.6596794128417969, -0.5907471179962158, -0.5218148827552795, -0.45288264751434326, -0.383950412273407, -0.3150181472301483, -0.24608589708805084, -0.17715364694595337, -0.10822141170501709, -0.03928914666175842, 0.029643118381500244, 0.09857535362243652, 0.167507603764534, 0.23643985390663147, 0.30537211894989014, 0.3743043541908264, 0.4432365894317627, 0.5121688842773438, 0.58110111951828, 0.6500333547592163, 0.7189655900001526, 0.7878978252410889, 0.8568301200866699, 0.9257623553276062, 0.9946945905685425, 1.0636268854141235, 1.132559061050415, 1.201491355895996, 1.2704236507415771, 1.3393558263778687, 1.4082881212234497, 1.4772202968597412, 1.5461525917053223, 1.6150848865509033, 1.6840171813964844, 1.7529493570327759, 1.821881651878357, 1.8908138275146484, 1.9597461223602295, 2.0286784172058105, 2.0976104736328125, 2.1665427684783936, 2.2354750633239746, 2.3044073581695557]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 8.0, 3.0, 6.0, 5.0, 16.0, 18.0, 31.0, 25.0, 43.0, 68.0, 77.0, 119.0, 168.0, 223.0, 339.0, 495.0, 772.0, 1151.0, 1826.0, 2863.0, 4612.0, 7647.0, 12852.0, 22804.0, 41960.0, 81546.0, 167286.0, 372217.0, 809354.0, 1163699.0, 799715.0, 362097.0, 162759.0, 78841.0, 41532.0, 22924.0, 13196.0, 7871.0, 4791.0, 3019.0, 1889.0, 1172.0, 722.0, 508.0, 330.0, 221.0, 166.0, 108.0, 74.0, 45.0, 31.0, 12.0, 10.0, 12.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-4.2265625, -4.100341796875, -3.97412109375, -3.847900390625, -3.7216796875, -3.595458984375, -3.46923828125, -3.343017578125, -3.216796875, -3.090576171875, -2.96435546875, -2.838134765625, -2.7119140625, -2.585693359375, -2.45947265625, -2.333251953125, -2.20703125, -2.080810546875, -1.95458984375, -1.828369140625, -1.7021484375, -1.575927734375, -1.44970703125, -1.323486328125, -1.197265625, -1.071044921875, -0.94482421875, -0.818603515625, -0.6923828125, -0.566162109375, -0.43994140625, -0.313720703125, -0.1875, -0.061279296875, 0.06494140625, 0.191162109375, 0.3173828125, 0.443603515625, 0.56982421875, 0.696044921875, 0.822265625, 0.948486328125, 1.07470703125, 1.200927734375, 1.3271484375, 1.453369140625, 1.57958984375, 1.705810546875, 1.83203125, 1.958251953125, 2.08447265625, 2.210693359375, 2.3369140625, 2.463134765625, 2.58935546875, 2.715576171875, 2.841796875, 2.968017578125, 3.09423828125, 3.220458984375, 3.3466796875, 3.472900390625, 3.59912109375, 3.725341796875, 3.8515625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 11.0, 11.0, 10.0, 16.0, 20.0, 30.0, 20.0, 42.0, 29.0, 31.0, 31.0, 26.0, 45.0, 30.0, 47.0, 39.0, 33.0, 31.0, 29.0, 39.0, 32.0, 35.0, 45.0, 33.0, 26.0, 28.0, 27.0, 25.0, 22.0, 15.0, 12.0, 13.0, 11.0, 14.0, 10.0, 12.0, 4.0, 11.0, 7.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.6083984375, -1.5599517822265625, -1.511505126953125, -1.4630584716796875, -1.41461181640625, -1.3661651611328125, -1.317718505859375, -1.2692718505859375, -1.2208251953125, -1.1723785400390625, -1.123931884765625, -1.0754852294921875, -1.02703857421875, -0.9785919189453125, -0.930145263671875, -0.8816986083984375, -0.833251953125, -0.7848052978515625, -0.736358642578125, -0.6879119873046875, -0.63946533203125, -0.5910186767578125, -0.542572021484375, -0.4941253662109375, -0.4456787109375, -0.3972320556640625, -0.348785400390625, -0.3003387451171875, -0.25189208984375, -0.2034454345703125, -0.154998779296875, -0.1065521240234375, -0.05810546875, -0.0096588134765625, 0.038787841796875, 0.0872344970703125, 0.13568115234375, 0.1841278076171875, 0.232574462890625, 0.2810211181640625, 0.3294677734375, 0.3779144287109375, 0.426361083984375, 0.4748077392578125, 0.52325439453125, 0.5717010498046875, 0.620147705078125, 0.6685943603515625, 0.717041015625, 0.7654876708984375, 0.813934326171875, 0.8623809814453125, 0.91082763671875, 0.9592742919921875, 1.007720947265625, 1.0561676025390625, 1.1046142578125, 1.1530609130859375, 1.201507568359375, 1.2499542236328125, 1.29840087890625, 1.3468475341796875, 1.395294189453125, 1.4437408447265625, 1.4921875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 15.0, 29.0, 50.0, 64.0, 99.0, 185.0, 266.0, 455.0, 781.0, 1220.0, 2101.0, 3397.0, 5882.0, 10704.0, 19212.0, 36738.0, 70946.0, 148270.0, 320188.0, 685952.0, 1124935.0, 904769.0, 449266.0, 205279.0, 97639.0, 48815.0, 25193.0, 13506.0, 7581.0, 4274.0, 2447.0, 1529.0, 911.0, 554.0, 340.0, 249.0, 138.0, 113.0, 55.0, 29.0, 27.0, 23.0, 11.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.20233154296875, -4.0609130859375, -3.91949462890625, -3.778076171875, -3.63665771484375, -3.4952392578125, -3.35382080078125, -3.21240234375, -3.07098388671875, -2.9295654296875, -2.78814697265625, -2.646728515625, -2.50531005859375, -2.3638916015625, -2.22247314453125, -2.0810546875, -1.93963623046875, -1.7982177734375, -1.65679931640625, -1.515380859375, -1.37396240234375, -1.2325439453125, -1.09112548828125, -0.94970703125, -0.80828857421875, -0.6668701171875, -0.52545166015625, -0.384033203125, -0.24261474609375, -0.1011962890625, 0.04022216796875, 0.181640625, 0.32305908203125, 0.4644775390625, 0.60589599609375, 0.747314453125, 0.88873291015625, 1.0301513671875, 1.17156982421875, 1.31298828125, 1.45440673828125, 1.5958251953125, 1.73724365234375, 1.878662109375, 2.02008056640625, 2.1614990234375, 2.30291748046875, 2.4443359375, 2.58575439453125, 2.7271728515625, 2.86859130859375, 3.010009765625, 3.15142822265625, 3.2928466796875, 3.43426513671875, 3.57568359375, 3.71710205078125, 3.8585205078125, 3.99993896484375, 4.141357421875, 4.28277587890625, 4.4241943359375, 4.56561279296875, 4.70703125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 11.0, 15.0, 13.0, 22.0, 17.0, 29.0, 34.0, 51.0, 63.0, 68.0, 77.0, 114.0, 146.0, 152.0, 201.0, 230.0, 259.0, 244.0, 282.0, 281.0, 279.0, 244.0, 233.0, 212.0, 158.0, 150.0, 103.0, 69.0, 67.0, 56.0, 47.0, 34.0, 26.0, 21.0, 19.0, 13.0, 15.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.239715576171875, -1.20306396484375, -1.166412353515625, -1.1297607421875, -1.093109130859375, -1.05645751953125, -1.019805908203125, -0.983154296875, -0.946502685546875, -0.90985107421875, -0.873199462890625, -0.8365478515625, -0.799896240234375, -0.76324462890625, -0.726593017578125, -0.68994140625, -0.653289794921875, -0.61663818359375, -0.579986572265625, -0.5433349609375, -0.506683349609375, -0.47003173828125, -0.433380126953125, -0.396728515625, -0.360076904296875, -0.32342529296875, -0.286773681640625, -0.2501220703125, -0.213470458984375, -0.17681884765625, -0.140167236328125, -0.103515625, -0.066864013671875, -0.03021240234375, 0.006439208984375, 0.0430908203125, 0.079742431640625, 0.11639404296875, 0.153045654296875, 0.189697265625, 0.226348876953125, 0.26300048828125, 0.299652099609375, 0.3363037109375, 0.372955322265625, 0.40960693359375, 0.446258544921875, 0.48291015625, 0.519561767578125, 0.55621337890625, 0.592864990234375, 0.6295166015625, 0.666168212890625, 0.70281982421875, 0.739471435546875, 0.776123046875, 0.812774658203125, 0.84942626953125, 0.886077880859375, 0.9227294921875, 0.959381103515625, 0.99603271484375, 1.032684326171875, 1.0693359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 14.0, 16.0, 15.0, 27.0, 29.0, 30.0, 50.0, 47.0, 56.0, 55.0, 86.0, 78.0, 63.0, 66.0, 60.0, 64.0, 44.0, 40.0, 27.0, 21.0, 17.0, 16.0, 11.0, 12.0, 8.0, 11.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52296781539917, -4.3727850914001465, -4.222602844238281, -4.072420120239258, -3.9222373962402344, -3.772054672241211, -3.6218721866607666, -3.4716897010803223, -3.321506977081299, -3.1713242530822754, -3.021141767501831, -2.8709592819213867, -2.7207765579223633, -2.57059383392334, -2.4204113483428955, -2.270228862762451, -2.1200461387634277, -1.9698635339736938, -1.81968092918396, -1.669498324394226, -1.5193157196044922, -1.3691331148147583, -1.2189505100250244, -1.0687679052352905, -0.9185853004455566, -0.7684026956558228, -0.6182200908660889, -0.468037486076355, -0.3178548812866211, -0.1676722764968872, -0.01748967170715332, 0.13269293308258057, 0.28287506103515625, 0.43305766582489014, 0.583240270614624, 0.7334228754043579, 0.8836054801940918, 1.0337880849838257, 1.1839706897735596, 1.3341532945632935, 1.4843358993530273, 1.6345185041427612, 1.7847011089324951, 1.934883713722229, 2.085066318511963, 2.2352490425109863, 2.3854315280914307, 2.535614013671875, 2.6857967376708984, 2.835979461669922, 2.986161947250366, 3.1363444328308105, 3.286527156829834, 3.4367098808288574, 3.5868923664093018, 3.737074851989746, 3.8872575759887695, 4.037440299987793, 4.187623023986816, 4.337805271148682, 4.487987995147705, 4.6381707191467285, 4.788352966308594, 4.938535690307617, 5.088718414306641]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 11.0, 7.0, 16.0, 17.0, 17.0, 15.0, 23.0, 20.0, 26.0, 23.0, 32.0, 27.0, 36.0, 36.0, 25.0, 49.0, 36.0, 44.0, 40.0, 34.0, 27.0, 35.0, 41.0, 34.0, 36.0, 38.0, 24.0, 32.0, 20.0, 16.0, 22.0, 23.0, 20.0, 16.0, 8.0, 15.0, 9.0, 6.0, 6.0, 4.0, 10.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7342405319213867, -1.6759778261184692, -1.6177152395248413, -1.5594525337219238, -1.5011898279190063, -1.4429271221160889, -1.384664535522461, -1.3264018297195435, -1.268139123916626, -1.2098764181137085, -1.1516138315200806, -1.093351125717163, -1.0350884199142456, -0.9768257737159729, -0.9185631275177002, -0.8603004217147827, -0.8020378351211548, -0.7437751889228821, -0.6855124831199646, -0.6272498369216919, -0.5689871311187744, -0.5107244849205017, -0.452461838722229, -0.3941991627216339, -0.3359364867210388, -0.2776738107204437, -0.21941114962100983, -0.16114848852157593, -0.10288581252098083, -0.04462313652038574, 0.013639509677886963, 0.07190218567848206, 0.13016486167907715, 0.18842753767967224, 0.24669019877910614, 0.30495285987854004, 0.36321553587913513, 0.4214782118797302, 0.47974085807800293, 0.5380035638809204, 0.5962662100791931, 0.6545288562774658, 0.7127915620803833, 0.771054208278656, 0.8293168544769287, 0.8875795602798462, 0.9458422064781189, 1.0041048526763916, 1.062367558479309, 1.1206302642822266, 1.1788928508758545, 1.237155556678772, 1.2954182624816895, 1.3536808490753174, 1.4119435548782349, 1.4702062606811523, 1.5284688472747803, 1.5867315530776978, 1.6449941396713257, 1.7032568454742432, 1.7615195512771606, 1.8197822570800781, 1.878044843673706, 1.9363075494766235, 1.994570255279541]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 11.0, 14.0, 29.0, 39.0, 86.0, 164.0, 220.0, 390.0, 604.0, 1095.0, 1785.0, 3161.0, 6031.0, 10358.0, 19464.0, 36833.0, 68971.0, 124869.0, 194771.0, 218822.0, 159262.0, 93230.0, 49961.0, 26749.0, 13998.0, 7681.0, 4259.0, 2444.0, 1315.0, 747.0, 467.0, 295.0, 169.0, 93.0, 52.0, 38.0, 29.0, 9.0, 5.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.4033203125, -0.3921928405761719, -0.38106536865234375, -0.3699378967285156, -0.3588104248046875, -0.3476829528808594, -0.33655548095703125, -0.3254280090332031, -0.314300537109375, -0.3031730651855469, -0.29204559326171875, -0.2809181213378906, -0.2697906494140625, -0.2586631774902344, -0.24753570556640625, -0.23640823364257812, -0.22528076171875, -0.21415328979492188, -0.20302581787109375, -0.19189834594726562, -0.1807708740234375, -0.16964340209960938, -0.15851593017578125, -0.14738845825195312, -0.136260986328125, -0.12513351440429688, -0.11400604248046875, -0.10287857055664062, -0.0917510986328125, -0.08062362670898438, -0.06949615478515625, -0.058368682861328125, -0.0472412109375, -0.036113739013671875, -0.02498626708984375, -0.013858795166015625, -0.0027313232421875, 0.008396148681640625, 0.01952362060546875, 0.030651092529296875, 0.041778564453125, 0.052906036376953125, 0.06403350830078125, 0.07516098022460938, 0.0862884521484375, 0.09741592407226562, 0.10854339599609375, 0.11967086791992188, 0.13079833984375, 0.14192581176757812, 0.15305328369140625, 0.16418075561523438, 0.1753082275390625, 0.18643569946289062, 0.19756317138671875, 0.20869064331054688, 0.219818115234375, 0.23094558715820312, 0.24207305908203125, 0.2532005310058594, 0.2643280029296875, 0.2754554748535156, 0.28658294677734375, 0.2977104187011719, 0.308837890625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 6.0, 15.0, 9.0, 16.0, 12.0, 15.0, 34.0, 25.0, 26.0, 24.0, 29.0, 28.0, 27.0, 34.0, 34.0, 31.0, 30.0, 35.0, 35.0, 34.0, 41.0, 35.0, 27.0, 30.0, 27.0, 33.0, 23.0, 32.0, 21.0, 28.0, 21.0, 24.0, 21.0, 12.0, 23.0, 10.0, 9.0, 8.0, 12.0, 5.0, 6.0, 11.0, 4.0, 2.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8076171875, -1.7475433349609375, -1.687469482421875, -1.6273956298828125, -1.56732177734375, -1.5072479248046875, -1.447174072265625, -1.3871002197265625, -1.3270263671875, -1.2669525146484375, -1.206878662109375, -1.1468048095703125, -1.08673095703125, -1.0266571044921875, -0.966583251953125, -0.9065093994140625, -0.846435546875, -0.7863616943359375, -0.726287841796875, -0.6662139892578125, -0.60614013671875, -0.5460662841796875, -0.485992431640625, -0.4259185791015625, -0.3658447265625, -0.3057708740234375, -0.245697021484375, -0.1856231689453125, -0.12554931640625, -0.0654754638671875, -0.005401611328125, 0.0546722412109375, 0.11474609375, 0.1748199462890625, 0.234893798828125, 0.2949676513671875, 0.35504150390625, 0.4151153564453125, 0.475189208984375, 0.5352630615234375, 0.5953369140625, 0.6554107666015625, 0.715484619140625, 0.7755584716796875, 0.83563232421875, 0.8957061767578125, 0.955780029296875, 1.0158538818359375, 1.075927734375, 1.1360015869140625, 1.196075439453125, 1.2561492919921875, 1.31622314453125, 1.3762969970703125, 1.436370849609375, 1.4964447021484375, 1.5565185546875, 1.6165924072265625, 1.676666259765625, 1.7367401123046875, 1.79681396484375, 1.8568878173828125, 1.916961669921875, 1.9770355224609375, 2.037109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 13.0, 7.0, 10.0, 9.0, 23.0, 27.0, 35.0, 45.0, 62.0, 86.0, 107.0, 171.0, 212.0, 367.0, 511.0, 798.0, 1344.0, 2176.0, 4090.0, 7837.0, 17034.0, 45426.0, 817685.0, 104685.0, 23152.0, 10193.0, 5227.0, 2753.0, 1623.0, 908.0, 581.0, 401.0, 277.0, 177.0, 142.0, 94.0, 61.0, 55.0, 40.0, 30.0, 19.0, 14.0, 16.0, 11.0, 7.0, 1.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.8077774047851562, -0.7796173095703125, -0.7514572143554688, -0.723297119140625, -0.6951370239257812, -0.6669769287109375, -0.6388168334960938, -0.61065673828125, -0.5824966430664062, -0.5543365478515625, -0.5261764526367188, -0.498016357421875, -0.46985626220703125, -0.4416961669921875, -0.41353607177734375, -0.3853759765625, -0.35721588134765625, -0.3290557861328125, -0.30089569091796875, -0.272735595703125, -0.24457550048828125, -0.2164154052734375, -0.18825531005859375, -0.16009521484375, -0.13193511962890625, -0.1037750244140625, -0.07561492919921875, -0.047454833984375, -0.01929473876953125, 0.0088653564453125, 0.03702545166015625, 0.065185546875, 0.09334564208984375, 0.1215057373046875, 0.14966583251953125, 0.177825927734375, 0.20598602294921875, 0.2341461181640625, 0.26230621337890625, 0.29046630859375, 0.31862640380859375, 0.3467864990234375, 0.37494659423828125, 0.403106689453125, 0.43126678466796875, 0.4594268798828125, 0.48758697509765625, 0.5157470703125, 0.5439071655273438, 0.5720672607421875, 0.6002273559570312, 0.628387451171875, 0.6565475463867188, 0.6847076416015625, 0.7128677368164062, 0.74102783203125, 0.7691879272460938, 0.7973480224609375, 0.8255081176757812, 0.853668212890625, 0.8818283081054688, 0.9099884033203125, 0.9381484985351562, 0.96630859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 9.0, 14.0, 13.0, 14.0, 9.0, 12.0, 18.0, 28.0, 31.0, 23.0, 37.0, 38.0, 32.0, 36.0, 41.0, 36.0, 31.0, 38.0, 46.0, 41.0, 30.0, 33.0, 34.0, 37.0, 30.0, 31.0, 29.0, 18.0, 20.0, 22.0, 24.0, 12.0, 20.0, 12.0, 12.0, 10.0, 8.0, 8.0, 13.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2724609375, -1.230499267578125, -1.18853759765625, -1.146575927734375, -1.1046142578125, -1.062652587890625, -1.02069091796875, -0.978729248046875, -0.936767578125, -0.894805908203125, -0.85284423828125, -0.810882568359375, -0.7689208984375, -0.726959228515625, -0.68499755859375, -0.643035888671875, -0.60107421875, -0.559112548828125, -0.51715087890625, -0.475189208984375, -0.4332275390625, -0.391265869140625, -0.34930419921875, -0.307342529296875, -0.265380859375, -0.223419189453125, -0.18145751953125, -0.139495849609375, -0.0975341796875, -0.055572509765625, -0.01361083984375, 0.028350830078125, 0.0703125, 0.112274169921875, 0.15423583984375, 0.196197509765625, 0.2381591796875, 0.280120849609375, 0.32208251953125, 0.364044189453125, 0.406005859375, 0.447967529296875, 0.48992919921875, 0.531890869140625, 0.5738525390625, 0.615814208984375, 0.65777587890625, 0.699737548828125, 0.74169921875, 0.783660888671875, 0.82562255859375, 0.867584228515625, 0.9095458984375, 0.951507568359375, 0.99346923828125, 1.035430908203125, 1.077392578125, 1.119354248046875, 1.16131591796875, 1.203277587890625, 1.2452392578125, 1.287200927734375, 1.32916259765625, 1.371124267578125, 1.4130859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 15.0, 17.0, 19.0, 35.0, 38.0, 65.0, 96.0, 174.0, 268.0, 418.0, 637.0, 1136.0, 1815.0, 3097.0, 5285.0, 9482.0, 18389.0, 41509.0, 872844.0, 49095.0, 19737.0, 10362.0, 5755.0, 3300.0, 1882.0, 1185.0, 667.0, 465.0, 268.0, 182.0, 93.0, 69.0, 46.0, 41.0, 21.0, 20.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21637725830078125, -0.2097320556640625, -0.20308685302734375, -0.196441650390625, -0.18979644775390625, -0.1831512451171875, -0.17650604248046875, -0.16986083984375, -0.16321563720703125, -0.1565704345703125, -0.14992523193359375, -0.143280029296875, -0.13663482666015625, -0.1299896240234375, -0.12334442138671875, -0.11669921875, -0.11005401611328125, -0.1034088134765625, -0.09676361083984375, -0.090118408203125, -0.08347320556640625, -0.0768280029296875, -0.07018280029296875, -0.06353759765625, -0.05689239501953125, -0.0502471923828125, -0.04360198974609375, -0.036956787109375, -0.03031158447265625, -0.0236663818359375, -0.01702117919921875, -0.0103759765625, -0.00373077392578125, 0.0029144287109375, 0.00955963134765625, 0.016204833984375, 0.02285003662109375, 0.0294952392578125, 0.03614044189453125, 0.04278564453125, 0.04943084716796875, 0.0560760498046875, 0.06272125244140625, 0.069366455078125, 0.07601165771484375, 0.0826568603515625, 0.08930206298828125, 0.095947265625, 0.10259246826171875, 0.1092376708984375, 0.11588287353515625, 0.122528076171875, 0.12917327880859375, 0.1358184814453125, 0.14246368408203125, 0.14910888671875, 0.15575408935546875, 0.1623992919921875, 0.16904449462890625, 0.175689697265625, 0.18233489990234375, 0.1889801025390625, 0.19562530517578125, 0.2022705078125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 4.0, 9.0, 14.0, 23.0, 29.0, 28.0, 39.0, 49.0, 47.0, 64.0, 71.0, 82.0, 71.0, 65.0, 59.0, 63.0, 62.0, 42.0, 39.0, 31.0, 29.0, 15.0, 13.0, 5.0, 9.0, 2.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.7637691497802734e-05, -5.59687614440918e-05, -5.429983139038086e-05, -5.263090133666992e-05, -5.0961971282958984e-05, -4.929304122924805e-05, -4.762411117553711e-05, -4.595518112182617e-05, -4.4286251068115234e-05, -4.26173210144043e-05, -4.094839096069336e-05, -3.927946090698242e-05, -3.7610530853271484e-05, -3.594160079956055e-05, -3.427267074584961e-05, -3.260374069213867e-05, -3.0934810638427734e-05, -2.9265880584716797e-05, -2.759695053100586e-05, -2.5928020477294922e-05, -2.4259090423583984e-05, -2.2590160369873047e-05, -2.092123031616211e-05, -1.9252300262451172e-05, -1.7583370208740234e-05, -1.5914440155029297e-05, -1.424551010131836e-05, -1.2576580047607422e-05, -1.0907649993896484e-05, -9.238719940185547e-06, -7.569789886474609e-06, -5.900859832763672e-06, -4.231929779052734e-06, -2.562999725341797e-06, -8.940696716308594e-07, 7.748603820800781e-07, 2.4437904357910156e-06, 4.112720489501953e-06, 5.781650543212891e-06, 7.450580596923828e-06, 9.119510650634766e-06, 1.0788440704345703e-05, 1.245737075805664e-05, 1.4126300811767578e-05, 1.5795230865478516e-05, 1.7464160919189453e-05, 1.913309097290039e-05, 2.0802021026611328e-05, 2.2470951080322266e-05, 2.4139881134033203e-05, 2.580881118774414e-05, 2.7477741241455078e-05, 2.9146671295166016e-05, 3.081560134887695e-05, 3.248453140258789e-05, 3.415346145629883e-05, 3.5822391510009766e-05, 3.74913215637207e-05, 3.916025161743164e-05, 4.082918167114258e-05, 4.2498111724853516e-05, 4.416704177856445e-05, 4.583597183227539e-05, 4.750490188598633e-05, 4.9173831939697266e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 11.0, 13.0, 16.0, 30.0, 50.0, 59.0, 97.0, 153.0, 254.0, 354.0, 548.0, 887.0, 1365.0, 2205.0, 3612.0, 5744.0, 9350.0, 15719.0, 26414.0, 44122.0, 76052.0, 125850.0, 182444.0, 193555.0, 142334.0, 88334.0, 52021.0, 30322.0, 18254.0, 10655.0, 6620.0, 4070.0, 2552.0, 1611.0, 1051.0, 635.0, 443.0, 251.0, 169.0, 117.0, 67.0, 49.0, 38.0, 15.0, 19.0, 9.0, 4.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.07196044921875, -0.06985282897949219, -0.06774520874023438, -0.06563758850097656, -0.06352996826171875, -0.06142234802246094, -0.059314727783203125, -0.05720710754394531, -0.0550994873046875, -0.05299186706542969, -0.050884246826171875, -0.04877662658691406, -0.04666900634765625, -0.04456138610839844, -0.042453765869140625, -0.04034614562988281, -0.038238525390625, -0.03613090515136719, -0.034023284912109375, -0.03191566467285156, -0.02980804443359375, -0.027700424194335938, -0.025592803955078125, -0.023485183715820312, -0.0213775634765625, -0.019269943237304688, -0.017162322998046875, -0.015054702758789062, -0.01294708251953125, -0.010839462280273438, -0.008731842041015625, -0.0066242218017578125, -0.0045166015625, -0.0024089813232421875, -0.000301361083984375, 0.0018062591552734375, 0.00391387939453125, 0.0060214996337890625, 0.008129119873046875, 0.010236740112304688, 0.0123443603515625, 0.014451980590820312, 0.016559600830078125, 0.018667221069335938, 0.02077484130859375, 0.022882461547851562, 0.024990081787109375, 0.027097702026367188, 0.029205322265625, 0.03131294250488281, 0.033420562744140625, 0.03552818298339844, 0.03763580322265625, 0.03974342346191406, 0.041851043701171875, 0.04395866394042969, 0.0460662841796875, 0.04817390441894531, 0.050281524658203125, 0.05238914489746094, 0.05449676513671875, 0.05660438537597656, 0.058712005615234375, 0.06081962585449219, 0.06292724609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 1.0, 10.0, 5.0, 9.0, 9.0, 9.0, 8.0, 14.0, 16.0, 19.0, 16.0, 22.0, 32.0, 26.0, 34.0, 44.0, 40.0, 57.0, 29.0, 47.0, 56.0, 52.0, 48.0, 51.0, 58.0, 41.0, 47.0, 27.0, 26.0, 27.0, 23.0, 13.0, 16.0, 14.0, 6.0, 9.0, 8.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.017547607421875, -0.017049312591552734, -0.01655101776123047, -0.016052722930908203, -0.015554428100585938, -0.015056133270263672, -0.014557838439941406, -0.01405954360961914, -0.013561248779296875, -0.01306295394897461, -0.012564659118652344, -0.012066364288330078, -0.011568069458007812, -0.011069774627685547, -0.010571479797363281, -0.010073184967041016, -0.00957489013671875, -0.009076595306396484, -0.008578300476074219, -0.008080005645751953, -0.0075817108154296875, -0.007083415985107422, -0.006585121154785156, -0.006086826324462891, -0.005588531494140625, -0.005090236663818359, -0.004591941833496094, -0.004093647003173828, -0.0035953521728515625, -0.003097057342529297, -0.0025987625122070312, -0.0021004676818847656, -0.0016021728515625, -0.0011038780212402344, -0.0006055831909179688, -0.00010728836059570312, 0.0003910064697265625, 0.0008893013000488281, 0.0013875961303710938, 0.0018858909606933594, 0.002384185791015625, 0.0028824806213378906, 0.0033807754516601562, 0.003879070281982422, 0.0043773651123046875, 0.004875659942626953, 0.005373954772949219, 0.005872249603271484, 0.00637054443359375, 0.006868839263916016, 0.007367134094238281, 0.007865428924560547, 0.008363723754882812, 0.008862018585205078, 0.009360313415527344, 0.00985860824584961, 0.010356903076171875, 0.01085519790649414, 0.011353492736816406, 0.011851787567138672, 0.012350082397460938, 0.012848377227783203, 0.013346672058105469, 0.013844966888427734, 0.01434326171875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 13.0, 19.0, 13.0, 26.0, 28.0, 30.0, 39.0, 63.0, 47.0, 54.0, 86.0, 82.0, 57.0, 67.0, 57.0, 68.0, 50.0, 38.0, 29.0, 21.0, 17.0, 16.0, 14.0, 10.0, 9.0, 11.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.529380798339844, -4.3796868324279785, -4.229992866516113, -4.080298900604248, -3.930605173110962, -3.7809112071990967, -3.6312174797058105, -3.4815235137939453, -3.33182954788208, -3.182135581970215, -3.0324416160583496, -2.8827478885650635, -2.7330539226531982, -2.583359956741333, -2.433666229248047, -2.2839722633361816, -2.1342782974243164, -1.9845843315124512, -1.8348904848098755, -1.6851966381072998, -1.5355026721954346, -1.3858087062835693, -1.2361148595809937, -1.086421012878418, -0.9367270469665527, -0.7870331406593323, -0.6373392343521118, -0.48764532804489136, -0.3379514217376709, -0.18825751543045044, -0.03856360912322998, 0.1111302375793457, 0.26082468032836914, 0.4105185866355896, 0.5602124929428101, 0.7099063992500305, 0.859600305557251, 1.0092942714691162, 1.158988118171692, 1.3086819648742676, 1.4583759307861328, 1.608069896697998, 1.7577637434005737, 1.9074575901031494, 2.0571515560150146, 2.20684552192688, 2.356539249420166, 2.5062332153320312, 2.6559271812438965, 2.8056211471557617, 2.955315113067627, 3.105008840560913, 3.2547028064727783, 3.4043967723846436, 3.5540904998779297, 3.703784465789795, 3.85347843170166, 4.003172397613525, 4.152866363525391, 4.302560329437256, 4.452254295349121, 4.601947784423828, 4.751641750335693, 4.901335716247559, 5.051029682159424]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 12.0, 5.0, 16.0, 19.0, 14.0, 17.0, 23.0, 21.0, 25.0, 25.0, 30.0, 26.0, 38.0, 33.0, 28.0, 46.0, 38.0, 43.0, 42.0, 33.0, 26.0, 41.0, 33.0, 33.0, 41.0, 35.0, 27.0, 31.0, 20.0, 16.0, 21.0, 25.0, 19.0, 16.0, 8.0, 15.0, 9.0, 6.0, 6.0, 4.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7494254112243652, -1.6914043426513672, -1.6333832740783691, -1.575362205505371, -1.517341136932373, -1.459320068359375, -1.401298999786377, -1.343277931213379, -1.2852568626403809, -1.2272357940673828, -1.1692147254943848, -1.1111936569213867, -1.0531725883483887, -0.9951515197753906, -0.9371304512023926, -0.8791093826293945, -0.8210883140563965, -0.7630672454833984, -0.7050461769104004, -0.6470251083374023, -0.5890040397644043, -0.5309829711914062, -0.4729619026184082, -0.41494083404541016, -0.3569197654724121, -0.29889869689941406, -0.24087762832641602, -0.18285655975341797, -0.12483549118041992, -0.06681442260742188, -0.008793354034423828, 0.04922771453857422, 0.10724878311157227, 0.1652698516845703, 0.22329092025756836, 0.2813119888305664, 0.33933305740356445, 0.3973541259765625, 0.45537519454956055, 0.5133962631225586, 0.5714173316955566, 0.6294384002685547, 0.6874594688415527, 0.7454805374145508, 0.8035016059875488, 0.8615226745605469, 0.9195437431335449, 0.977564811706543, 1.035585880279541, 1.093606948852539, 1.151628017425537, 1.2096490859985352, 1.2676701545715332, 1.3256912231445312, 1.3837122917175293, 1.4417333602905273, 1.4997544288635254, 1.5577754974365234, 1.6157965660095215, 1.6738176345825195, 1.7318387031555176, 1.7898597717285156, 1.8478808403015137, 1.9059019088745117, 1.9639229774475098]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 13.0, 12.0, 27.0, 38.0, 57.0, 97.0, 163.0, 211.0, 317.0, 554.0, 809.0, 1272.0, 2022.0, 3350.0, 5101.0, 8424.0, 13640.0, 22573.0, 36626.0, 58771.0, 90041.0, 124956.0, 151061.0, 151670.0, 127535.0, 91557.0, 59864.0, 37578.0, 23229.0, 14002.0, 8603.0, 5253.0, 3255.0, 2146.0, 1289.0, 845.0, 549.0, 372.0, 221.0, 155.0, 93.0, 65.0, 51.0, 32.0, 15.0, 10.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.455078125, -2.37841796875, -2.3017578125, -2.22509765625, -2.1484375, -2.07177734375, -1.9951171875, -1.91845703125, -1.841796875, -1.76513671875, -1.6884765625, -1.61181640625, -1.53515625, -1.45849609375, -1.3818359375, -1.30517578125, -1.228515625, -1.15185546875, -1.0751953125, -0.99853515625, -0.921875, -0.84521484375, -0.7685546875, -0.69189453125, -0.615234375, -0.53857421875, -0.4619140625, -0.38525390625, -0.30859375, -0.23193359375, -0.1552734375, -0.07861328125, -0.001953125, 0.07470703125, 0.1513671875, 0.22802734375, 0.3046875, 0.38134765625, 0.4580078125, 0.53466796875, 0.611328125, 0.68798828125, 0.7646484375, 0.84130859375, 0.91796875, 0.99462890625, 1.0712890625, 1.14794921875, 1.224609375, 1.30126953125, 1.3779296875, 1.45458984375, 1.53125, 1.60791015625, 1.6845703125, 1.76123046875, 1.837890625, 1.91455078125, 1.9912109375, 2.06787109375, 2.14453125, 2.22119140625, 2.2978515625, 2.37451171875, 2.451171875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 11.0, 14.0, 18.0, 25.0, 18.0, 22.0, 32.0, 29.0, 27.0, 37.0, 34.0, 23.0, 38.0, 38.0, 51.0, 44.0, 44.0, 40.0, 36.0, 35.0, 36.0, 35.0, 28.0, 29.0, 28.0, 28.0, 25.0, 24.0, 19.0, 14.0, 8.0, 11.0, 15.0, 11.0, 2.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.955596923828125, -1.88775634765625, -1.819915771484375, -1.7520751953125, -1.684234619140625, -1.61639404296875, -1.548553466796875, -1.480712890625, -1.412872314453125, -1.34503173828125, -1.277191162109375, -1.2093505859375, -1.141510009765625, -1.07366943359375, -1.005828857421875, -0.93798828125, -0.870147705078125, -0.80230712890625, -0.734466552734375, -0.6666259765625, -0.598785400390625, -0.53094482421875, -0.463104248046875, -0.395263671875, -0.327423095703125, -0.25958251953125, -0.191741943359375, -0.1239013671875, -0.056060791015625, 0.01177978515625, 0.079620361328125, 0.1474609375, 0.215301513671875, 0.28314208984375, 0.350982666015625, 0.4188232421875, 0.486663818359375, 0.55450439453125, 0.622344970703125, 0.690185546875, 0.758026123046875, 0.82586669921875, 0.893707275390625, 0.9615478515625, 1.029388427734375, 1.09722900390625, 1.165069580078125, 1.23291015625, 1.300750732421875, 1.36859130859375, 1.436431884765625, 1.5042724609375, 1.572113037109375, 1.63995361328125, 1.707794189453125, 1.775634765625, 1.843475341796875, 1.91131591796875, 1.979156494140625, 2.0469970703125, 2.114837646484375, 2.18267822265625, 2.250518798828125, 2.318359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 17.0, 19.0, 41.0, 50.0, 76.0, 105.0, 177.0, 287.0, 352.0, 568.0, 844.0, 1387.0, 2294.0, 3789.0, 6142.0, 10569.0, 17988.0, 30935.0, 52496.0, 83792.0, 123336.0, 157414.0, 165512.0, 137665.0, 98118.0, 62314.0, 37769.0, 22045.0, 12906.0, 7640.0, 4486.0, 2709.0, 1716.0, 1047.0, 666.0, 424.0, 265.0, 201.0, 135.0, 85.0, 44.0, 45.0, 17.0, 18.0, 14.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.527587890625, -2.44384765625, -2.360107421875, -2.2763671875, -2.192626953125, -2.10888671875, -2.025146484375, -1.94140625, -1.857666015625, -1.77392578125, -1.690185546875, -1.6064453125, -1.522705078125, -1.43896484375, -1.355224609375, -1.271484375, -1.187744140625, -1.10400390625, -1.020263671875, -0.9365234375, -0.852783203125, -0.76904296875, -0.685302734375, -0.6015625, -0.517822265625, -0.43408203125, -0.350341796875, -0.2666015625, -0.182861328125, -0.09912109375, -0.015380859375, 0.068359375, 0.152099609375, 0.23583984375, 0.319580078125, 0.4033203125, 0.487060546875, 0.57080078125, 0.654541015625, 0.73828125, 0.822021484375, 0.90576171875, 0.989501953125, 1.0732421875, 1.156982421875, 1.24072265625, 1.324462890625, 1.408203125, 1.491943359375, 1.57568359375, 1.659423828125, 1.7431640625, 1.826904296875, 1.91064453125, 1.994384765625, 2.078125, 2.161865234375, 2.24560546875, 2.329345703125, 2.4130859375, 2.496826171875, 2.58056640625, 2.664306640625, 2.748046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 6.0, 7.0, 5.0, 9.0, 15.0, 15.0, 5.0, 12.0, 16.0, 19.0, 27.0, 23.0, 24.0, 37.0, 25.0, 30.0, 40.0, 32.0, 36.0, 38.0, 36.0, 52.0, 44.0, 36.0, 47.0, 43.0, 35.0, 38.0, 27.0, 20.0, 24.0, 28.0, 29.0, 14.0, 12.0, 19.0, 7.0, 12.0, 7.0, 8.0, 13.0, 5.0, 2.0, 7.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.13092041015625, -1.0899658203125, -1.04901123046875, -1.008056640625, -0.96710205078125, -0.9261474609375, -0.88519287109375, -0.84423828125, -0.80328369140625, -0.7623291015625, -0.72137451171875, -0.680419921875, -0.63946533203125, -0.5985107421875, -0.55755615234375, -0.5166015625, -0.47564697265625, -0.4346923828125, -0.39373779296875, -0.352783203125, -0.31182861328125, -0.2708740234375, -0.22991943359375, -0.18896484375, -0.14801025390625, -0.1070556640625, -0.06610107421875, -0.025146484375, 0.01580810546875, 0.0567626953125, 0.09771728515625, 0.138671875, 0.17962646484375, 0.2205810546875, 0.26153564453125, 0.302490234375, 0.34344482421875, 0.3843994140625, 0.42535400390625, 0.46630859375, 0.50726318359375, 0.5482177734375, 0.58917236328125, 0.630126953125, 0.67108154296875, 0.7120361328125, 0.75299072265625, 0.7939453125, 0.83489990234375, 0.8758544921875, 0.91680908203125, 0.957763671875, 0.99871826171875, 1.0396728515625, 1.08062744140625, 1.12158203125, 1.16253662109375, 1.2034912109375, 1.24444580078125, 1.285400390625, 1.32635498046875, 1.3673095703125, 1.40826416015625, 1.44921875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 12.0, 17.0, 17.0, 36.0, 48.0, 66.0, 123.0, 205.0, 307.0, 504.0, 829.0, 1428.0, 2382.0, 4214.0, 7388.0, 13151.0, 23990.0, 42627.0, 75139.0, 124603.0, 177281.0, 191828.0, 152613.0, 98457.0, 57875.0, 32195.0, 17738.0, 10187.0, 5525.0, 3166.0, 1889.0, 1059.0, 661.0, 383.0, 232.0, 132.0, 91.0, 63.0, 36.0, 32.0, 14.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4732513427734375, -1.421112060546875, -1.3689727783203125, -1.31683349609375, -1.2646942138671875, -1.212554931640625, -1.1604156494140625, -1.1082763671875, -1.0561370849609375, -1.003997802734375, -0.9518585205078125, -0.89971923828125, -0.8475799560546875, -0.795440673828125, -0.7433013916015625, -0.691162109375, -0.6390228271484375, -0.586883544921875, -0.5347442626953125, -0.48260498046875, -0.4304656982421875, -0.378326416015625, -0.3261871337890625, -0.2740478515625, -0.2219085693359375, -0.169769287109375, -0.1176300048828125, -0.06549072265625, -0.0133514404296875, 0.038787841796875, 0.0909271240234375, 0.14306640625, 0.1952056884765625, 0.247344970703125, 0.2994842529296875, 0.35162353515625, 0.4037628173828125, 0.455902099609375, 0.5080413818359375, 0.5601806640625, 0.6123199462890625, 0.664459228515625, 0.7165985107421875, 0.76873779296875, 0.8208770751953125, 0.873016357421875, 0.9251556396484375, 0.977294921875, 1.0294342041015625, 1.081573486328125, 1.1337127685546875, 1.18585205078125, 1.2379913330078125, 1.290130615234375, 1.3422698974609375, 1.3944091796875, 1.4465484619140625, 1.498687744140625, 1.5508270263671875, 1.60296630859375, 1.6551055908203125, 1.707244873046875, 1.7593841552734375, 1.8115234375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 6.0, 9.0, 17.0, 17.0, 28.0, 40.0, 45.0, 52.0, 75.0, 106.0, 101.0, 101.0, 90.0, 76.0, 66.0, 37.0, 43.0, 18.0, 27.0, 13.0, 15.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019490718841552734, -0.00018788687884807587, -0.0001808665692806244, -0.0001738462597131729, -0.00016682595014572144, -0.00015980564057826996, -0.00015278533101081848, -0.000145765021443367, -0.00013874471187591553, -0.00013172440230846405, -0.00012470409274101257, -0.0001176837831735611, -0.00011066347360610962, -0.00010364316403865814, -9.662285447120667e-05, -8.960254490375519e-05, -8.258223533630371e-05, -7.556192576885223e-05, -6.854161620140076e-05, -6.152130663394928e-05, -5.45009970664978e-05, -4.7480687499046326e-05, -4.046037793159485e-05, -3.344006836414337e-05, -2.6419758796691895e-05, -1.9399449229240417e-05, -1.237913966178894e-05, -5.358830094337463e-06, 1.6614794731140137e-06, 8.68178904056549e-06, 1.5702098608016968e-05, 2.2722408175468445e-05, 2.9742717742919922e-05, 3.67630273103714e-05, 4.3783336877822876e-05, 5.080364644527435e-05, 5.782395601272583e-05, 6.484426558017731e-05, 7.186457514762878e-05, 7.888488471508026e-05, 8.590519428253174e-05, 9.292550384998322e-05, 9.994581341743469e-05, 0.00010696612298488617, 0.00011398643255233765, 0.00012100674211978912, 0.0001280270516872406, 0.00013504736125469208, 0.00014206767082214355, 0.00014908798038959503, 0.0001561082899570465, 0.00016312859952449799, 0.00017014890909194946, 0.00017716921865940094, 0.00018418952822685242, 0.0001912098377943039, 0.00019823014736175537, 0.00020525045692920685, 0.00021227076649665833, 0.0002192910760641098, 0.00022631138563156128, 0.00023333169519901276, 0.00024035200476646423, 0.0002473723143339157, 0.0002543926239013672]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 5.0, 13.0, 16.0, 19.0, 38.0, 43.0, 58.0, 124.0, 151.0, 239.0, 352.0, 537.0, 829.0, 1228.0, 1876.0, 2971.0, 4544.0, 7138.0, 11260.0, 17251.0, 27439.0, 42794.0, 65154.0, 94782.0, 127091.0, 147868.0, 142009.0, 115157.0, 82496.0, 55309.0, 36010.0, 22997.0, 14392.0, 9351.0, 6029.0, 3758.0, 2494.0, 1615.0, 1050.0, 699.0, 462.0, 313.0, 183.0, 146.0, 83.0, 52.0, 49.0, 20.0, 15.0, 12.0, 11.0, 6.0, 9.0, 6.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.177734375, -1.1407012939453125, -1.103668212890625, -1.0666351318359375, -1.02960205078125, -0.9925689697265625, -0.955535888671875, -0.9185028076171875, -0.8814697265625, -0.8444366455078125, -0.807403564453125, -0.7703704833984375, -0.73333740234375, -0.6963043212890625, -0.659271240234375, -0.6222381591796875, -0.585205078125, -0.5481719970703125, -0.511138916015625, -0.4741058349609375, -0.43707275390625, -0.4000396728515625, -0.363006591796875, -0.3259735107421875, -0.2889404296875, -0.2519073486328125, -0.214874267578125, -0.1778411865234375, -0.14080810546875, -0.1037750244140625, -0.066741943359375, -0.0297088623046875, 0.00732421875, 0.0443572998046875, 0.081390380859375, 0.1184234619140625, 0.15545654296875, 0.1924896240234375, 0.229522705078125, 0.2665557861328125, 0.3035888671875, 0.3406219482421875, 0.377655029296875, 0.4146881103515625, 0.45172119140625, 0.4887542724609375, 0.525787353515625, 0.5628204345703125, 0.599853515625, 0.6368865966796875, 0.673919677734375, 0.7109527587890625, 0.74798583984375, 0.7850189208984375, 0.822052001953125, 0.8590850830078125, 0.8961181640625, 0.9331512451171875, 0.970184326171875, 1.0072174072265625, 1.04425048828125, 1.0812835693359375, 1.118316650390625, 1.1553497314453125, 1.1923828125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 4.0, 5.0, 10.0, 12.0, 20.0, 16.0, 18.0, 22.0, 23.0, 35.0, 38.0, 41.0, 41.0, 39.0, 48.0, 63.0, 48.0, 49.0, 36.0, 52.0, 42.0, 28.0, 41.0, 34.0, 31.0, 26.0, 24.0, 26.0, 22.0, 13.0, 15.0, 9.0, 8.0, 12.0, 11.0, 1.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.2984199523925781, -0.28775787353515625, -0.2770957946777344, -0.2664337158203125, -0.2557716369628906, -0.24510955810546875, -0.23444747924804688, -0.223785400390625, -0.21312332153320312, -0.20246124267578125, -0.19179916381835938, -0.1811370849609375, -0.17047500610351562, -0.15981292724609375, -0.14915084838867188, -0.13848876953125, -0.12782669067382812, -0.11716461181640625, -0.10650253295898438, -0.0958404541015625, -0.08517837524414062, -0.07451629638671875, -0.06385421752929688, -0.053192138671875, -0.042530059814453125, -0.03186798095703125, -0.021205902099609375, -0.0105438232421875, 0.000118255615234375, 0.01078033447265625, 0.021442413330078125, 0.0321044921875, 0.042766571044921875, 0.05342864990234375, 0.06409072875976562, 0.0747528076171875, 0.08541488647460938, 0.09607696533203125, 0.10673904418945312, 0.117401123046875, 0.12806320190429688, 0.13872528076171875, 0.14938735961914062, 0.1600494384765625, 0.17071151733398438, 0.18137359619140625, 0.19203567504882812, 0.20269775390625, 0.21335983276367188, 0.22402191162109375, 0.23468399047851562, 0.2453460693359375, 0.2560081481933594, 0.26667022705078125, 0.2773323059082031, 0.287994384765625, 0.2986564636230469, 0.30931854248046875, 0.3199806213378906, 0.3306427001953125, 0.3413047790527344, 0.35196685791015625, 0.3626289367675781, 0.373291015625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 15.0, 12.0, 17.0, 15.0, 14.0, 30.0, 39.0, 53.0, 56.0, 61.0, 63.0, 66.0, 76.0, 63.0, 77.0, 54.0, 56.0, 47.0, 37.0, 22.0, 17.0, 23.0, 16.0, 14.0, 9.0, 10.0, 3.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.714277267456055, -4.566986083984375, -4.419694900512695, -4.272403717041016, -4.125112533569336, -3.9778213500976562, -3.8305299282073975, -3.6832387447357178, -3.535947561264038, -3.3886563777923584, -3.2413651943206787, -3.094074010848999, -2.9467825889587402, -2.7994914054870605, -2.652200222015381, -2.504909038543701, -2.3576178550720215, -2.210326671600342, -2.063035488128662, -1.9157441854476929, -1.7684530019760132, -1.6211618185043335, -1.4738705158233643, -1.3265793323516846, -1.1792881488800049, -1.0319969654083252, -0.8847057223320007, -0.7374144792556763, -0.5901232957839966, -0.4428321123123169, -0.29554086923599243, -0.14824962615966797, -0.0009589195251464844, 0.1463322937488556, 0.29362350702285767, 0.44091472029685974, 0.5882059335708618, 0.7354971170425415, 0.882788360118866, 1.0300796031951904, 1.1773707866668701, 1.3246619701385498, 1.4719531536102295, 1.6192444562911987, 1.7665356397628784, 1.913826823234558, 2.0611181259155273, 2.208409309387207, 2.3557004928588867, 2.5029916763305664, 2.650282859802246, 2.797574043273926, 2.9448652267456055, 3.092156410217285, 3.239447832107544, 3.3867390155792236, 3.5340301990509033, 3.681321382522583, 3.8286125659942627, 3.9759037494659424, 4.123195171356201, 4.270486354827881, 4.4177775382995605, 4.56506872177124, 4.71235990524292]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 3.0, 3.0, 4.0, 1.0, 8.0, 8.0, 9.0, 9.0, 11.0, 20.0, 15.0, 10.0, 19.0, 19.0, 24.0, 31.0, 26.0, 25.0, 36.0, 30.0, 28.0, 37.0, 44.0, 50.0, 38.0, 35.0, 38.0, 32.0, 29.0, 24.0, 28.0, 36.0, 25.0, 34.0, 30.0, 26.0, 19.0, 22.0, 24.0, 11.0, 8.0, 10.0, 14.0, 10.0, 7.0, 7.0, 9.0, 3.0, 7.0, 5.0, 0.0, 3.0, 2.0, 6.0, 0.0, 1.0, 2.0], "bins": [-1.959781289100647, -1.899973750114441, -1.8401663303375244, -1.7803587913513184, -1.7205513715744019, -1.6607438325881958, -1.6009364128112793, -1.5411288738250732, -1.4813213348388672, -1.4215137958526611, -1.3617063760757446, -1.3018988370895386, -1.242091417312622, -1.182283878326416, -1.12247633934021, -1.0626689195632935, -1.002861499786377, -0.9430540204048157, -0.8832465410232544, -0.8234390020370483, -0.7636315822601318, -0.7038240432739258, -0.6440165638923645, -0.5842090845108032, -0.5244016051292419, -0.46459412574768066, -0.4047866463661194, -0.3449791371822357, -0.28517165780067444, -0.22536417841911316, -0.1655566692352295, -0.10574918985366821, -0.045941710472106934, 0.013865776360034943, 0.07367326319217682, 0.1334807574748993, 0.19328823685646057, 0.25309571623802185, 0.3129032254219055, 0.3727107048034668, 0.4325181841850281, 0.49232566356658936, 0.5521331429481506, 0.6119406223297119, 0.671748161315918, 0.7315555810928345, 0.7913631200790405, 0.8511705994606018, 0.9109780788421631, 0.9707855582237244, 1.0305930376052856, 1.0904005765914917, 1.1502079963684082, 1.2100155353546143, 1.2698230743408203, 1.3296304941177368, 1.3894379138946533, 1.4492454528808594, 1.5090528726577759, 1.568860411643982, 1.6286678314208984, 1.6884753704071045, 1.7482829093933105, 1.808090329170227, 1.867897868156433]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 9.0, 8.0, 13.0, 24.0, 31.0, 45.0, 81.0, 96.0, 135.0, 206.0, 328.0, 492.0, 762.0, 1116.0, 1753.0, 2804.0, 4488.0, 7367.0, 11936.0, 20540.0, 36259.0, 67500.0, 133005.0, 278507.0, 600425.0, 1037957.0, 969389.0, 520258.0, 242263.0, 117210.0, 60344.0, 32393.0, 18549.0, 10894.0, 6470.0, 3895.0, 2428.0, 1514.0, 1015.0, 598.0, 393.0, 281.0, 179.0, 118.0, 79.0, 44.0, 30.0, 25.0, 13.0, 9.0, 7.0, 5.0, 2.0, 1.0], "bins": [-4.3046875, -4.184783935546875, -4.06488037109375, -3.944976806640625, -3.8250732421875, -3.705169677734375, -3.58526611328125, -3.465362548828125, -3.345458984375, -3.225555419921875, -3.10565185546875, -2.985748291015625, -2.8658447265625, -2.745941162109375, -2.62603759765625, -2.506134033203125, -2.38623046875, -2.266326904296875, -2.14642333984375, -2.026519775390625, -1.9066162109375, -1.786712646484375, -1.66680908203125, -1.546905517578125, -1.427001953125, -1.307098388671875, -1.18719482421875, -1.067291259765625, -0.9473876953125, -0.827484130859375, -0.70758056640625, -0.587677001953125, -0.4677734375, -0.347869873046875, -0.22796630859375, -0.108062744140625, 0.0118408203125, 0.131744384765625, 0.25164794921875, 0.371551513671875, 0.491455078125, 0.611358642578125, 0.73126220703125, 0.851165771484375, 0.9710693359375, 1.090972900390625, 1.21087646484375, 1.330780029296875, 1.45068359375, 1.570587158203125, 1.69049072265625, 1.810394287109375, 1.9302978515625, 2.050201416015625, 2.17010498046875, 2.290008544921875, 2.409912109375, 2.529815673828125, 2.64971923828125, 2.769622802734375, 2.8895263671875, 3.009429931640625, 3.12933349609375, 3.249237060546875, 3.369140625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 14.0, 10.0, 10.0, 10.0, 18.0, 20.0, 20.0, 21.0, 24.0, 31.0, 20.0, 47.0, 35.0, 36.0, 38.0, 31.0, 41.0, 38.0, 47.0, 39.0, 42.0, 48.0, 36.0, 48.0, 28.0, 38.0, 34.0, 29.0, 12.0, 24.0, 7.0, 17.0, 10.0, 19.0, 10.0, 13.0, 6.0, 5.0, 6.0, 1.0, 6.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.87890625, -1.8269805908203125, -1.775054931640625, -1.7231292724609375, -1.67120361328125, -1.6192779541015625, -1.567352294921875, -1.5154266357421875, -1.4635009765625, -1.4115753173828125, -1.359649658203125, -1.3077239990234375, -1.25579833984375, -1.2038726806640625, -1.151947021484375, -1.1000213623046875, -1.048095703125, -0.9961700439453125, -0.944244384765625, -0.8923187255859375, -0.84039306640625, -0.7884674072265625, -0.736541748046875, -0.6846160888671875, -0.6326904296875, -0.5807647705078125, -0.528839111328125, -0.4769134521484375, -0.42498779296875, -0.3730621337890625, -0.321136474609375, -0.2692108154296875, -0.21728515625, -0.1653594970703125, -0.113433837890625, -0.0615081787109375, -0.00958251953125, 0.0423431396484375, 0.094268798828125, 0.1461944580078125, 0.1981201171875, 0.2500457763671875, 0.301971435546875, 0.3538970947265625, 0.40582275390625, 0.4577484130859375, 0.509674072265625, 0.5615997314453125, 0.613525390625, 0.6654510498046875, 0.717376708984375, 0.7693023681640625, 0.82122802734375, 0.8731536865234375, 0.925079345703125, 0.9770050048828125, 1.0289306640625, 1.0808563232421875, 1.132781982421875, 1.1847076416015625, 1.23663330078125, 1.2885589599609375, 1.340484619140625, 1.3924102783203125, 1.4443359375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 8.0, 18.0, 27.0, 45.0, 59.0, 87.0, 145.0, 225.0, 361.0, 564.0, 861.0, 1291.0, 2038.0, 3275.0, 5463.0, 8708.0, 14303.0, 23790.0, 40590.0, 69876.0, 124796.0, 226503.0, 414431.0, 707492.0, 906769.0, 708604.0, 413161.0, 225275.0, 124499.0, 70042.0, 40275.0, 23608.0, 14370.0, 8596.0, 5232.0, 3268.0, 2005.0, 1304.0, 830.0, 520.0, 321.0, 233.0, 120.0, 98.0, 66.0, 50.0, 24.0, 19.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.484375, -3.373748779296875, -3.26312255859375, -3.152496337890625, -3.0418701171875, -2.931243896484375, -2.82061767578125, -2.709991455078125, -2.599365234375, -2.488739013671875, -2.37811279296875, -2.267486572265625, -2.1568603515625, -2.046234130859375, -1.93560791015625, -1.824981689453125, -1.71435546875, -1.603729248046875, -1.49310302734375, -1.382476806640625, -1.2718505859375, -1.161224365234375, -1.05059814453125, -0.939971923828125, -0.829345703125, -0.718719482421875, -0.60809326171875, -0.497467041015625, -0.3868408203125, -0.276214599609375, -0.16558837890625, -0.054962158203125, 0.0556640625, 0.166290283203125, 0.27691650390625, 0.387542724609375, 0.4981689453125, 0.608795166015625, 0.71942138671875, 0.830047607421875, 0.940673828125, 1.051300048828125, 1.16192626953125, 1.272552490234375, 1.3831787109375, 1.493804931640625, 1.60443115234375, 1.715057373046875, 1.82568359375, 1.936309814453125, 2.04693603515625, 2.157562255859375, 2.2681884765625, 2.378814697265625, 2.48944091796875, 2.600067138671875, 2.710693359375, 2.821319580078125, 2.93194580078125, 3.042572021484375, 3.1531982421875, 3.263824462890625, 3.37445068359375, 3.485076904296875, 3.595703125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 12.0, 8.0, 14.0, 21.0, 25.0, 39.0, 30.0, 48.0, 45.0, 60.0, 71.0, 86.0, 99.0, 98.0, 136.0, 139.0, 166.0, 185.0, 198.0, 223.0, 236.0, 217.0, 206.0, 216.0, 205.0, 155.0, 182.0, 130.0, 126.0, 124.0, 98.0, 77.0, 69.0, 68.0, 45.0, 38.0, 37.0, 27.0, 21.0, 14.0, 13.0, 14.0, 8.0, 7.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8623046875, -0.8345413208007812, -0.8067779541015625, -0.7790145874023438, -0.751251220703125, -0.7234878540039062, -0.6957244873046875, -0.6679611206054688, -0.64019775390625, -0.6124343872070312, -0.5846710205078125, -0.5569076538085938, -0.529144287109375, -0.5013809204101562, -0.4736175537109375, -0.44585418701171875, -0.4180908203125, -0.39032745361328125, -0.3625640869140625, -0.33480072021484375, -0.307037353515625, -0.27927398681640625, -0.2515106201171875, -0.22374725341796875, -0.19598388671875, -0.16822052001953125, -0.1404571533203125, -0.11269378662109375, -0.084930419921875, -0.05716705322265625, -0.0294036865234375, -0.00164031982421875, 0.026123046875, 0.05388641357421875, 0.0816497802734375, 0.10941314697265625, 0.137176513671875, 0.16493988037109375, 0.1927032470703125, 0.22046661376953125, 0.24822998046875, 0.27599334716796875, 0.3037567138671875, 0.33152008056640625, 0.359283447265625, 0.38704681396484375, 0.4148101806640625, 0.44257354736328125, 0.4703369140625, 0.49810028076171875, 0.5258636474609375, 0.5536270141601562, 0.581390380859375, 0.6091537475585938, 0.6369171142578125, 0.6646804809570312, 0.69244384765625, 0.7202072143554688, 0.7479705810546875, 0.7757339477539062, 0.803497314453125, 0.8312606811523438, 0.8590240478515625, 0.8867874145507812, 0.91455078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 9.0, 4.0, 6.0, 4.0, 6.0, 13.0, 13.0, 20.0, 27.0, 26.0, 34.0, 52.0, 60.0, 64.0, 67.0, 66.0, 64.0, 71.0, 64.0, 58.0, 60.0, 34.0, 27.0, 28.0, 30.0, 16.0, 20.0, 10.0, 6.0, 7.0, 7.0, 7.0, 6.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.285930633544922, -4.141051292419434, -3.996171712875366, -3.851292133331299, -3.7064127922058105, -3.561533212661743, -3.416653633117676, -3.2717742919921875, -3.12689471244812, -2.9820151329040527, -2.8371357917785645, -2.692256212234497, -2.5473766326904297, -2.4024972915649414, -2.257617712020874, -2.1127381324768066, -1.9678587913513184, -1.8229793310165405, -1.6780998706817627, -1.5332202911376953, -1.3883408308029175, -1.2434613704681396, -1.0985817909240723, -0.9537023305892944, -0.8088228702545166, -0.6639434099197388, -0.5190638899803162, -0.37418439984321594, -0.22930490970611572, -0.08442544937133789, 0.06045407056808472, 0.20533359050750732, 0.35021352767944336, 0.4950930178165436, 0.6399725079536438, 0.7848520278930664, 0.9297314882278442, 1.074610948562622, 1.2194905281066895, 1.3643699884414673, 1.5092494487762451, 1.654128909111023, 1.7990083694458008, 1.9438879489898682, 2.0887675285339355, 2.233646869659424, 2.378526449203491, 2.5234060287475586, 2.668285369873047, 2.8131649494171143, 2.9580442905426025, 3.10292387008667, 3.247803211212158, 3.3926827907562256, 3.537562370300293, 3.6824417114257812, 3.8273212909698486, 3.972200870513916, 4.117080211639404, 4.261959552764893, 4.406839370727539, 4.551718711853027, 4.696598052978516, 4.841477870941162, 4.98635721206665]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 10.0, 13.0, 12.0, 11.0, 12.0, 11.0, 15.0, 21.0, 25.0, 17.0, 23.0, 26.0, 24.0, 31.0, 36.0, 32.0, 37.0, 29.0, 25.0, 37.0, 52.0, 44.0, 32.0, 37.0, 38.0, 40.0, 34.0, 36.0, 33.0, 26.0, 22.0, 23.0, 18.0, 26.0, 13.0, 18.0, 12.0, 8.0, 7.0, 7.0, 7.0, 5.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7316498756408691, -1.6734554767608643, -1.6152609586715698, -1.557066559791565, -1.4988720417022705, -1.4406776428222656, -1.3824831247329712, -1.3242887258529663, -1.2660942077636719, -1.207899808883667, -1.1497052907943726, -1.0915108919143677, -1.0333163738250732, -0.9751219749450684, -0.9169274568557739, -0.858733057975769, -0.8005385994911194, -0.7423441410064697, -0.6841496825218201, -0.6259552240371704, -0.5677607655525208, -0.5095663070678711, -0.4513718783855438, -0.39317741990089417, -0.3349829614162445, -0.27678850293159485, -0.2185940444469452, -0.16039960086345673, -0.10220514237880707, -0.044010698795318604, 0.014183759689331055, 0.07237821817398071, 0.13057267665863037, 0.18876713514328003, 0.2469615936279297, 0.30515605211257935, 0.363350510597229, 0.4215449392795563, 0.47973939776420593, 0.5379338264465332, 0.5961283445358276, 0.6543228030204773, 0.712517261505127, 0.7707117199897766, 0.8289061784744263, 0.8871005773544312, 0.9452950954437256, 1.0034894943237305, 1.0616838932037354, 1.1198782920837402, 1.1780728101730347, 1.2362672090530396, 1.294461727142334, 1.3526561260223389, 1.4108506441116333, 1.4690450429916382, 1.5272395610809326, 1.5854339599609375, 1.643628478050232, 1.7018228769302368, 1.7600173950195312, 1.8182117938995361, 1.8764063119888306, 1.9346007108688354, 1.9927952289581299]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 18.0, 15.0, 23.0, 38.0, 75.0, 123.0, 150.0, 253.0, 431.0, 660.0, 1107.0, 1918.0, 3246.0, 6093.0, 11105.0, 20615.0, 39160.0, 73818.0, 134500.0, 211318.0, 220414.0, 147458.0, 81425.0, 43648.0, 23108.0, 12175.0, 6649.0, 3775.0, 1994.0, 1231.0, 764.0, 483.0, 260.0, 176.0, 113.0, 56.0, 46.0, 33.0, 20.0, 15.0, 12.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.32568359375, -0.3155326843261719, -0.30538177490234375, -0.2952308654785156, -0.2850799560546875, -0.2749290466308594, -0.26477813720703125, -0.2546272277832031, -0.244476318359375, -0.23432540893554688, -0.22417449951171875, -0.21402359008789062, -0.2038726806640625, -0.19372177124023438, -0.18357086181640625, -0.17341995239257812, -0.16326904296875, -0.15311813354492188, -0.14296722412109375, -0.13281631469726562, -0.1226654052734375, -0.11251449584960938, -0.10236358642578125, -0.09221267700195312, -0.082061767578125, -0.07191085815429688, -0.06175994873046875, -0.051609039306640625, -0.0414581298828125, -0.031307220458984375, -0.02115631103515625, -0.011005401611328125, -0.0008544921875, 0.009296417236328125, 0.01944732666015625, 0.029598236083984375, 0.0397491455078125, 0.049900054931640625, 0.06005096435546875, 0.07020187377929688, 0.080352783203125, 0.09050369262695312, 0.10065460205078125, 0.11080551147460938, 0.1209564208984375, 0.13110733032226562, 0.14125823974609375, 0.15140914916992188, 0.16156005859375, 0.17171096801757812, 0.18186187744140625, 0.19201278686523438, 0.2021636962890625, 0.21231460571289062, 0.22246551513671875, 0.23261642456054688, 0.242767333984375, 0.2529182434082031, 0.26306915283203125, 0.2732200622558594, 0.2833709716796875, 0.2935218811035156, 0.30367279052734375, 0.3138236999511719, 0.323974609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 17.0, 5.0, 13.0, 9.0, 11.0, 20.0, 22.0, 19.0, 23.0, 30.0, 34.0, 33.0, 30.0, 18.0, 32.0, 33.0, 48.0, 48.0, 42.0, 51.0, 53.0, 37.0, 42.0, 41.0, 41.0, 39.0, 29.0, 32.0, 18.0, 12.0, 20.0, 17.0, 12.0, 15.0, 6.0, 12.0, 7.0, 7.0, 8.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.25, -2.1741943359375, -2.098388671875, -2.0225830078125, -1.94677734375, -1.8709716796875, -1.795166015625, -1.7193603515625, -1.6435546875, -1.5677490234375, -1.491943359375, -1.4161376953125, -1.34033203125, -1.2645263671875, -1.188720703125, -1.1129150390625, -1.037109375, -0.9613037109375, -0.885498046875, -0.8096923828125, -0.73388671875, -0.6580810546875, -0.582275390625, -0.5064697265625, -0.4306640625, -0.3548583984375, -0.279052734375, -0.2032470703125, -0.12744140625, -0.0516357421875, 0.024169921875, 0.0999755859375, 0.17578125, 0.2515869140625, 0.327392578125, 0.4031982421875, 0.47900390625, 0.5548095703125, 0.630615234375, 0.7064208984375, 0.7822265625, 0.8580322265625, 0.933837890625, 1.0096435546875, 1.08544921875, 1.1612548828125, 1.237060546875, 1.3128662109375, 1.388671875, 1.4644775390625, 1.540283203125, 1.6160888671875, 1.69189453125, 1.7677001953125, 1.843505859375, 1.9193115234375, 1.9951171875, 2.0709228515625, 2.146728515625, 2.2225341796875, 2.29833984375, 2.3741455078125, 2.449951171875, 2.5257568359375, 2.6015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 10.0, 9.0, 9.0, 13.0, 24.0, 39.0, 49.0, 61.0, 70.0, 110.0, 151.0, 201.0, 363.0, 497.0, 749.0, 1258.0, 2142.0, 3781.0, 7894.0, 17018.0, 47203.0, 830002.0, 93310.0, 22229.0, 9632.0, 4901.0, 2628.0, 1528.0, 882.0, 560.0, 390.0, 235.0, 169.0, 111.0, 82.0, 63.0, 36.0, 34.0, 24.0, 20.0, 22.0, 11.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.8016128540039062, -0.7736358642578125, -0.7456588745117188, -0.717681884765625, -0.6897048950195312, -0.6617279052734375, -0.6337509155273438, -0.60577392578125, -0.5777969360351562, -0.5498199462890625, -0.5218429565429688, -0.493865966796875, -0.46588897705078125, -0.4379119873046875, -0.40993499755859375, -0.3819580078125, -0.35398101806640625, -0.3260040283203125, -0.29802703857421875, -0.270050048828125, -0.24207305908203125, -0.2140960693359375, -0.18611907958984375, -0.15814208984375, -0.13016510009765625, -0.1021881103515625, -0.07421112060546875, -0.046234130859375, -0.01825714111328125, 0.0097198486328125, 0.03769683837890625, 0.065673828125, 0.09365081787109375, 0.1216278076171875, 0.14960479736328125, 0.177581787109375, 0.20555877685546875, 0.2335357666015625, 0.26151275634765625, 0.28948974609375, 0.31746673583984375, 0.3454437255859375, 0.37342071533203125, 0.401397705078125, 0.42937469482421875, 0.4573516845703125, 0.48532867431640625, 0.5133056640625, 0.5412826538085938, 0.5692596435546875, 0.5972366333007812, 0.625213623046875, 0.6531906127929688, 0.6811676025390625, 0.7091445922851562, 0.73712158203125, 0.7650985717773438, 0.7930755615234375, 0.8210525512695312, 0.849029541015625, 0.8770065307617188, 0.9049835205078125, 0.9329605102539062, 0.9609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 5.0, 10.0, 11.0, 12.0, 13.0, 13.0, 17.0, 30.0, 29.0, 16.0, 27.0, 30.0, 32.0, 30.0, 30.0, 37.0, 38.0, 34.0, 34.0, 41.0, 42.0, 48.0, 38.0, 36.0, 34.0, 28.0, 23.0, 23.0, 19.0, 23.0, 23.0, 22.0, 24.0, 15.0, 17.0, 10.0, 16.0, 11.0, 7.0, 8.0, 3.0, 4.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2261810302734375, -1.183807373046875, -1.1414337158203125, -1.09906005859375, -1.0566864013671875, -1.014312744140625, -0.9719390869140625, -0.9295654296875, -0.8871917724609375, -0.844818115234375, -0.8024444580078125, -0.76007080078125, -0.7176971435546875, -0.675323486328125, -0.6329498291015625, -0.590576171875, -0.5482025146484375, -0.505828857421875, -0.4634552001953125, -0.42108154296875, -0.3787078857421875, -0.336334228515625, -0.2939605712890625, -0.2515869140625, -0.2092132568359375, -0.166839599609375, -0.1244659423828125, -0.08209228515625, -0.0397186279296875, 0.002655029296875, 0.0450286865234375, 0.08740234375, 0.1297760009765625, 0.172149658203125, 0.2145233154296875, 0.25689697265625, 0.2992706298828125, 0.341644287109375, 0.3840179443359375, 0.4263916015625, 0.4687652587890625, 0.511138916015625, 0.5535125732421875, 0.59588623046875, 0.6382598876953125, 0.680633544921875, 0.7230072021484375, 0.765380859375, 0.8077545166015625, 0.850128173828125, 0.8925018310546875, 0.93487548828125, 0.9772491455078125, 1.019622802734375, 1.0619964599609375, 1.1043701171875, 1.1467437744140625, 1.189117431640625, 1.2314910888671875, 1.27386474609375, 1.3162384033203125, 1.358612060546875, 1.4009857177734375, 1.443359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 9.0, 12.0, 24.0, 15.0, 27.0, 46.0, 59.0, 90.0, 109.0, 210.0, 308.0, 516.0, 731.0, 1193.0, 1766.0, 2802.0, 4689.0, 7983.0, 14481.0, 28652.0, 596362.0, 328898.0, 26547.0, 13487.0, 7548.0, 4452.0, 2775.0, 1746.0, 1026.0, 689.0, 425.0, 308.0, 195.0, 127.0, 73.0, 47.0, 36.0, 31.0, 21.0, 14.0, 7.0, 12.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1768798828125, -0.17181968688964844, -0.16675949096679688, -0.1616992950439453, -0.15663909912109375, -0.1515789031982422, -0.14651870727539062, -0.14145851135253906, -0.1363983154296875, -0.13133811950683594, -0.12627792358398438, -0.12121772766113281, -0.11615753173828125, -0.11109733581542969, -0.10603713989257812, -0.10097694396972656, -0.095916748046875, -0.09085655212402344, -0.08579635620117188, -0.08073616027832031, -0.07567596435546875, -0.07061576843261719, -0.06555557250976562, -0.06049537658691406, -0.0554351806640625, -0.05037498474121094, -0.045314788818359375, -0.04025459289550781, -0.03519439697265625, -0.030134201049804688, -0.025074005126953125, -0.020013809204101562, -0.01495361328125, -0.009893417358398438, -0.004833221435546875, 0.0002269744873046875, 0.00528717041015625, 0.010347366333007812, 0.015407562255859375, 0.020467758178710938, 0.0255279541015625, 0.030588150024414062, 0.035648345947265625, 0.04070854187011719, 0.04576873779296875, 0.05082893371582031, 0.055889129638671875, 0.06094932556152344, 0.066009521484375, 0.07106971740722656, 0.07612991333007812, 0.08119010925292969, 0.08625030517578125, 0.09131050109863281, 0.09637069702148438, 0.10143089294433594, 0.1064910888671875, 0.11155128479003906, 0.11661148071289062, 0.12167167663574219, 0.12673187255859375, 0.1317920684814453, 0.13685226440429688, 0.14191246032714844, 0.14697265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 9.0, 11.0, 17.0, 24.0, 19.0, 38.0, 33.0, 48.0, 46.0, 56.0, 52.0, 67.0, 74.0, 56.0, 63.0, 56.0, 51.0, 43.0, 32.0, 29.0, 38.0, 30.0, 13.0, 17.0, 11.0, 13.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.1313858926296234e-05, -3.0143186450004578e-05, -2.897251397371292e-05, -2.7801841497421265e-05, -2.6631169021129608e-05, -2.546049654483795e-05, -2.4289824068546295e-05, -2.311915159225464e-05, -2.1948479115962982e-05, -2.0777806639671326e-05, -1.960713416337967e-05, -1.8436461687088013e-05, -1.7265789210796356e-05, -1.60951167345047e-05, -1.4924444258213043e-05, -1.3753771781921387e-05, -1.258309930562973e-05, -1.1412426829338074e-05, -1.0241754353046417e-05, -9.07108187675476e-06, -7.900409400463104e-06, -6.729736924171448e-06, -5.559064447879791e-06, -4.388391971588135e-06, -3.2177194952964783e-06, -2.0470470190048218e-06, -8.763745427131653e-07, 2.942979335784912e-07, 1.4649704098701477e-06, 2.635642886161804e-06, 3.8063153624534607e-06, 4.976987838745117e-06, 6.147660315036774e-06, 7.31833279132843e-06, 8.489005267620087e-06, 9.659677743911743e-06, 1.08303502202034e-05, 1.2001022696495056e-05, 1.3171695172786713e-05, 1.4342367649078369e-05, 1.5513040125370026e-05, 1.6683712601661682e-05, 1.785438507795334e-05, 1.9025057554244995e-05, 2.019573003053665e-05, 2.1366402506828308e-05, 2.2537074983119965e-05, 2.370774745941162e-05, 2.4878419935703278e-05, 2.6049092411994934e-05, 2.721976488828659e-05, 2.8390437364578247e-05, 2.9561109840869904e-05, 3.073178231716156e-05, 3.1902454793453217e-05, 3.307312726974487e-05, 3.424379974603653e-05, 3.5414472222328186e-05, 3.658514469861984e-05, 3.77558171749115e-05, 3.8926489651203156e-05, 4.009716212749481e-05, 4.126783460378647e-05, 4.2438507080078125e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 12.0, 29.0, 50.0, 55.0, 88.0, 168.0, 244.0, 338.0, 524.0, 938.0, 1530.0, 2553.0, 4356.0, 7806.0, 14568.0, 27175.0, 51326.0, 97521.0, 170502.0, 231786.0, 192073.0, 113840.0, 60271.0, 31694.0, 17046.0, 9338.0, 5179.0, 3035.0, 1673.0, 1027.0, 678.0, 361.0, 242.0, 156.0, 120.0, 82.0, 50.0, 40.0, 16.0, 18.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058837890625, -0.056708335876464844, -0.05457878112792969, -0.05244922637939453, -0.050319671630859375, -0.04819011688232422, -0.04606056213378906, -0.043931007385253906, -0.04180145263671875, -0.039671897888183594, -0.03754234313964844, -0.03541278839111328, -0.033283233642578125, -0.03115367889404297, -0.029024124145507812, -0.026894569396972656, -0.0247650146484375, -0.022635459899902344, -0.020505905151367188, -0.01837635040283203, -0.016246795654296875, -0.014117240905761719, -0.011987686157226562, -0.009858131408691406, -0.00772857666015625, -0.005599021911621094, -0.0034694671630859375, -0.0013399124145507812, 0.000789642333984375, 0.0029191970825195312, 0.0050487518310546875, 0.007178306579589844, 0.009307861328125, 0.011437416076660156, 0.013566970825195312, 0.01569652557373047, 0.017826080322265625, 0.01995563507080078, 0.022085189819335938, 0.024214744567871094, 0.02634429931640625, 0.028473854064941406, 0.030603408813476562, 0.03273296356201172, 0.034862518310546875, 0.03699207305908203, 0.03912162780761719, 0.041251182556152344, 0.0433807373046875, 0.045510292053222656, 0.04763984680175781, 0.04976940155029297, 0.051898956298828125, 0.05402851104736328, 0.05615806579589844, 0.058287620544433594, 0.06041717529296875, 0.0625467300415039, 0.06467628479003906, 0.06680583953857422, 0.06893539428710938, 0.07106494903564453, 0.07319450378417969, 0.07532405853271484, 0.07745361328125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 10.0, 9.0, 12.0, 7.0, 18.0, 27.0, 21.0, 32.0, 39.0, 27.0, 48.0, 53.0, 61.0, 61.0, 70.0, 60.0, 54.0, 56.0, 49.0, 39.0, 40.0, 31.0, 37.0, 26.0, 15.0, 13.0, 9.0, 10.0, 12.0, 7.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0193328857421875, -0.018761157989501953, -0.018189430236816406, -0.01761770248413086, -0.017045974731445312, -0.016474246978759766, -0.01590251922607422, -0.015330791473388672, -0.014759063720703125, -0.014187335968017578, -0.013615608215332031, -0.013043880462646484, -0.012472152709960938, -0.01190042495727539, -0.011328697204589844, -0.010756969451904297, -0.01018524169921875, -0.009613513946533203, -0.009041786193847656, -0.00847005844116211, -0.007898330688476562, -0.007326602935791016, -0.006754875183105469, -0.006183147430419922, -0.005611419677734375, -0.005039691925048828, -0.004467964172363281, -0.0038962364196777344, -0.0033245086669921875, -0.0027527809143066406, -0.0021810531616210938, -0.0016093254089355469, -0.00103759765625, -0.0004658699035644531, 0.00010585784912109375, 0.0006775856018066406, 0.0012493133544921875, 0.0018210411071777344, 0.0023927688598632812, 0.002964496612548828, 0.003536224365234375, 0.004107952117919922, 0.004679679870605469, 0.005251407623291016, 0.0058231353759765625, 0.006394863128662109, 0.006966590881347656, 0.007538318634033203, 0.00811004638671875, 0.008681774139404297, 0.009253501892089844, 0.00982522964477539, 0.010396957397460938, 0.010968685150146484, 0.011540412902832031, 0.012112140655517578, 0.012683868408203125, 0.013255596160888672, 0.013827323913574219, 0.014399051666259766, 0.014970779418945312, 0.01554250717163086, 0.016114234924316406, 0.016685962677001953, 0.0172576904296875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 9.0, 3.0, 7.0, 4.0, 4.0, 17.0, 13.0, 21.0, 28.0, 27.0, 34.0, 51.0, 57.0, 70.0, 62.0, 64.0, 70.0, 73.0, 66.0, 61.0, 52.0, 34.0, 27.0, 28.0, 26.0, 20.0, 16.0, 9.0, 8.0, 6.0, 7.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.278392314910889, -4.133045196533203, -3.9876976013183594, -3.842350482940674, -3.697003126144409, -3.5516557693481445, -3.406308650970459, -3.2609612941741943, -3.1156139373779297, -2.970266580581665, -2.8249192237854004, -2.679572105407715, -2.53422474861145, -2.3888773918151855, -2.2435302734375, -2.0981829166412354, -1.9528355598449707, -1.807488203048706, -1.662140965461731, -1.5167937278747559, -1.3714463710784912, -1.2260990142822266, -1.0807517766952515, -0.9354045391082764, -0.7900571823120117, -0.6447098851203918, -0.499362587928772, -0.3540152907371521, -0.20866799354553223, -0.06332069635391235, 0.08202660083770752, 0.22737383842468262, 0.37272071838378906, 0.5180680155754089, 0.6634153127670288, 0.8087626099586487, 0.9541099071502686, 1.0994572639465332, 1.2448045015335083, 1.3901517391204834, 1.535499095916748, 1.6808464527130127, 1.8261936902999878, 1.971540927886963, 2.1168882846832275, 2.262235641479492, 2.4075827598571777, 2.5529301166534424, 2.698277473449707, 2.8436248302459717, 2.9889721870422363, 3.134319305419922, 3.2796666622161865, 3.425014019012451, 3.5703611373901367, 3.7157084941864014, 3.861055850982666, 4.006402969360352, 4.151750564575195, 4.297097682952881, 4.442444801330566, 4.58779239654541, 4.733139514923096, 4.878486633300781, 5.023834228515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 10.0, 11.0, 11.0, 16.0, 8.0, 13.0, 17.0, 18.0, 25.0, 22.0, 19.0, 28.0, 26.0, 33.0, 28.0, 33.0, 37.0, 31.0, 27.0, 35.0, 54.0, 41.0, 35.0, 40.0, 30.0, 41.0, 38.0, 34.0, 30.0, 27.0, 23.0, 23.0, 18.0, 24.0, 12.0, 19.0, 11.0, 8.0, 10.0, 4.0, 9.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7050451040267944, -1.6472798585891724, -1.5895144939422607, -1.5317492485046387, -1.473983883857727, -1.416218638420105, -1.3584532737731934, -1.3006880283355713, -1.2429227828979492, -1.1851575374603271, -1.1273921728134155, -1.0696269273757935, -1.0118615627288818, -0.9540963172912598, -0.8963310122489929, -0.8385657072067261, -0.7808003425598145, -0.7230350375175476, -0.6652697324752808, -0.6075044870376587, -0.5497391223907471, -0.4919738471508026, -0.43420857191085815, -0.3764432668685913, -0.31867796182632446, -0.2609126567840576, -0.20314736664295197, -0.1453820765018463, -0.08761677145957947, -0.029851466417312622, 0.027913808822631836, 0.08567911386489868, 0.14344441890716553, 0.20120972394943237, 0.2589750289916992, 0.3167403042316437, 0.3745056092739105, 0.43227091431617737, 0.4900361895561218, 0.5478014945983887, 0.6055667996406555, 0.6633321046829224, 0.7210974097251892, 0.778862714767456, 0.8366279602050781, 0.8943933248519897, 0.9521585702896118, 1.0099239349365234, 1.0676891803741455, 1.1254544258117676, 1.1832197904586792, 1.2409850358963013, 1.298750400543213, 1.356515645980835, 1.414280891418457, 1.4720462560653687, 1.5298116207122803, 1.5875768661499023, 1.645342230796814, 1.703107476234436, 1.7608728408813477, 1.8186380863189697, 1.8764033317565918, 1.9341686964035034, 1.9919339418411255]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 11.0, 20.0, 20.0, 42.0, 77.0, 98.0, 128.0, 218.0, 349.0, 585.0, 975.0, 1551.0, 2663.0, 4779.0, 8291.0, 14726.0, 26864.0, 48478.0, 82217.0, 130019.0, 174190.0, 180841.0, 144901.0, 96157.0, 57218.0, 31781.0, 18156.0, 9759.0, 5586.0, 3123.0, 1839.0, 1040.0, 675.0, 428.0, 264.0, 179.0, 106.0, 79.0, 32.0, 18.0, 24.0, 12.0, 10.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.412353515625, -2.32666015625, -2.240966796875, -2.1552734375, -2.069580078125, -1.98388671875, -1.898193359375, -1.8125, -1.726806640625, -1.64111328125, -1.555419921875, -1.4697265625, -1.384033203125, -1.29833984375, -1.212646484375, -1.126953125, -1.041259765625, -0.95556640625, -0.869873046875, -0.7841796875, -0.698486328125, -0.61279296875, -0.527099609375, -0.44140625, -0.355712890625, -0.27001953125, -0.184326171875, -0.0986328125, -0.012939453125, 0.07275390625, 0.158447265625, 0.244140625, 0.329833984375, 0.41552734375, 0.501220703125, 0.5869140625, 0.672607421875, 0.75830078125, 0.843994140625, 0.9296875, 1.015380859375, 1.10107421875, 1.186767578125, 1.2724609375, 1.358154296875, 1.44384765625, 1.529541015625, 1.615234375, 1.700927734375, 1.78662109375, 1.872314453125, 1.9580078125, 2.043701171875, 2.12939453125, 2.215087890625, 2.30078125, 2.386474609375, 2.47216796875, 2.557861328125, 2.6435546875, 2.729248046875, 2.81494140625, 2.900634765625, 2.986328125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 13.0, 6.0, 16.0, 13.0, 17.0, 26.0, 24.0, 15.0, 14.0, 27.0, 22.0, 29.0, 26.0, 36.0, 29.0, 39.0, 33.0, 33.0, 33.0, 30.0, 40.0, 45.0, 43.0, 40.0, 37.0, 35.0, 35.0, 31.0, 30.0, 18.0, 27.0, 23.0, 19.0, 17.0, 7.0, 13.0, 15.0, 10.0, 3.0, 4.0, 8.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.09765625, -2.0311279296875, -1.964599609375, -1.8980712890625, -1.83154296875, -1.7650146484375, -1.698486328125, -1.6319580078125, -1.5654296875, -1.4989013671875, -1.432373046875, -1.3658447265625, -1.29931640625, -1.2327880859375, -1.166259765625, -1.0997314453125, -1.033203125, -0.9666748046875, -0.900146484375, -0.8336181640625, -0.76708984375, -0.7005615234375, -0.634033203125, -0.5675048828125, -0.5009765625, -0.4344482421875, -0.367919921875, -0.3013916015625, -0.23486328125, -0.1683349609375, -0.101806640625, -0.0352783203125, 0.03125, 0.0977783203125, 0.164306640625, 0.2308349609375, 0.29736328125, 0.3638916015625, 0.430419921875, 0.4969482421875, 0.5634765625, 0.6300048828125, 0.696533203125, 0.7630615234375, 0.82958984375, 0.8961181640625, 0.962646484375, 1.0291748046875, 1.095703125, 1.1622314453125, 1.228759765625, 1.2952880859375, 1.36181640625, 1.4283447265625, 1.494873046875, 1.5614013671875, 1.6279296875, 1.6944580078125, 1.760986328125, 1.8275146484375, 1.89404296875, 1.9605712890625, 2.027099609375, 2.0936279296875, 2.16015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 7.0, 8.0, 15.0, 18.0, 46.0, 42.0, 68.0, 98.0, 179.0, 226.0, 350.0, 587.0, 903.0, 1424.0, 2294.0, 3856.0, 6355.0, 10891.0, 18187.0, 30565.0, 49960.0, 79273.0, 115614.0, 149237.0, 159552.0, 139697.0, 103913.0, 68673.0, 42416.0, 25448.0, 15387.0, 8994.0, 5552.0, 3264.0, 1986.0, 1254.0, 737.0, 485.0, 335.0, 210.0, 140.0, 96.0, 62.0, 50.0, 34.0, 18.0, 10.0, 16.0, 12.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.443359375, -2.365386962890625, -2.28741455078125, -2.209442138671875, -2.1314697265625, -2.053497314453125, -1.97552490234375, -1.897552490234375, -1.819580078125, -1.741607666015625, -1.66363525390625, -1.585662841796875, -1.5076904296875, -1.429718017578125, -1.35174560546875, -1.273773193359375, -1.19580078125, -1.117828369140625, -1.03985595703125, -0.961883544921875, -0.8839111328125, -0.805938720703125, -0.72796630859375, -0.649993896484375, -0.572021484375, -0.494049072265625, -0.41607666015625, -0.338104248046875, -0.2601318359375, -0.182159423828125, -0.10418701171875, -0.026214599609375, 0.0517578125, 0.129730224609375, 0.20770263671875, 0.285675048828125, 0.3636474609375, 0.441619873046875, 0.51959228515625, 0.597564697265625, 0.675537109375, 0.753509521484375, 0.83148193359375, 0.909454345703125, 0.9874267578125, 1.065399169921875, 1.14337158203125, 1.221343994140625, 1.29931640625, 1.377288818359375, 1.45526123046875, 1.533233642578125, 1.6112060546875, 1.689178466796875, 1.76715087890625, 1.845123291015625, 1.923095703125, 2.001068115234375, 2.07904052734375, 2.157012939453125, 2.2349853515625, 2.312957763671875, 2.39093017578125, 2.468902587890625, 2.546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 6.0, 13.0, 14.0, 14.0, 19.0, 22.0, 18.0, 22.0, 28.0, 17.0, 16.0, 23.0, 30.0, 30.0, 42.0, 32.0, 45.0, 34.0, 24.0, 37.0, 41.0, 39.0, 45.0, 37.0, 29.0, 51.0, 32.0, 34.0, 21.0, 21.0, 19.0, 17.0, 13.0, 16.0, 13.0, 15.0, 10.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2705078125, -1.2288055419921875, -1.187103271484375, -1.1454010009765625, -1.10369873046875, -1.0619964599609375, -1.020294189453125, -0.9785919189453125, -0.9368896484375, -0.8951873779296875, -0.853485107421875, -0.8117828369140625, -0.77008056640625, -0.7283782958984375, -0.686676025390625, -0.6449737548828125, -0.603271484375, -0.5615692138671875, -0.519866943359375, -0.4781646728515625, -0.43646240234375, -0.3947601318359375, -0.353057861328125, -0.3113555908203125, -0.2696533203125, -0.2279510498046875, -0.186248779296875, -0.1445465087890625, -0.10284423828125, -0.0611419677734375, -0.019439697265625, 0.0222625732421875, 0.06396484375, 0.1056671142578125, 0.147369384765625, 0.1890716552734375, 0.23077392578125, 0.2724761962890625, 0.314178466796875, 0.3558807373046875, 0.3975830078125, 0.4392852783203125, 0.480987548828125, 0.5226898193359375, 0.56439208984375, 0.6060943603515625, 0.647796630859375, 0.6894989013671875, 0.731201171875, 0.7729034423828125, 0.814605712890625, 0.8563079833984375, 0.89801025390625, 0.9397125244140625, 0.981414794921875, 1.0231170654296875, 1.0648193359375, 1.1065216064453125, 1.148223876953125, 1.1899261474609375, 1.23162841796875, 1.2733306884765625, 1.315032958984375, 1.3567352294921875, 1.3984375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 4.0, 15.0, 12.0, 16.0, 18.0, 34.0, 52.0, 95.0, 112.0, 180.0, 260.0, 425.0, 645.0, 1055.0, 1622.0, 2684.0, 4336.0, 7315.0, 12311.0, 21421.0, 38694.0, 68384.0, 118096.0, 177524.0, 201459.0, 158868.0, 99524.0, 56996.0, 31973.0, 18074.0, 10507.0, 6053.0, 3822.0, 2150.0, 1345.0, 907.0, 549.0, 307.0, 249.0, 162.0, 103.0, 63.0, 35.0, 33.0, 24.0, 14.0, 10.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2935028076171875, -1.246185302734375, -1.1988677978515625, -1.15155029296875, -1.1042327880859375, -1.056915283203125, -1.0095977783203125, -0.9622802734375, -0.9149627685546875, -0.867645263671875, -0.8203277587890625, -0.77301025390625, -0.7256927490234375, -0.678375244140625, -0.6310577392578125, -0.583740234375, -0.5364227294921875, -0.489105224609375, -0.4417877197265625, -0.39447021484375, -0.3471527099609375, -0.299835205078125, -0.2525177001953125, -0.2052001953125, -0.1578826904296875, -0.110565185546875, -0.0632476806640625, -0.01593017578125, 0.0313873291015625, 0.078704833984375, 0.1260223388671875, 0.17333984375, 0.2206573486328125, 0.267974853515625, 0.3152923583984375, 0.36260986328125, 0.4099273681640625, 0.457244873046875, 0.5045623779296875, 0.5518798828125, 0.5991973876953125, 0.646514892578125, 0.6938323974609375, 0.74114990234375, 0.7884674072265625, 0.835784912109375, 0.8831024169921875, 0.930419921875, 0.9777374267578125, 1.025054931640625, 1.0723724365234375, 1.11968994140625, 1.1670074462890625, 1.214324951171875, 1.2616424560546875, 1.3089599609375, 1.3562774658203125, 1.403594970703125, 1.4509124755859375, 1.49822998046875, 1.5455474853515625, 1.592864990234375, 1.6401824951171875, 1.6875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 10.0, 17.0, 16.0, 20.0, 28.0, 40.0, 36.0, 47.0, 67.0, 83.0, 69.0, 79.0, 76.0, 71.0, 69.0, 49.0, 51.0, 35.0, 27.0, 27.0, 11.0, 18.0, 10.0, 10.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017762184143066406, -0.00017231516540050507, -0.00016700848937034607, -0.00016170181334018707, -0.00015639513731002808, -0.00015108846127986908, -0.00014578178524971008, -0.00014047510921955109, -0.0001351684331893921, -0.0001298617571592331, -0.0001245550811290741, -0.0001192484050989151, -0.0001139417290687561, -0.00010863505303859711, -0.00010332837700843811, -9.802170097827911e-05, -9.271502494812012e-05, -8.740834891796112e-05, -8.210167288780212e-05, -7.679499685764313e-05, -7.148832082748413e-05, -6.618164479732513e-05, -6.087496876716614e-05, -5.556829273700714e-05, -5.0261616706848145e-05, -4.495494067668915e-05, -3.964826464653015e-05, -3.4341588616371155e-05, -2.9034912586212158e-05, -2.372823655605316e-05, -1.8421560525894165e-05, -1.3114884495735168e-05, -7.808208465576172e-06, -2.5015324354171753e-06, 2.8051435947418213e-06, 8.111819624900818e-06, 1.3418495655059814e-05, 1.872517168521881e-05, 2.4031847715377808e-05, 2.9338523745536804e-05, 3.46451997756958e-05, 3.99518758058548e-05, 4.5258551836013794e-05, 5.056522786617279e-05, 5.587190389633179e-05, 6.117857992649078e-05, 6.648525595664978e-05, 7.179193198680878e-05, 7.709860801696777e-05, 8.240528404712677e-05, 8.771196007728577e-05, 9.301863610744476e-05, 9.832531213760376e-05, 0.00010363198816776276, 0.00010893866419792175, 0.00011424534022808075, 0.00011955201625823975, 0.00012485869228839874, 0.00013016536831855774, 0.00013547204434871674, 0.00014077872037887573, 0.00014608539640903473, 0.00015139207243919373, 0.00015669874846935272, 0.00016200542449951172]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 5.0, 9.0, 17.0, 30.0, 50.0, 66.0, 84.0, 142.0, 216.0, 305.0, 439.0, 595.0, 956.0, 1435.0, 2398.0, 3601.0, 5798.0, 9505.0, 15782.0, 26081.0, 44170.0, 73606.0, 115551.0, 160099.0, 175035.0, 148360.0, 103196.0, 64003.0, 37971.0, 22636.0, 13627.0, 8365.0, 5224.0, 3295.0, 2029.0, 1322.0, 851.0, 585.0, 334.0, 289.0, 146.0, 115.0, 77.0, 39.0, 28.0, 29.0, 15.0, 13.0, 11.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.3056640625, -1.2665252685546875, -1.227386474609375, -1.1882476806640625, -1.14910888671875, -1.1099700927734375, -1.070831298828125, -1.0316925048828125, -0.9925537109375, -0.9534149169921875, -0.914276123046875, -0.8751373291015625, -0.83599853515625, -0.7968597412109375, -0.757720947265625, -0.7185821533203125, -0.679443359375, -0.6403045654296875, -0.601165771484375, -0.5620269775390625, -0.52288818359375, -0.4837493896484375, -0.444610595703125, -0.4054718017578125, -0.3663330078125, -0.3271942138671875, -0.288055419921875, -0.2489166259765625, -0.20977783203125, -0.1706390380859375, -0.131500244140625, -0.0923614501953125, -0.05322265625, -0.0140838623046875, 0.025054931640625, 0.0641937255859375, 0.10333251953125, 0.1424713134765625, 0.181610107421875, 0.2207489013671875, 0.2598876953125, 0.2990264892578125, 0.338165283203125, 0.3773040771484375, 0.41644287109375, 0.4555816650390625, 0.494720458984375, 0.5338592529296875, 0.572998046875, 0.6121368408203125, 0.651275634765625, 0.6904144287109375, 0.72955322265625, 0.7686920166015625, 0.807830810546875, 0.8469696044921875, 0.8861083984375, 0.9252471923828125, 0.964385986328125, 1.0035247802734375, 1.04266357421875, 1.0818023681640625, 1.120941162109375, 1.1600799560546875, 1.19921875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 3.0, 5.0, 9.0, 16.0, 24.0, 17.0, 20.0, 42.0, 36.0, 49.0, 52.0, 55.0, 57.0, 72.0, 55.0, 66.0, 74.0, 51.0, 50.0, 39.0, 44.0, 26.0, 22.0, 23.0, 25.0, 17.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2727622985839844, -0.26061248779296875, -0.24846267700195312, -0.2363128662109375, -0.22416305541992188, -0.21201324462890625, -0.19986343383789062, -0.187713623046875, -0.17556381225585938, -0.16341400146484375, -0.15126419067382812, -0.1391143798828125, -0.12696456909179688, -0.11481475830078125, -0.10266494750976562, -0.09051513671875, -0.07836532592773438, -0.06621551513671875, -0.054065704345703125, -0.0419158935546875, -0.029766082763671875, -0.01761627197265625, -0.005466461181640625, 0.006683349609375, 0.018833160400390625, 0.03098297119140625, 0.043132781982421875, 0.0552825927734375, 0.06743240356445312, 0.07958221435546875, 0.09173202514648438, 0.1038818359375, 0.11603164672851562, 0.12818145751953125, 0.14033126831054688, 0.1524810791015625, 0.16463088989257812, 0.17678070068359375, 0.18893051147460938, 0.201080322265625, 0.21323013305664062, 0.22537994384765625, 0.23752975463867188, 0.2496795654296875, 0.2618293762207031, 0.27397918701171875, 0.2861289978027344, 0.29827880859375, 0.3104286193847656, 0.32257843017578125, 0.3347282409667969, 0.3468780517578125, 0.3590278625488281, 0.37117767333984375, 0.3833274841308594, 0.395477294921875, 0.4076271057128906, 0.41977691650390625, 0.4319267272949219, 0.4440765380859375, 0.4562263488769531, 0.46837615966796875, 0.4805259704589844, 0.49267578125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 9.0, 9.0, 16.0, 18.0, 29.0, 26.0, 33.0, 43.0, 46.0, 64.0, 60.0, 61.0, 64.0, 71.0, 64.0, 72.0, 57.0, 47.0, 37.0, 28.0, 17.0, 29.0, 24.0, 11.0, 9.0, 4.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.868194103240967, -4.724942207336426, -4.581690311431885, -4.438438415527344, -4.2951860427856445, -4.1519341468811035, -4.0086822509765625, -3.8654303550720215, -3.7221784591674805, -3.5789265632629395, -3.4356744289398193, -3.2924225330352783, -3.1491706371307373, -3.005918502807617, -2.862666606903076, -2.719414710998535, -2.576162576675415, -2.432910680770874, -2.289658546447754, -2.146406650543213, -2.003154754638672, -1.8599027395248413, -1.7166507244110107, -1.5733988285064697, -1.4301468133926392, -1.2868947982788086, -1.1436429023742676, -1.000390887260437, -0.8571389317512512, -0.7138869762420654, -0.5706349611282349, -0.42738306522369385, -0.2841310501098633, -0.1408790796995163, 0.0023728907108306885, 0.14562487602233887, 0.28887683153152466, 0.43212878704071045, 0.575380802154541, 0.718632698059082, 0.8618847131729126, 1.0051367282867432, 1.1483886241912842, 1.2916406393051147, 1.4348926544189453, 1.5781445503234863, 1.721396565437317, 1.864648461341858, 2.0079004764556885, 2.1511523723602295, 2.2944045066833496, 2.4376564025878906, 2.5809082984924316, 2.7241601943969727, 2.8674123287200928, 3.010664224624634, 3.153916358947754, 3.297168254852295, 3.440420389175415, 3.583672285079956, 3.726924180984497, 3.870176315307617, 4.013428211212158, 4.156680107116699, 4.29993200302124]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 7.0, 6.0, 12.0, 11.0, 12.0, 16.0, 12.0, 18.0, 27.0, 19.0, 14.0, 22.0, 22.0, 36.0, 39.0, 24.0, 26.0, 36.0, 34.0, 46.0, 41.0, 39.0, 47.0, 36.0, 36.0, 38.0, 37.0, 27.0, 31.0, 37.0, 25.0, 26.0, 24.0, 21.0, 16.0, 10.0, 14.0, 7.0, 8.0, 13.0, 5.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.992197871208191, -1.9318187236785889, -1.8714396953582764, -1.8110605478286743, -1.7506814002990723, -1.6903023719787598, -1.6299232244491577, -1.5695440769195557, -1.5091650485992432, -1.4487859010696411, -1.3884068727493286, -1.3280277252197266, -1.2676485776901245, -1.2072694301605225, -1.14689040184021, -1.086511254310608, -1.0261321067810059, -0.9657530188560486, -0.9053738713264465, -0.8449947834014893, -0.7846156358718872, -0.7242365479469299, -0.6638574600219727, -0.6034783124923706, -0.5430992245674133, -0.48272010684013367, -0.422340989112854, -0.36196190118789673, -0.30158278346061707, -0.2412036657333374, -0.18082457780838013, -0.12044546008110046, -0.06006622314453125, 0.00031288713216781616, 0.06069199740886688, 0.12107110023498535, 0.18145021796226501, 0.24182933568954468, 0.30220842361450195, 0.3625875413417816, 0.4229666590690613, 0.48334577679634094, 0.5437248945236206, 0.6041039824485779, 0.6644830703735352, 0.7248622179031372, 0.7852413058280945, 0.8456203937530518, 0.9059995412826538, 0.9663786292076111, 1.0267577171325684, 1.0871368646621704, 1.1475160121917725, 1.207895040512085, 1.268274188041687, 1.328653335571289, 1.3890323638916016, 1.4494115114212036, 1.5097905397415161, 1.5701696872711182, 1.6305488348007202, 1.6909279823303223, 1.7513070106506348, 1.8116861581802368, 1.8720653057098389]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 12.0, 17.0, 18.0, 22.0, 43.0, 74.0, 133.0, 199.0, 298.0, 498.0, 832.0, 1419.0, 2618.0, 4620.0, 8675.0, 16585.0, 34867.0, 79247.0, 198938.0, 562609.0, 1347464.0, 1192420.0, 452143.0, 162392.0, 66632.0, 30030.0, 14683.0, 7471.0, 3989.0, 2204.0, 1272.0, 765.0, 438.0, 247.0, 158.0, 101.0, 58.0, 33.0, 26.0, 10.0, 11.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.64776611328125, -4.4869384765625, -4.32611083984375, -4.165283203125, -4.00445556640625, -3.8436279296875, -3.68280029296875, -3.52197265625, -3.36114501953125, -3.2003173828125, -3.03948974609375, -2.878662109375, -2.71783447265625, -2.5570068359375, -2.39617919921875, -2.2353515625, -2.07452392578125, -1.9136962890625, -1.75286865234375, -1.592041015625, -1.43121337890625, -1.2703857421875, -1.10955810546875, -0.94873046875, -0.78790283203125, -0.6270751953125, -0.46624755859375, -0.305419921875, -0.14459228515625, 0.0162353515625, 0.17706298828125, 0.337890625, 0.49871826171875, 0.6595458984375, 0.82037353515625, 0.981201171875, 1.14202880859375, 1.3028564453125, 1.46368408203125, 1.62451171875, 1.78533935546875, 1.9461669921875, 2.10699462890625, 2.267822265625, 2.42864990234375, 2.5894775390625, 2.75030517578125, 2.9111328125, 3.07196044921875, 3.2327880859375, 3.39361572265625, 3.554443359375, 3.71527099609375, 3.8760986328125, 4.03692626953125, 4.19775390625, 4.35858154296875, 4.5194091796875, 4.68023681640625, 4.841064453125, 5.00189208984375, 5.1627197265625, 5.32354736328125, 5.484375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 8.0, 7.0, 13.0, 9.0, 19.0, 17.0, 20.0, 17.0, 11.0, 31.0, 20.0, 38.0, 29.0, 34.0, 44.0, 41.0, 42.0, 38.0, 41.0, 48.0, 35.0, 40.0, 36.0, 49.0, 30.0, 41.0, 32.0, 34.0, 22.0, 30.0, 18.0, 24.0, 15.0, 13.0, 8.0, 11.0, 10.0, 8.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.8583984375, -1.8057098388671875, -1.753021240234375, -1.7003326416015625, -1.64764404296875, -1.5949554443359375, -1.542266845703125, -1.4895782470703125, -1.4368896484375, -1.3842010498046875, -1.331512451171875, -1.2788238525390625, -1.22613525390625, -1.1734466552734375, -1.120758056640625, -1.0680694580078125, -1.015380859375, -0.9626922607421875, -0.910003662109375, -0.8573150634765625, -0.80462646484375, -0.7519378662109375, -0.699249267578125, -0.6465606689453125, -0.5938720703125, -0.5411834716796875, -0.488494873046875, -0.4358062744140625, -0.38311767578125, -0.3304290771484375, -0.277740478515625, -0.2250518798828125, -0.17236328125, -0.1196746826171875, -0.066986083984375, -0.0142974853515625, 0.03839111328125, 0.0910797119140625, 0.143768310546875, 0.1964569091796875, 0.2491455078125, 0.3018341064453125, 0.354522705078125, 0.4072113037109375, 0.45989990234375, 0.5125885009765625, 0.565277099609375, 0.6179656982421875, 0.670654296875, 0.7233428955078125, 0.776031494140625, 0.8287200927734375, 0.88140869140625, 0.9340972900390625, 0.986785888671875, 1.0394744873046875, 1.0921630859375, 1.1448516845703125, 1.197540283203125, 1.2502288818359375, 1.30291748046875, 1.3556060791015625, 1.408294677734375, 1.4609832763671875, 1.513671875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 8.0, 15.0, 20.0, 31.0, 33.0, 54.0, 86.0, 126.0, 180.0, 296.0, 420.0, 613.0, 970.0, 1446.0, 2363.0, 4023.0, 6676.0, 11517.0, 20180.0, 37937.0, 72101.0, 141521.0, 287879.0, 578844.0, 980187.0, 950174.0, 543755.0, 269077.0, 133547.0, 67561.0, 35751.0, 19595.0, 10842.0, 6314.0, 3635.0, 2349.0, 1418.0, 925.0, 592.0, 385.0, 253.0, 174.0, 123.0, 86.0, 62.0, 34.0, 24.0, 20.0, 16.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-4.07421875, -3.94671630859375, -3.8192138671875, -3.69171142578125, -3.564208984375, -3.43670654296875, -3.3092041015625, -3.18170166015625, -3.05419921875, -2.92669677734375, -2.7991943359375, -2.67169189453125, -2.544189453125, -2.41668701171875, -2.2891845703125, -2.16168212890625, -2.0341796875, -1.90667724609375, -1.7791748046875, -1.65167236328125, -1.524169921875, -1.39666748046875, -1.2691650390625, -1.14166259765625, -1.01416015625, -0.88665771484375, -0.7591552734375, -0.63165283203125, -0.504150390625, -0.37664794921875, -0.2491455078125, -0.12164306640625, 0.005859375, 0.13336181640625, 0.2608642578125, 0.38836669921875, 0.515869140625, 0.64337158203125, 0.7708740234375, 0.89837646484375, 1.02587890625, 1.15338134765625, 1.2808837890625, 1.40838623046875, 1.535888671875, 1.66339111328125, 1.7908935546875, 1.91839599609375, 2.0458984375, 2.17340087890625, 2.3009033203125, 2.42840576171875, 2.555908203125, 2.68341064453125, 2.8109130859375, 2.93841552734375, 3.06591796875, 3.19342041015625, 3.3209228515625, 3.44842529296875, 3.575927734375, 3.70343017578125, 3.8309326171875, 3.95843505859375, 4.0859375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 7.0, 11.0, 7.0, 10.0, 12.0, 16.0, 25.0, 24.0, 51.0, 51.0, 73.0, 68.0, 77.0, 107.0, 114.0, 135.0, 164.0, 200.0, 215.0, 219.0, 247.0, 272.0, 272.0, 241.0, 227.0, 205.0, 181.0, 159.0, 144.0, 105.0, 98.0, 61.0, 51.0, 47.0, 42.0, 36.0, 27.0, 12.0, 15.0, 13.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8853073120117188, -0.8531341552734375, -0.8209609985351562, -0.788787841796875, -0.7566146850585938, -0.7244415283203125, -0.6922683715820312, -0.66009521484375, -0.6279220581054688, -0.5957489013671875, -0.5635757446289062, -0.531402587890625, -0.49922943115234375, -0.4670562744140625, -0.43488311767578125, -0.4027099609375, -0.37053680419921875, -0.3383636474609375, -0.30619049072265625, -0.274017333984375, -0.24184417724609375, -0.2096710205078125, -0.17749786376953125, -0.14532470703125, -0.11315155029296875, -0.0809783935546875, -0.04880523681640625, -0.016632080078125, 0.01554107666015625, 0.0477142333984375, 0.07988739013671875, 0.112060546875, 0.14423370361328125, 0.1764068603515625, 0.20858001708984375, 0.240753173828125, 0.27292633056640625, 0.3050994873046875, 0.33727264404296875, 0.36944580078125, 0.40161895751953125, 0.4337921142578125, 0.46596527099609375, 0.498138427734375, 0.5303115844726562, 0.5624847412109375, 0.5946578979492188, 0.6268310546875, 0.6590042114257812, 0.6911773681640625, 0.7233505249023438, 0.755523681640625, 0.7876968383789062, 0.8198699951171875, 0.8520431518554688, 0.88421630859375, 0.9163894653320312, 0.9485626220703125, 0.9807357788085938, 1.012908935546875, 1.0450820922851562, 1.0772552490234375, 1.1094284057617188, 1.1416015625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 0.0, 6.0, 7.0, 11.0, 14.0, 18.0, 26.0, 41.0, 37.0, 50.0, 53.0, 86.0, 95.0, 67.0, 86.0, 84.0, 51.0, 59.0, 59.0, 33.0, 25.0, 19.0, 16.0, 13.0, 12.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.172397613525391, -6.000027179718018, -5.8276567459106445, -5.655285835266113, -5.48291540145874, -5.310544967651367, -5.138174533843994, -4.965804100036621, -4.79343318939209, -4.621062755584717, -4.448692321777344, -4.2763214111328125, -4.1039509773254395, -3.9315805435180664, -3.7592101097106934, -3.5868396759033203, -3.4144692420959473, -3.242098808288574, -3.069728136062622, -2.897357702255249, -2.724987030029297, -2.552616596221924, -2.380246162414551, -2.2078757286071777, -2.0355050563812256, -1.863134503364563, -1.6907639503479004, -1.5183935165405273, -1.3460229635238647, -1.1736524105072021, -1.001281976699829, -0.8289114236831665, -0.6565403938293457, -0.4841698706150055, -0.3117993474006653, -0.13942885398864746, 0.03294169902801514, 0.20531225204467773, 0.3776826858520508, 0.5500532388687134, 0.722423791885376, 0.8947943449020386, 1.0671648979187012, 1.2395353317260742, 1.4119058847427368, 1.5842764377593994, 1.7566468715667725, 1.929017424583435, 2.1013879776000977, 2.2737584114074707, 2.446129083633423, 2.618499517440796, 2.790870189666748, 2.963240623474121, 3.135611057281494, 3.307981491088867, 3.4803521633148193, 3.6527225971221924, 3.8250932693481445, 3.9974637031555176, 4.169834136962891, 4.342205047607422, 4.514575004577637, 4.686945915222168, 4.859316349029541]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 12.0, 10.0, 5.0, 16.0, 14.0, 19.0, 24.0, 11.0, 20.0, 18.0, 19.0, 20.0, 33.0, 30.0, 33.0, 32.0, 34.0, 28.0, 40.0, 35.0, 31.0, 40.0, 42.0, 44.0, 33.0, 25.0, 30.0, 35.0, 24.0, 21.0, 30.0, 26.0, 25.0, 26.0, 11.0, 11.0, 11.0, 8.0, 10.0, 9.0, 2.0, 8.0, 11.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.6643472909927368, -1.6124193668365479, -1.5604914426803589, -1.50856351852417, -1.4566354751586914, -1.4047075510025024, -1.3527796268463135, -1.3008517026901245, -1.2489237785339355, -1.1969958543777466, -1.1450679302215576, -1.093139886856079, -1.0412119626998901, -0.9892840385437012, -0.9373561143875122, -0.8854281902313232, -0.8335001468658447, -0.7815722227096558, -0.729644238948822, -0.6777163147926331, -0.6257883310317993, -0.5738604068756104, -0.5219324827194214, -0.47000452876091003, -0.4180765748023987, -0.36614862084388733, -0.314220666885376, -0.262292742729187, -0.21036478877067566, -0.1584368348121643, -0.10650891065597534, -0.05458095669746399, -0.0026531219482421875, 0.04927482455968857, 0.10120277106761932, 0.15313071012496948, 0.20505866408348083, 0.2569866180419922, 0.30891454219818115, 0.3608424961566925, 0.41277045011520386, 0.4646984040737152, 0.5166263580322266, 0.5685542821884155, 0.6204822063446045, 0.6724101901054382, 0.7243381142616272, 0.7762660980224609, 0.8281940221786499, 0.8801219463348389, 0.9320499300956726, 0.9839778542518616, 1.0359058380126953, 1.0878337621688843, 1.1397616863250732, 1.1916896104812622, 1.2436175346374512, 1.2955454587936401, 1.347473382949829, 1.3994014263153076, 1.4513293504714966, 1.5032572746276855, 1.5551851987838745, 1.6071131229400635, 1.659041166305542]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 22.0, 31.0, 37.0, 36.0, 70.0, 101.0, 195.0, 276.0, 458.0, 765.0, 1103.0, 1784.0, 2949.0, 4554.0, 7714.0, 12976.0, 22532.0, 39025.0, 68688.0, 119159.0, 180762.0, 204086.0, 156394.0, 94745.0, 54244.0, 31093.0, 17896.0, 10541.0, 6200.0, 3717.0, 2431.0, 1392.0, 928.0, 577.0, 410.0, 250.0, 128.0, 94.0, 58.0, 46.0, 23.0, 20.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.25749969482421875, -0.2483978271484375, -0.23929595947265625, -0.230194091796875, -0.22109222412109375, -0.2119903564453125, -0.20288848876953125, -0.19378662109375, -0.18468475341796875, -0.1755828857421875, -0.16648101806640625, -0.157379150390625, -0.14827728271484375, -0.1391754150390625, -0.13007354736328125, -0.1209716796875, -0.11186981201171875, -0.1027679443359375, -0.09366607666015625, -0.084564208984375, -0.07546234130859375, -0.0663604736328125, -0.05725860595703125, -0.04815673828125, -0.03905487060546875, -0.0299530029296875, -0.02085113525390625, -0.011749267578125, -0.00264739990234375, 0.0064544677734375, 0.01555633544921875, 0.024658203125, 0.03376007080078125, 0.0428619384765625, 0.05196380615234375, 0.061065673828125, 0.07016754150390625, 0.0792694091796875, 0.08837127685546875, 0.09747314453125, 0.10657501220703125, 0.1156768798828125, 0.12477874755859375, 0.133880615234375, 0.14298248291015625, 0.1520843505859375, 0.16118621826171875, 0.1702880859375, 0.17938995361328125, 0.1884918212890625, 0.19759368896484375, 0.206695556640625, 0.21579742431640625, 0.2248992919921875, 0.23400115966796875, 0.24310302734375, 0.25220489501953125, 0.2613067626953125, 0.27040863037109375, 0.279510498046875, 0.28861236572265625, 0.2977142333984375, 0.30681610107421875, 0.31591796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 8.0, 10.0, 12.0, 14.0, 10.0, 15.0, 19.0, 16.0, 22.0, 31.0, 23.0, 37.0, 47.0, 32.0, 45.0, 39.0, 44.0, 33.0, 32.0, 47.0, 55.0, 47.0, 36.0, 38.0, 40.0, 30.0, 33.0, 25.0, 32.0, 20.0, 23.0, 13.0, 9.0, 17.0, 7.0, 11.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.087554931640625, -2.01495361328125, -1.942352294921875, -1.8697509765625, -1.797149658203125, -1.72454833984375, -1.651947021484375, -1.579345703125, -1.506744384765625, -1.43414306640625, -1.361541748046875, -1.2889404296875, -1.216339111328125, -1.14373779296875, -1.071136474609375, -0.99853515625, -0.925933837890625, -0.85333251953125, -0.780731201171875, -0.7081298828125, -0.635528564453125, -0.56292724609375, -0.490325927734375, -0.417724609375, -0.345123291015625, -0.27252197265625, -0.199920654296875, -0.1273193359375, -0.054718017578125, 0.01788330078125, 0.090484619140625, 0.1630859375, 0.235687255859375, 0.30828857421875, 0.380889892578125, 0.4534912109375, 0.526092529296875, 0.59869384765625, 0.671295166015625, 0.743896484375, 0.816497802734375, 0.88909912109375, 0.961700439453125, 1.0343017578125, 1.106903076171875, 1.17950439453125, 1.252105712890625, 1.32470703125, 1.397308349609375, 1.46990966796875, 1.542510986328125, 1.6151123046875, 1.687713623046875, 1.76031494140625, 1.832916259765625, 1.905517578125, 1.978118896484375, 2.05072021484375, 2.123321533203125, 2.1959228515625, 2.268524169921875, 2.34112548828125, 2.413726806640625, 2.486328125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 13.0, 13.0, 16.0, 26.0, 33.0, 38.0, 63.0, 88.0, 136.0, 176.0, 337.0, 570.0, 958.0, 1697.0, 3674.0, 8331.0, 23168.0, 211303.0, 747447.0, 30491.0, 10686.0, 4421.0, 2013.0, 1126.0, 582.0, 397.0, 259.0, 139.0, 92.0, 74.0, 59.0, 31.0, 25.0, 18.0, 8.0, 13.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.21484375, -1.1770172119140625, -1.139190673828125, -1.1013641357421875, -1.06353759765625, -1.0257110595703125, -0.987884521484375, -0.9500579833984375, -0.9122314453125, -0.8744049072265625, -0.836578369140625, -0.7987518310546875, -0.76092529296875, -0.7230987548828125, -0.685272216796875, -0.6474456787109375, -0.609619140625, -0.5717926025390625, -0.533966064453125, -0.4961395263671875, -0.45831298828125, -0.4204864501953125, -0.382659912109375, -0.3448333740234375, -0.3070068359375, -0.2691802978515625, -0.231353759765625, -0.1935272216796875, -0.15570068359375, -0.1178741455078125, -0.080047607421875, -0.0422210693359375, -0.00439453125, 0.0334320068359375, 0.071258544921875, 0.1090850830078125, 0.14691162109375, 0.1847381591796875, 0.222564697265625, 0.2603912353515625, 0.2982177734375, 0.3360443115234375, 0.373870849609375, 0.4116973876953125, 0.44952392578125, 0.4873504638671875, 0.525177001953125, 0.5630035400390625, 0.600830078125, 0.6386566162109375, 0.676483154296875, 0.7143096923828125, 0.75213623046875, 0.7899627685546875, 0.827789306640625, 0.8656158447265625, 0.9034423828125, 0.9412689208984375, 0.979095458984375, 1.0169219970703125, 1.05474853515625, 1.0925750732421875, 1.130401611328125, 1.1682281494140625, 1.2060546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 6.0, 11.0, 11.0, 17.0, 11.0, 22.0, 18.0, 24.0, 30.0, 36.0, 30.0, 30.0, 42.0, 37.0, 32.0, 31.0, 40.0, 45.0, 51.0, 41.0, 34.0, 45.0, 47.0, 40.0, 38.0, 38.0, 28.0, 21.0, 19.0, 24.0, 16.0, 12.0, 13.0, 9.0, 5.0, 10.0, 4.0, 4.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.2974853515625, -1.250244140625, -1.2030029296875, -1.15576171875, -1.1085205078125, -1.061279296875, -1.0140380859375, -0.966796875, -0.9195556640625, -0.872314453125, -0.8250732421875, -0.77783203125, -0.7305908203125, -0.683349609375, -0.6361083984375, -0.5888671875, -0.5416259765625, -0.494384765625, -0.4471435546875, -0.39990234375, -0.3526611328125, -0.305419921875, -0.2581787109375, -0.2109375, -0.1636962890625, -0.116455078125, -0.0692138671875, -0.02197265625, 0.0252685546875, 0.072509765625, 0.1197509765625, 0.1669921875, 0.2142333984375, 0.261474609375, 0.3087158203125, 0.35595703125, 0.4031982421875, 0.450439453125, 0.4976806640625, 0.544921875, 0.5921630859375, 0.639404296875, 0.6866455078125, 0.73388671875, 0.7811279296875, 0.828369140625, 0.8756103515625, 0.9228515625, 0.9700927734375, 1.017333984375, 1.0645751953125, 1.11181640625, 1.1590576171875, 1.206298828125, 1.2535400390625, 1.30078125, 1.3480224609375, 1.395263671875, 1.4425048828125, 1.48974609375, 1.5369873046875, 1.584228515625, 1.6314697265625, 1.6787109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 12.0, 7.0, 5.0, 8.0, 28.0, 32.0, 37.0, 60.0, 96.0, 124.0, 204.0, 299.0, 461.0, 809.0, 1405.0, 2594.0, 4836.0, 10603.0, 26809.0, 790727.0, 168339.0, 22337.0, 9116.0, 4222.0, 2181.0, 1224.0, 728.0, 478.0, 272.0, 161.0, 90.0, 66.0, 49.0, 43.0, 21.0, 23.0, 17.0, 8.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26624298095703125, -0.2573394775390625, -0.24843597412109375, -0.239532470703125, -0.23062896728515625, -0.2217254638671875, -0.21282196044921875, -0.20391845703125, -0.19501495361328125, -0.1861114501953125, -0.17720794677734375, -0.168304443359375, -0.15940093994140625, -0.1504974365234375, -0.14159393310546875, -0.1326904296875, -0.12378692626953125, -0.1148834228515625, -0.10597991943359375, -0.097076416015625, -0.08817291259765625, -0.0792694091796875, -0.07036590576171875, -0.06146240234375, -0.05255889892578125, -0.0436553955078125, -0.03475189208984375, -0.025848388671875, -0.01694488525390625, -0.0080413818359375, 0.00086212158203125, 0.009765625, 0.01866912841796875, 0.0275726318359375, 0.03647613525390625, 0.045379638671875, 0.05428314208984375, 0.0631866455078125, 0.07209014892578125, 0.08099365234375, 0.08989715576171875, 0.0988006591796875, 0.10770416259765625, 0.116607666015625, 0.12551116943359375, 0.1344146728515625, 0.14331817626953125, 0.1522216796875, 0.16112518310546875, 0.1700286865234375, 0.17893218994140625, 0.187835693359375, 0.19673919677734375, 0.2056427001953125, 0.21454620361328125, 0.22344970703125, 0.23235321044921875, 0.2412567138671875, 0.25016021728515625, 0.259063720703125, 0.26796722412109375, 0.2768707275390625, 0.28577423095703125, 0.294677734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 2.0, 4.0, 7.0, 14.0, 11.0, 13.0, 13.0, 22.0, 21.0, 18.0, 18.0, 29.0, 36.0, 44.0, 35.0, 49.0, 43.0, 41.0, 61.0, 51.0, 54.0, 41.0, 56.0, 41.0, 45.0, 28.0, 41.0, 21.0, 21.0, 26.0, 13.0, 18.0, 9.0, 9.0, 9.0, 3.0, 8.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.184246063232422e-05, -4.0601007640361786e-05, -3.935955464839935e-05, -3.811810165643692e-05, -3.687664866447449e-05, -3.5635195672512054e-05, -3.439374268054962e-05, -3.315228968858719e-05, -3.1910836696624756e-05, -3.066938370466232e-05, -2.942793071269989e-05, -2.8186477720737457e-05, -2.6945024728775024e-05, -2.570357173681259e-05, -2.446211874485016e-05, -2.3220665752887726e-05, -2.1979212760925293e-05, -2.073775976896286e-05, -1.9496306777000427e-05, -1.8254853785037994e-05, -1.701340079307556e-05, -1.577194780111313e-05, -1.4530494809150696e-05, -1.3289041817188263e-05, -1.204758882522583e-05, -1.0806135833263397e-05, -9.564682841300964e-06, -8.323229849338531e-06, -7.081776857376099e-06, -5.840323865413666e-06, -4.598870873451233e-06, -3.3574178814888e-06, -2.115964889526367e-06, -8.745118975639343e-07, 3.6694109439849854e-07, 1.6083940863609314e-06, 2.8498470783233643e-06, 4.091300070285797e-06, 5.33275306224823e-06, 6.574206054210663e-06, 7.815659046173096e-06, 9.057112038135529e-06, 1.0298565030097961e-05, 1.1540018022060394e-05, 1.2781471014022827e-05, 1.402292400598526e-05, 1.5264376997947693e-05, 1.6505829989910126e-05, 1.774728298187256e-05, 1.898873597383499e-05, 2.0230188965797424e-05, 2.1471641957759857e-05, 2.271309494972229e-05, 2.3954547941684723e-05, 2.5196000933647156e-05, 2.643745392560959e-05, 2.767890691757202e-05, 2.8920359909534454e-05, 3.0161812901496887e-05, 3.140326589345932e-05, 3.264471888542175e-05, 3.3886171877384186e-05, 3.512762486934662e-05, 3.636907786130905e-05, 3.7610530853271484e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [6.0, 5.0, 5.0, 4.0, 8.0, 14.0, 20.0, 23.0, 24.0, 39.0, 44.0, 77.0, 122.0, 153.0, 210.0, 279.0, 416.0, 558.0, 771.0, 1094.0, 1661.0, 2290.0, 3371.0, 5129.0, 7983.0, 13040.0, 21359.0, 37246.0, 66164.0, 116637.0, 185253.0, 213896.0, 153189.0, 90693.0, 50861.0, 28460.0, 16905.0, 10218.0, 6586.0, 4299.0, 2760.0, 1956.0, 1309.0, 965.0, 726.0, 506.0, 366.0, 227.0, 168.0, 129.0, 113.0, 67.0, 50.0, 34.0, 16.0, 21.0, 15.0, 12.0, 6.0, 9.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.0679931640625, -0.06581878662109375, -0.0636444091796875, -0.06147003173828125, -0.059295654296875, -0.05712127685546875, -0.0549468994140625, -0.05277252197265625, -0.05059814453125, -0.04842376708984375, -0.0462493896484375, -0.04407501220703125, -0.041900634765625, -0.03972625732421875, -0.0375518798828125, -0.03537750244140625, -0.033203125, -0.03102874755859375, -0.0288543701171875, -0.02667999267578125, -0.024505615234375, -0.02233123779296875, -0.0201568603515625, -0.01798248291015625, -0.01580810546875, -0.01363372802734375, -0.0114593505859375, -0.00928497314453125, -0.007110595703125, -0.00493621826171875, -0.0027618408203125, -0.00058746337890625, 0.0015869140625, 0.00376129150390625, 0.0059356689453125, 0.00811004638671875, 0.010284423828125, 0.01245880126953125, 0.0146331787109375, 0.01680755615234375, 0.01898193359375, 0.02115631103515625, 0.0233306884765625, 0.02550506591796875, 0.027679443359375, 0.02985382080078125, 0.0320281982421875, 0.03420257568359375, 0.036376953125, 0.03855133056640625, 0.0407257080078125, 0.04290008544921875, 0.045074462890625, 0.04724884033203125, 0.0494232177734375, 0.05159759521484375, 0.05377197265625, 0.05594635009765625, 0.0581207275390625, 0.06029510498046875, 0.062469482421875, 0.06464385986328125, 0.0668182373046875, 0.06899261474609375, 0.0711669921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 8.0, 6.0, 11.0, 13.0, 17.0, 28.0, 28.0, 39.0, 42.0, 72.0, 44.0, 61.0, 62.0, 90.0, 73.0, 66.0, 68.0, 50.0, 46.0, 46.0, 31.0, 21.0, 23.0, 14.0, 9.0, 10.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023406982421875, -0.022638797760009766, -0.02187061309814453, -0.021102428436279297, -0.020334243774414062, -0.019566059112548828, -0.018797874450683594, -0.01802968978881836, -0.017261505126953125, -0.01649332046508789, -0.015725135803222656, -0.014956951141357422, -0.014188766479492188, -0.013420581817626953, -0.012652397155761719, -0.011884212493896484, -0.01111602783203125, -0.010347843170166016, -0.009579658508300781, -0.008811473846435547, -0.008043289184570312, -0.007275104522705078, -0.006506919860839844, -0.005738735198974609, -0.004970550537109375, -0.004202365875244141, -0.0034341812133789062, -0.002665996551513672, -0.0018978118896484375, -0.0011296272277832031, -0.00036144256591796875, 0.0004067420959472656, 0.0011749267578125, 0.0019431114196777344, 0.0027112960815429688, 0.003479480743408203, 0.0042476654052734375, 0.005015850067138672, 0.005784034729003906, 0.006552219390869141, 0.007320404052734375, 0.00808858871459961, 0.008856773376464844, 0.009624958038330078, 0.010393142700195312, 0.011161327362060547, 0.011929512023925781, 0.012697696685791016, 0.01346588134765625, 0.014234066009521484, 0.015002250671386719, 0.015770435333251953, 0.016538619995117188, 0.017306804656982422, 0.018074989318847656, 0.01884317398071289, 0.019611358642578125, 0.02037954330444336, 0.021147727966308594, 0.021915912628173828, 0.022684097290039062, 0.023452281951904297, 0.02422046661376953, 0.024988651275634766, 0.0257568359375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 5.0, 8.0, 11.0, 17.0, 21.0, 31.0, 32.0, 47.0, 47.0, 58.0, 89.0, 99.0, 63.0, 95.0, 73.0, 57.0, 50.0, 59.0, 27.0, 23.0, 20.0, 17.0, 11.0, 9.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.15084171295166, -5.977791786193848, -5.804741859436035, -5.631691932678223, -5.45864200592041, -5.285592079162598, -5.112542152404785, -4.939492702484131, -4.766442775726318, -4.593392848968506, -4.420342922210693, -4.247292995452881, -4.074243068695068, -3.901193380355835, -3.7281434535980225, -3.555093765258789, -3.3820436000823975, -3.208993673324585, -3.0359437465667725, -2.862894058227539, -2.6898441314697266, -2.516794204711914, -2.3437442779541016, -2.170694351196289, -1.9976445436477661, -1.8245946168899536, -1.6515448093414307, -1.4784948825836182, -1.3054449558258057, -1.1323951482772827, -0.9593452215194702, -0.7862954139709473, -0.6132454872131348, -0.44019562005996704, -0.26714572310447693, -0.09409582614898682, 0.07895404100418091, 0.25200390815734863, 0.42505383491516113, 0.5981036424636841, 0.7711535692214966, 0.9442034363746643, 1.117253303527832, 1.2903032302856445, 1.463353157043457, 1.63640296459198, 1.8094528913497925, 1.9825026988983154, 2.155552625656128, 2.3286025524139404, 2.501652479171753, 2.6747021675109863, 2.847752094268799, 3.0208020210266113, 3.193851947784424, 3.3669018745422363, 3.539951801300049, 3.7130017280578613, 3.886051654815674, 4.059101581573486, 4.232151508331299, 4.405200958251953, 4.578250885009766, 4.751300811767578, 4.924350738525391]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 11.0, 11.0, 6.0, 13.0, 15.0, 21.0, 23.0, 11.0, 20.0, 19.0, 16.0, 20.0, 36.0, 28.0, 32.0, 31.0, 40.0, 26.0, 39.0, 33.0, 32.0, 40.0, 42.0, 40.0, 35.0, 27.0, 28.0, 35.0, 28.0, 20.0, 25.0, 31.0, 24.0, 27.0, 10.0, 11.0, 10.0, 10.0, 8.0, 11.0, 1.0, 9.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0], "bins": [-1.6304569244384766, -1.5789599418640137, -1.5274629592895508, -1.4759658575057983, -1.4244688749313354, -1.3729718923568726, -1.3214747905731201, -1.2699778079986572, -1.2184808254241943, -1.1669838428497314, -1.1154868602752686, -1.0639897584915161, -1.0124927759170532, -0.9609957933425903, -0.9094987511634827, -0.858001708984375, -0.8065047264099121, -0.7550077438354492, -0.7035107016563416, -0.6520136594772339, -0.600516676902771, -0.5490196943283081, -0.49752265214920044, -0.44602563977241516, -0.3945286273956299, -0.3430316150188446, -0.2915346026420593, -0.24003759026527405, -0.18854057788848877, -0.1370435655117035, -0.08554655313491821, -0.034049540758132935, 0.017447471618652344, 0.06894448399543762, 0.1204414963722229, 0.17193850874900818, 0.22343552112579346, 0.27493253350257874, 0.326429545879364, 0.3779265582561493, 0.42942357063293457, 0.48092058300971985, 0.5324175953865051, 0.5839146375656128, 0.6354116201400757, 0.6869086027145386, 0.7384056448936462, 0.7899026870727539, 0.8413996696472168, 0.8928966522216797, 0.9443936944007874, 0.995890736579895, 1.047387719154358, 1.0988847017288208, 1.1503818035125732, 1.2018787860870361, 1.253375768661499, 1.304872751235962, 1.3563697338104248, 1.4078668355941772, 1.4593638181686401, 1.510860800743103, 1.5623579025268555, 1.6138548851013184, 1.6653518676757812]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 8.0, 2.0, 5.0, 13.0, 18.0, 23.0, 37.0, 41.0, 56.0, 83.0, 150.0, 159.0, 291.0, 432.0, 645.0, 1065.0, 1710.0, 3032.0, 5445.0, 10351.0, 19737.0, 38136.0, 72313.0, 125851.0, 184243.0, 202256.0, 161700.0, 101738.0, 56245.0, 29273.0, 14963.0, 7892.0, 4297.0, 2458.0, 1449.0, 853.0, 527.0, 359.0, 228.0, 140.0, 98.0, 63.0, 49.0, 35.0, 26.0, 19.0, 17.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.876953125, -2.77874755859375, -2.6805419921875, -2.58233642578125, -2.484130859375, -2.38592529296875, -2.2877197265625, -2.18951416015625, -2.09130859375, -1.99310302734375, -1.8948974609375, -1.79669189453125, -1.698486328125, -1.60028076171875, -1.5020751953125, -1.40386962890625, -1.3056640625, -1.20745849609375, -1.1092529296875, -1.01104736328125, -0.912841796875, -0.81463623046875, -0.7164306640625, -0.61822509765625, -0.52001953125, -0.42181396484375, -0.3236083984375, -0.22540283203125, -0.127197265625, -0.02899169921875, 0.0692138671875, 0.16741943359375, 0.265625, 0.36383056640625, 0.4620361328125, 0.56024169921875, 0.658447265625, 0.75665283203125, 0.8548583984375, 0.95306396484375, 1.05126953125, 1.14947509765625, 1.2476806640625, 1.34588623046875, 1.444091796875, 1.54229736328125, 1.6405029296875, 1.73870849609375, 1.8369140625, 1.93511962890625, 2.0333251953125, 2.13153076171875, 2.229736328125, 2.32794189453125, 2.4261474609375, 2.52435302734375, 2.62255859375, 2.72076416015625, 2.8189697265625, 2.91717529296875, 3.015380859375, 3.11358642578125, 3.2117919921875, 3.30999755859375, 3.408203125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 5.0, 7.0, 10.0, 8.0, 13.0, 8.0, 10.0, 20.0, 16.0, 20.0, 26.0, 24.0, 26.0, 22.0, 26.0, 34.0, 36.0, 37.0, 35.0, 43.0, 48.0, 39.0, 39.0, 34.0, 41.0, 30.0, 29.0, 26.0, 33.0, 29.0, 24.0, 20.0, 27.0, 27.0, 22.0, 13.0, 11.0, 14.0, 6.0, 11.0, 3.0, 8.0, 5.0, 10.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.11328125, -2.0505828857421875, -1.987884521484375, -1.9251861572265625, -1.86248779296875, -1.7997894287109375, -1.737091064453125, -1.6743927001953125, -1.6116943359375, -1.5489959716796875, -1.486297607421875, -1.4235992431640625, -1.36090087890625, -1.2982025146484375, -1.235504150390625, -1.1728057861328125, -1.110107421875, -1.0474090576171875, -0.984710693359375, -0.9220123291015625, -0.85931396484375, -0.7966156005859375, -0.733917236328125, -0.6712188720703125, -0.6085205078125, -0.5458221435546875, -0.483123779296875, -0.4204254150390625, -0.35772705078125, -0.2950286865234375, -0.232330322265625, -0.1696319580078125, -0.10693359375, -0.0442352294921875, 0.018463134765625, 0.0811614990234375, 0.14385986328125, 0.2065582275390625, 0.269256591796875, 0.3319549560546875, 0.3946533203125, 0.4573516845703125, 0.520050048828125, 0.5827484130859375, 0.64544677734375, 0.7081451416015625, 0.770843505859375, 0.8335418701171875, 0.896240234375, 0.9589385986328125, 1.021636962890625, 1.0843353271484375, 1.14703369140625, 1.2097320556640625, 1.272430419921875, 1.3351287841796875, 1.3978271484375, 1.4605255126953125, 1.523223876953125, 1.5859222412109375, 1.64862060546875, 1.7113189697265625, 1.774017333984375, 1.8367156982421875, 1.8994140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 20.0, 24.0, 42.0, 47.0, 63.0, 121.0, 145.0, 238.0, 337.0, 516.0, 768.0, 1332.0, 2067.0, 3346.0, 5718.0, 10038.0, 17773.0, 31894.0, 56072.0, 93595.0, 140919.0, 176733.0, 171636.0, 132193.0, 85378.0, 50266.0, 28599.0, 16047.0, 9050.0, 5158.0, 3048.0, 1917.0, 1223.0, 755.0, 493.0, 315.0, 208.0, 148.0, 87.0, 69.0, 38.0, 32.0, 28.0, 17.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.720703125, -2.629730224609375, -2.53875732421875, -2.447784423828125, -2.3568115234375, -2.265838623046875, -2.17486572265625, -2.083892822265625, -1.992919921875, -1.901947021484375, -1.81097412109375, -1.720001220703125, -1.6290283203125, -1.538055419921875, -1.44708251953125, -1.356109619140625, -1.26513671875, -1.174163818359375, -1.08319091796875, -0.992218017578125, -0.9012451171875, -0.810272216796875, -0.71929931640625, -0.628326416015625, -0.537353515625, -0.446380615234375, -0.35540771484375, -0.264434814453125, -0.1734619140625, -0.082489013671875, 0.00848388671875, 0.099456787109375, 0.1904296875, 0.281402587890625, 0.37237548828125, 0.463348388671875, 0.5543212890625, 0.645294189453125, 0.73626708984375, 0.827239990234375, 0.918212890625, 1.009185791015625, 1.10015869140625, 1.191131591796875, 1.2821044921875, 1.373077392578125, 1.46405029296875, 1.555023193359375, 1.64599609375, 1.736968994140625, 1.82794189453125, 1.918914794921875, 2.0098876953125, 2.100860595703125, 2.19183349609375, 2.282806396484375, 2.373779296875, 2.464752197265625, 2.55572509765625, 2.646697998046875, 2.7376708984375, 2.828643798828125, 2.91961669921875, 3.010589599609375, 3.1015625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 10.0, 12.0, 12.0, 16.0, 23.0, 17.0, 18.0, 36.0, 24.0, 29.0, 41.0, 38.0, 37.0, 44.0, 36.0, 47.0, 44.0, 44.0, 43.0, 49.0, 37.0, 34.0, 42.0, 39.0, 24.0, 29.0, 22.0, 20.0, 19.0, 27.0, 16.0, 10.0, 8.0, 13.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2480316162109375, -1.202117919921875, -1.1562042236328125, -1.11029052734375, -1.0643768310546875, -1.018463134765625, -0.9725494384765625, -0.9266357421875, -0.8807220458984375, -0.834808349609375, -0.7888946533203125, -0.74298095703125, -0.6970672607421875, -0.651153564453125, -0.6052398681640625, -0.559326171875, -0.5134124755859375, -0.467498779296875, -0.4215850830078125, -0.37567138671875, -0.3297576904296875, -0.283843994140625, -0.2379302978515625, -0.1920166015625, -0.1461029052734375, -0.100189208984375, -0.0542755126953125, -0.00836181640625, 0.0375518798828125, 0.083465576171875, 0.1293792724609375, 0.17529296875, 0.2212066650390625, 0.267120361328125, 0.3130340576171875, 0.35894775390625, 0.4048614501953125, 0.450775146484375, 0.4966888427734375, 0.5426025390625, 0.5885162353515625, 0.634429931640625, 0.6803436279296875, 0.72625732421875, 0.7721710205078125, 0.818084716796875, 0.8639984130859375, 0.909912109375, 0.9558258056640625, 1.001739501953125, 1.0476531982421875, 1.09356689453125, 1.1394805908203125, 1.185394287109375, 1.2313079833984375, 1.2772216796875, 1.3231353759765625, 1.369049072265625, 1.4149627685546875, 1.46087646484375, 1.5067901611328125, 1.552703857421875, 1.5986175537109375, 1.64453125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 6.0, 9.0, 22.0, 27.0, 41.0, 44.0, 86.0, 83.0, 160.0, 244.0, 282.0, 526.0, 796.0, 1060.0, 1803.0, 2731.0, 4513.0, 7348.0, 13007.0, 23521.0, 43775.0, 83187.0, 147416.0, 209129.0, 201800.0, 137558.0, 76417.0, 40513.0, 21775.0, 11933.0, 7084.0, 4149.0, 2584.0, 1680.0, 1117.0, 675.0, 476.0, 313.0, 198.0, 143.0, 107.0, 65.0, 45.0, 31.0, 27.0, 13.0, 17.0, 10.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7138671875, -1.6584625244140625, -1.603057861328125, -1.5476531982421875, -1.49224853515625, -1.4368438720703125, -1.381439208984375, -1.3260345458984375, -1.2706298828125, -1.2152252197265625, -1.159820556640625, -1.1044158935546875, -1.04901123046875, -0.9936065673828125, -0.938201904296875, -0.8827972412109375, -0.827392578125, -0.7719879150390625, -0.716583251953125, -0.6611785888671875, -0.60577392578125, -0.5503692626953125, -0.494964599609375, -0.4395599365234375, -0.3841552734375, -0.3287506103515625, -0.273345947265625, -0.2179412841796875, -0.16253662109375, -0.1071319580078125, -0.051727294921875, 0.0036773681640625, 0.05908203125, 0.1144866943359375, 0.169891357421875, 0.2252960205078125, 0.28070068359375, 0.3361053466796875, 0.391510009765625, 0.4469146728515625, 0.5023193359375, 0.5577239990234375, 0.613128662109375, 0.6685333251953125, 0.72393798828125, 0.7793426513671875, 0.834747314453125, 0.8901519775390625, 0.945556640625, 1.0009613037109375, 1.056365966796875, 1.1117706298828125, 1.16717529296875, 1.2225799560546875, 1.277984619140625, 1.3333892822265625, 1.3887939453125, 1.4441986083984375, 1.499603271484375, 1.5550079345703125, 1.61041259765625, 1.6658172607421875, 1.721221923828125, 1.7766265869140625, 1.83203125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 14.0, 17.0, 14.0, 19.0, 29.0, 31.0, 39.0, 40.0, 45.0, 50.0, 65.0, 61.0, 65.0, 68.0, 75.0, 65.0, 52.0, 37.0, 36.0, 33.0, 26.0, 26.0, 13.0, 15.0, 12.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00015115737915039062, -0.00014640763401985168, -0.00014165788888931274, -0.0001369081437587738, -0.00013215839862823486, -0.00012740865349769592, -0.00012265890836715698, -0.00011790916323661804, -0.0001131594181060791, -0.00010840967297554016, -0.00010365992784500122, -9.891018271446228e-05, -9.416043758392334e-05, -8.94106924533844e-05, -8.466094732284546e-05, -7.991120219230652e-05, -7.516145706176758e-05, -7.041171193122864e-05, -6.56619668006897e-05, -6.091222167015076e-05, -5.6162476539611816e-05, -5.1412731409072876e-05, -4.6662986278533936e-05, -4.1913241147994995e-05, -3.7163496017456055e-05, -3.2413750886917114e-05, -2.7664005756378174e-05, -2.2914260625839233e-05, -1.8164515495300293e-05, -1.3414770364761353e-05, -8.665025234222412e-06, -3.915280103683472e-06, 8.344650268554688e-07, 5.584210157394409e-06, 1.033395528793335e-05, 1.508370041847229e-05, 1.983344554901123e-05, 2.458319067955017e-05, 2.933293581008911e-05, 3.408268094062805e-05, 3.883242607116699e-05, 4.358217120170593e-05, 4.833191633224487e-05, 5.3081661462783813e-05, 5.7831406593322754e-05, 6.25811517238617e-05, 6.733089685440063e-05, 7.208064198493958e-05, 7.683038711547852e-05, 8.158013224601746e-05, 8.63298773765564e-05, 9.107962250709534e-05, 9.582936763763428e-05, 0.00010057911276817322, 0.00010532885789871216, 0.0001100786030292511, 0.00011482834815979004, 0.00011957809329032898, 0.00012432783842086792, 0.00012907758355140686, 0.0001338273286819458, 0.00013857707381248474, 0.00014332681894302368, 0.00014807656407356262, 0.00015282630920410156]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 10.0, 12.0, 21.0, 28.0, 64.0, 82.0, 120.0, 198.0, 337.0, 601.0, 1008.0, 1778.0, 3100.0, 5987.0, 11620.0, 22885.0, 46501.0, 92868.0, 166782.0, 229264.0, 205666.0, 127413.0, 65616.0, 32195.0, 16370.0, 8059.0, 4397.0, 2406.0, 1306.0, 771.0, 405.0, 256.0, 127.0, 92.0, 74.0, 51.0, 21.0, 25.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7138671875, -1.6581268310546875, -1.602386474609375, -1.5466461181640625, -1.49090576171875, -1.4351654052734375, -1.379425048828125, -1.3236846923828125, -1.2679443359375, -1.2122039794921875, -1.156463623046875, -1.1007232666015625, -1.04498291015625, -0.9892425537109375, -0.933502197265625, -0.8777618408203125, -0.822021484375, -0.7662811279296875, -0.710540771484375, -0.6548004150390625, -0.59906005859375, -0.5433197021484375, -0.487579345703125, -0.4318389892578125, -0.3760986328125, -0.3203582763671875, -0.264617919921875, -0.2088775634765625, -0.15313720703125, -0.0973968505859375, -0.041656494140625, 0.0140838623046875, 0.06982421875, 0.1255645751953125, 0.181304931640625, 0.2370452880859375, 0.29278564453125, 0.3485260009765625, 0.404266357421875, 0.4600067138671875, 0.5157470703125, 0.5714874267578125, 0.627227783203125, 0.6829681396484375, 0.73870849609375, 0.7944488525390625, 0.850189208984375, 0.9059295654296875, 0.961669921875, 1.0174102783203125, 1.073150634765625, 1.1288909912109375, 1.18463134765625, 1.2403717041015625, 1.296112060546875, 1.3518524169921875, 1.4075927734375, 1.4633331298828125, 1.519073486328125, 1.5748138427734375, 1.63055419921875, 1.6862945556640625, 1.742034912109375, 1.7977752685546875, 1.853515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 9.0, 10.0, 11.0, 11.0, 13.0, 12.0, 22.0, 21.0, 30.0, 39.0, 47.0, 49.0, 56.0, 80.0, 69.0, 56.0, 70.0, 54.0, 64.0, 43.0, 39.0, 36.0, 37.0, 36.0, 17.0, 13.0, 8.0, 16.0, 9.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33078765869140625, -0.3185577392578125, -0.30632781982421875, -0.294097900390625, -0.28186798095703125, -0.2696380615234375, -0.25740814208984375, -0.24517822265625, -0.23294830322265625, -0.2207183837890625, -0.20848846435546875, -0.196258544921875, -0.18402862548828125, -0.1717987060546875, -0.15956878662109375, -0.1473388671875, -0.13510894775390625, -0.1228790283203125, -0.11064910888671875, -0.098419189453125, -0.08618927001953125, -0.0739593505859375, -0.06172943115234375, -0.04949951171875, -0.03726959228515625, -0.0250396728515625, -0.01280975341796875, -0.000579833984375, 0.01165008544921875, 0.0238800048828125, 0.03610992431640625, 0.04833984375, 0.06056976318359375, 0.0727996826171875, 0.08502960205078125, 0.097259521484375, 0.10948944091796875, 0.1217193603515625, 0.13394927978515625, 0.14617919921875, 0.15840911865234375, 0.1706390380859375, 0.18286895751953125, 0.195098876953125, 0.20732879638671875, 0.2195587158203125, 0.23178863525390625, 0.2440185546875, 0.25624847412109375, 0.2684783935546875, 0.28070831298828125, 0.292938232421875, 0.30516815185546875, 0.3173980712890625, 0.32962799072265625, 0.34185791015625, 0.35408782958984375, 0.3663177490234375, 0.37854766845703125, 0.390777587890625, 0.40300750732421875, 0.4152374267578125, 0.42746734619140625, 0.439697265625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 3.0, 10.0, 13.0, 22.0, 20.0, 39.0, 43.0, 57.0, 61.0, 78.0, 93.0, 95.0, 73.0, 93.0, 58.0, 51.0, 45.0, 34.0, 28.0, 17.0, 13.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668394565582275, -6.490774154663086, -6.313153266906738, -6.135532855987549, -5.957912445068359, -5.78029203414917, -5.6026716232299805, -5.425050735473633, -5.247430324554443, -5.069809913635254, -4.892189025878906, -4.714568614959717, -4.536948204040527, -4.359327793121338, -4.181707382202148, -4.004086494445801, -3.8264660835266113, -3.648845672607422, -3.4712250232696533, -3.2936043739318848, -3.1159839630126953, -2.938363552093506, -2.7607429027557373, -2.5831222534179688, -2.4055018424987793, -2.22788143157959, -2.0502607822418213, -1.8726402521133423, -1.6950197219848633, -1.5173991918563843, -1.3397786617279053, -1.1621581315994263, -0.9845380783081055, -0.8069175481796265, -0.6292970180511475, -0.45167648792266846, -0.27405595779418945, -0.09643542766571045, 0.08118510246276855, 0.25880563259124756, 0.43642616271972656, 0.6140466928482056, 0.7916672229766846, 0.9692877531051636, 1.1469082832336426, 1.3245288133621216, 1.5021493434906006, 1.6797698736190796, 1.8573904037475586, 2.035010814666748, 2.2126314640045166, 2.390252113342285, 2.5678725242614746, 2.745492935180664, 2.9231135845184326, 3.100734233856201, 3.2783546447753906, 3.45597505569458, 3.6335957050323486, 3.811216354370117, 3.9888367652893066, 4.166457176208496, 4.344078063964844, 4.521698474884033, 4.699318885803223]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 1.0, 3.0, 6.0, 7.0, 12.0, 8.0, 13.0, 14.0, 27.0, 21.0, 14.0, 21.0, 27.0, 34.0, 19.0, 35.0, 35.0, 34.0, 35.0, 45.0, 52.0, 42.0, 44.0, 44.0, 47.0, 31.0, 32.0, 34.0, 41.0, 29.0, 21.0, 21.0, 26.0, 20.0, 13.0, 23.0, 17.0, 4.0, 13.0, 12.0, 4.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9693043231964111, -1.907718539237976, -1.8461326360702515, -1.7845468521118164, -1.7229610681533813, -1.6613751649856567, -1.5997893810272217, -1.538203477859497, -1.476617693901062, -1.415031909942627, -1.3534460067749023, -1.2918602228164673, -1.2302744388580322, -1.1686885356903076, -1.1071027517318726, -1.0455169677734375, -0.9839311242103577, -0.9223452806472778, -0.8607594966888428, -0.7991736531257629, -0.7375878095626831, -0.676002025604248, -0.6144161820411682, -0.5528303384780884, -0.49124452471733093, -0.4296587109565735, -0.36807286739349365, -0.3064870536327362, -0.24490122497081757, -0.18331539630889893, -0.12172958254814148, -0.060143738985061646, 0.0014420747756958008, 0.06302790343761444, 0.12461372464895248, 0.18619954586029053, 0.24778537452220917, 0.3093712031841278, 0.37095701694488525, 0.4325428605079651, 0.49412867426872253, 0.55571448802948, 0.6173003315925598, 0.6788861751556396, 0.7404719591140747, 0.8020578026771545, 0.8636436462402344, 0.9252294301986694, 0.9868152737617493, 1.048401117324829, 1.1099869012832642, 1.1715726852416992, 1.2331585884094238, 1.2947443723678589, 1.356330156326294, 1.4179160594940186, 1.4795018434524536, 1.5410876274108887, 1.6026735305786133, 1.6642593145370483, 1.7258450984954834, 1.787431001663208, 1.849016785621643, 1.9106025695800781, 1.9721884727478027]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 17.0, 15.0, 30.0, 53.0, 72.0, 115.0, 159.0, 260.0, 440.0, 654.0, 1032.0, 1716.0, 3034.0, 5258.0, 9629.0, 18512.0, 37235.0, 80871.0, 193478.0, 512983.0, 1207863.0, 1228824.0, 534557.0, 197648.0, 81611.0, 37276.0, 18129.0, 9622.0, 5355.0, 3054.0, 1833.0, 1113.0, 654.0, 428.0, 257.0, 184.0, 96.0, 75.0, 53.0, 28.0, 22.0, 14.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.46453857421875, -4.3157958984375, -4.16705322265625, -4.018310546875, -3.86956787109375, -3.7208251953125, -3.57208251953125, -3.42333984375, -3.27459716796875, -3.1258544921875, -2.97711181640625, -2.828369140625, -2.67962646484375, -2.5308837890625, -2.38214111328125, -2.2333984375, -2.08465576171875, -1.9359130859375, -1.78717041015625, -1.638427734375, -1.48968505859375, -1.3409423828125, -1.19219970703125, -1.04345703125, -0.89471435546875, -0.7459716796875, -0.59722900390625, -0.448486328125, -0.29974365234375, -0.1510009765625, -0.00225830078125, 0.146484375, 0.29522705078125, 0.4439697265625, 0.59271240234375, 0.741455078125, 0.89019775390625, 1.0389404296875, 1.18768310546875, 1.33642578125, 1.48516845703125, 1.6339111328125, 1.78265380859375, 1.931396484375, 2.08013916015625, 2.2288818359375, 2.37762451171875, 2.5263671875, 2.67510986328125, 2.8238525390625, 2.97259521484375, 3.121337890625, 3.27008056640625, 3.4188232421875, 3.56756591796875, 3.71630859375, 3.86505126953125, 4.0137939453125, 4.16253662109375, 4.311279296875, 4.46002197265625, 4.6087646484375, 4.75750732421875, 4.90625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 4.0, 1.0, 5.0, 5.0, 11.0, 15.0, 11.0, 17.0, 10.0, 19.0, 19.0, 25.0, 20.0, 28.0, 29.0, 36.0, 32.0, 30.0, 27.0, 36.0, 40.0, 49.0, 30.0, 46.0, 39.0, 27.0, 41.0, 34.0, 37.0, 30.0, 29.0, 28.0, 21.0, 22.0, 18.0, 12.0, 21.0, 18.0, 10.0, 10.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.521484375, -1.4746856689453125, -1.427886962890625, -1.3810882568359375, -1.33428955078125, -1.2874908447265625, -1.240692138671875, -1.1938934326171875, -1.1470947265625, -1.1002960205078125, -1.053497314453125, -1.0066986083984375, -0.95989990234375, -0.9131011962890625, -0.866302490234375, -0.8195037841796875, -0.772705078125, -0.7259063720703125, -0.679107666015625, -0.6323089599609375, -0.58551025390625, -0.5387115478515625, -0.491912841796875, -0.4451141357421875, -0.3983154296875, -0.3515167236328125, -0.304718017578125, -0.2579193115234375, -0.21112060546875, -0.1643218994140625, -0.117523193359375, -0.0707244873046875, -0.02392578125, 0.0228729248046875, 0.069671630859375, 0.1164703369140625, 0.16326904296875, 0.2100677490234375, 0.256866455078125, 0.3036651611328125, 0.3504638671875, 0.3972625732421875, 0.444061279296875, 0.4908599853515625, 0.53765869140625, 0.5844573974609375, 0.631256103515625, 0.6780548095703125, 0.724853515625, 0.7716522216796875, 0.818450927734375, 0.8652496337890625, 0.91204833984375, 0.9588470458984375, 1.005645751953125, 1.0524444580078125, 1.0992431640625, 1.1460418701171875, 1.192840576171875, 1.2396392822265625, 1.28643798828125, 1.3332366943359375, 1.380035400390625, 1.4268341064453125, 1.4736328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 18.0, 21.0, 34.0, 49.0, 85.0, 107.0, 132.0, 230.0, 328.0, 517.0, 746.0, 1216.0, 1900.0, 2960.0, 4741.0, 7636.0, 12945.0, 22377.0, 40009.0, 73152.0, 138658.0, 272854.0, 535096.0, 921368.0, 958471.0, 576936.0, 293593.0, 148977.0, 78048.0, 41927.0, 23661.0, 13667.0, 8188.0, 5038.0, 3014.0, 1946.0, 1255.0, 774.0, 538.0, 350.0, 230.0, 165.0, 98.0, 65.0, 49.0, 41.0, 14.0, 13.0, 14.0, 10.0, 4.0, 1.0, 5.0, 4.0, 1.0], "bins": [-4.10546875, -3.98126220703125, -3.8570556640625, -3.73284912109375, -3.608642578125, -3.48443603515625, -3.3602294921875, -3.23602294921875, -3.11181640625, -2.98760986328125, -2.8634033203125, -2.73919677734375, -2.614990234375, -2.49078369140625, -2.3665771484375, -2.24237060546875, -2.1181640625, -1.99395751953125, -1.8697509765625, -1.74554443359375, -1.621337890625, -1.49713134765625, -1.3729248046875, -1.24871826171875, -1.12451171875, -1.00030517578125, -0.8760986328125, -0.75189208984375, -0.627685546875, -0.50347900390625, -0.3792724609375, -0.25506591796875, -0.130859375, -0.00665283203125, 0.1175537109375, 0.24176025390625, 0.365966796875, 0.49017333984375, 0.6143798828125, 0.73858642578125, 0.86279296875, 0.98699951171875, 1.1112060546875, 1.23541259765625, 1.359619140625, 1.48382568359375, 1.6080322265625, 1.73223876953125, 1.8564453125, 1.98065185546875, 2.1048583984375, 2.22906494140625, 2.353271484375, 2.47747802734375, 2.6016845703125, 2.72589111328125, 2.85009765625, 2.97430419921875, 3.0985107421875, 3.22271728515625, 3.346923828125, 3.47113037109375, 3.5953369140625, 3.71954345703125, 3.84375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 9.0, 8.0, 6.0, 17.0, 32.0, 40.0, 34.0, 48.0, 57.0, 95.0, 94.0, 105.0, 141.0, 176.0, 209.0, 265.0, 260.0, 293.0, 294.0, 265.0, 263.0, 272.0, 205.0, 180.0, 148.0, 118.0, 98.0, 79.0, 61.0, 50.0, 43.0, 28.0, 16.0, 13.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.07647705078125, -1.0396728515625, -1.00286865234375, -0.966064453125, -0.92926025390625, -0.8924560546875, -0.85565185546875, -0.81884765625, -0.78204345703125, -0.7452392578125, -0.70843505859375, -0.671630859375, -0.63482666015625, -0.5980224609375, -0.56121826171875, -0.5244140625, -0.48760986328125, -0.4508056640625, -0.41400146484375, -0.377197265625, -0.34039306640625, -0.3035888671875, -0.26678466796875, -0.22998046875, -0.19317626953125, -0.1563720703125, -0.11956787109375, -0.082763671875, -0.04595947265625, -0.0091552734375, 0.02764892578125, 0.064453125, 0.10125732421875, 0.1380615234375, 0.17486572265625, 0.211669921875, 0.24847412109375, 0.2852783203125, 0.32208251953125, 0.35888671875, 0.39569091796875, 0.4324951171875, 0.46929931640625, 0.506103515625, 0.54290771484375, 0.5797119140625, 0.61651611328125, 0.6533203125, 0.69012451171875, 0.7269287109375, 0.76373291015625, 0.800537109375, 0.83734130859375, 0.8741455078125, 0.91094970703125, 0.94775390625, 0.98455810546875, 1.0213623046875, 1.05816650390625, 1.094970703125, 1.13177490234375, 1.1685791015625, 1.20538330078125, 1.2421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 9.0, 14.0, 16.0, 14.0, 26.0, 41.0, 51.0, 63.0, 74.0, 95.0, 79.0, 92.0, 91.0, 64.0, 57.0, 60.0, 32.0, 27.0, 24.0, 20.0, 7.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.784271717071533, -7.594692707061768, -7.405113697052002, -7.2155351638793945, -7.025956153869629, -6.836377143859863, -6.646798133850098, -6.457219123840332, -6.267640113830566, -6.078061103820801, -5.888482093811035, -5.6989030838012695, -5.509324550628662, -5.3197455406188965, -5.130166530609131, -4.940587520599365, -4.751008987426758, -4.561429977416992, -4.371850967407227, -4.182271957397461, -3.9926934242248535, -3.803114414215088, -3.6135354042053223, -3.4239563941955566, -3.23437762260437, -3.0447986125946045, -2.855219841003418, -2.6656408309936523, -2.4760618209838867, -2.2864830493927, -2.0969040393829346, -1.9073251485824585, -1.7177457809448242, -1.5281668901443481, -1.338587999343872, -1.1490089893341064, -0.9594300985336304, -0.7698512077331543, -0.5802721977233887, -0.3906933069229126, -0.20111441612243652, -0.011535495519638062, 0.1780434250831604, 0.36762237548828125, 0.5572012662887573, 0.7467801570892334, 0.936359167098999, 1.125938057899475, 1.3155169486999512, 1.5050958395004272, 1.6946747303009033, 1.884253740310669, 2.0738325119018555, 2.263411521911621, 2.4529905319213867, 2.6425695419311523, 2.832148313522339, 3.0217273235321045, 3.211306095123291, 3.4008851051330566, 3.5904641151428223, 3.780042886734009, 3.9696218967437744, 4.159200668334961, 4.348779678344727]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 7.0, 16.0, 10.0, 16.0, 22.0, 25.0, 14.0, 29.0, 20.0, 30.0, 30.0, 30.0, 42.0, 45.0, 33.0, 43.0, 42.0, 48.0, 38.0, 34.0, 36.0, 39.0, 46.0, 38.0, 34.0, 32.0, 27.0, 20.0, 22.0, 18.0, 19.0, 14.0, 11.0, 9.0, 14.0, 10.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.2169461250305176, -2.1566765308380127, -2.096407175064087, -2.036137580871582, -1.9758681058883667, -1.9155986309051514, -1.855329155921936, -1.7950596809387207, -1.7347902059555054, -1.67452073097229, -1.6142512559890747, -1.5539817810058594, -1.4937121868133545, -1.4334427118301392, -1.3731732368469238, -1.3129037618637085, -1.2526342868804932, -1.1923648118972778, -1.1320953369140625, -1.0718257427215576, -1.0115562677383423, -0.951286792755127, -0.8910173177719116, -0.8307478427886963, -0.7704782485961914, -0.7102087736129761, -0.649939239025116, -0.5896697640419006, -0.5294002890586853, -0.4691307842731476, -0.40886127948760986, -0.34859180450439453, -0.2883223295211792, -0.22805283963680267, -0.16778334975242615, -0.10751384496688843, -0.0472443550825119, 0.013025134801864624, 0.07329463958740234, 0.13356411457061768, 0.1938336193561554, 0.2541031241416931, 0.31437259912490845, 0.37464210391044617, 0.4349116086959839, 0.4951810836791992, 0.5554505586624146, 0.6157200336456299, 0.67598956823349, 0.7362590432167053, 0.7965285778045654, 0.8567980527877808, 0.9170675277709961, 0.9773370027542114, 1.0376064777374268, 1.0978760719299316, 1.158145546913147, 1.2184150218963623, 1.2786844968795776, 1.338953971862793, 1.3992235660552979, 1.4594930410385132, 1.5197625160217285, 1.5800319910049438, 1.6403014659881592]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 2.0, 8.0, 16.0, 17.0, 23.0, 39.0, 50.0, 84.0, 135.0, 251.0, 375.0, 565.0, 1053.0, 1793.0, 3324.0, 6319.0, 11909.0, 23719.0, 48421.0, 98618.0, 185751.0, 251671.0, 197455.0, 109129.0, 53839.0, 25988.0, 12835.0, 6635.0, 3733.0, 2003.0, 1131.0, 661.0, 360.0, 212.0, 154.0, 97.0, 54.0, 37.0, 27.0, 14.0, 17.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.32747650146484375, -0.3155975341796875, -0.30371856689453125, -0.291839599609375, -0.27996063232421875, -0.2680816650390625, -0.25620269775390625, -0.24432373046875, -0.23244476318359375, -0.2205657958984375, -0.20868682861328125, -0.196807861328125, -0.18492889404296875, -0.1730499267578125, -0.16117095947265625, -0.1492919921875, -0.13741302490234375, -0.1255340576171875, -0.11365509033203125, -0.101776123046875, -0.08989715576171875, -0.0780181884765625, -0.06613922119140625, -0.05426025390625, -0.04238128662109375, -0.0305023193359375, -0.01862335205078125, -0.006744384765625, 0.00513458251953125, 0.0170135498046875, 0.02889251708984375, 0.040771484375, 0.05265045166015625, 0.0645294189453125, 0.07640838623046875, 0.088287353515625, 0.10016632080078125, 0.1120452880859375, 0.12392425537109375, 0.13580322265625, 0.14768218994140625, 0.1595611572265625, 0.17144012451171875, 0.183319091796875, 0.19519805908203125, 0.2070770263671875, 0.21895599365234375, 0.2308349609375, 0.24271392822265625, 0.2545928955078125, 0.26647186279296875, 0.278350830078125, 0.29022979736328125, 0.3021087646484375, 0.31398773193359375, 0.32586669921875, 0.33774566650390625, 0.3496246337890625, 0.36150360107421875, 0.373382568359375, 0.38526153564453125, 0.3971405029296875, 0.40901947021484375, 0.4208984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 2.0, 7.0, 11.0, 7.0, 12.0, 14.0, 20.0, 20.0, 23.0, 23.0, 27.0, 33.0, 24.0, 48.0, 37.0, 36.0, 35.0, 35.0, 33.0, 45.0, 33.0, 51.0, 41.0, 41.0, 42.0, 39.0, 23.0, 35.0, 29.0, 19.0, 25.0, 22.0, 15.0, 18.0, 16.0, 13.0, 10.0, 4.0, 8.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.147979736328125, -2.07916259765625, -2.010345458984375, -1.9415283203125, -1.872711181640625, -1.80389404296875, -1.735076904296875, -1.666259765625, -1.597442626953125, -1.52862548828125, -1.459808349609375, -1.3909912109375, -1.322174072265625, -1.25335693359375, -1.184539794921875, -1.11572265625, -1.046905517578125, -0.97808837890625, -0.909271240234375, -0.8404541015625, -0.771636962890625, -0.70281982421875, -0.634002685546875, -0.565185546875, -0.496368408203125, -0.42755126953125, -0.358734130859375, -0.2899169921875, -0.221099853515625, -0.15228271484375, -0.083465576171875, -0.0146484375, 0.054168701171875, 0.12298583984375, 0.191802978515625, 0.2606201171875, 0.329437255859375, 0.39825439453125, 0.467071533203125, 0.535888671875, 0.604705810546875, 0.67352294921875, 0.742340087890625, 0.8111572265625, 0.879974365234375, 0.94879150390625, 1.017608642578125, 1.08642578125, 1.155242919921875, 1.22406005859375, 1.292877197265625, 1.3616943359375, 1.430511474609375, 1.49932861328125, 1.568145751953125, 1.636962890625, 1.705780029296875, 1.77459716796875, 1.843414306640625, 1.9122314453125, 1.981048583984375, 2.04986572265625, 2.118682861328125, 2.1875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 8.0, 3.0, 7.0, 8.0, 14.0, 15.0, 22.0, 30.0, 44.0, 66.0, 98.0, 129.0, 183.0, 286.0, 450.0, 693.0, 1152.0, 2002.0, 3984.0, 8534.0, 20126.0, 79197.0, 858546.0, 43362.0, 15206.0, 6627.0, 3194.0, 1758.0, 1019.0, 582.0, 398.0, 280.0, 143.0, 99.0, 73.0, 54.0, 42.0, 29.0, 18.0, 16.0, 15.0, 12.0, 9.0, 5.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.080078125, -1.04669189453125, -1.0133056640625, -0.97991943359375, -0.946533203125, -0.91314697265625, -0.8797607421875, -0.84637451171875, -0.81298828125, -0.77960205078125, -0.7462158203125, -0.71282958984375, -0.679443359375, -0.64605712890625, -0.6126708984375, -0.57928466796875, -0.5458984375, -0.51251220703125, -0.4791259765625, -0.44573974609375, -0.412353515625, -0.37896728515625, -0.3455810546875, -0.31219482421875, -0.27880859375, -0.24542236328125, -0.2120361328125, -0.17864990234375, -0.145263671875, -0.11187744140625, -0.0784912109375, -0.04510498046875, -0.01171875, 0.02166748046875, 0.0550537109375, 0.08843994140625, 0.121826171875, 0.15521240234375, 0.1885986328125, 0.22198486328125, 0.25537109375, 0.28875732421875, 0.3221435546875, 0.35552978515625, 0.388916015625, 0.42230224609375, 0.4556884765625, 0.48907470703125, 0.5224609375, 0.55584716796875, 0.5892333984375, 0.62261962890625, 0.656005859375, 0.68939208984375, 0.7227783203125, 0.75616455078125, 0.78955078125, 0.82293701171875, 0.8563232421875, 0.88970947265625, 0.923095703125, 0.95648193359375, 0.9898681640625, 1.02325439453125, 1.056640625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 4.0, 5.0, 9.0, 11.0, 23.0, 27.0, 16.0, 21.0, 21.0, 34.0, 36.0, 32.0, 35.0, 38.0, 34.0, 43.0, 44.0, 43.0, 37.0, 40.0, 30.0, 37.0, 35.0, 39.0, 39.0, 31.0, 25.0, 28.0, 20.0, 12.0, 14.0, 23.0, 24.0, 13.0, 9.0, 10.0, 6.0, 10.0, 6.0, 9.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.36328125, -1.320404052734375, -1.27752685546875, -1.234649658203125, -1.1917724609375, -1.148895263671875, -1.10601806640625, -1.063140869140625, -1.020263671875, -0.977386474609375, -0.93450927734375, -0.891632080078125, -0.8487548828125, -0.805877685546875, -0.76300048828125, -0.720123291015625, -0.67724609375, -0.634368896484375, -0.59149169921875, -0.548614501953125, -0.5057373046875, -0.462860107421875, -0.41998291015625, -0.377105712890625, -0.334228515625, -0.291351318359375, -0.24847412109375, -0.205596923828125, -0.1627197265625, -0.119842529296875, -0.07696533203125, -0.034088134765625, 0.0087890625, 0.051666259765625, 0.09454345703125, 0.137420654296875, 0.1802978515625, 0.223175048828125, 0.26605224609375, 0.308929443359375, 0.351806640625, 0.394683837890625, 0.43756103515625, 0.480438232421875, 0.5233154296875, 0.566192626953125, 0.60906982421875, 0.651947021484375, 0.69482421875, 0.737701416015625, 0.78057861328125, 0.823455810546875, 0.8663330078125, 0.909210205078125, 0.95208740234375, 0.994964599609375, 1.037841796875, 1.080718994140625, 1.12359619140625, 1.166473388671875, 1.2093505859375, 1.252227783203125, 1.29510498046875, 1.337982177734375, 1.380859375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 13.0, 19.0, 18.0, 37.0, 49.0, 61.0, 116.0, 173.0, 274.0, 426.0, 801.0, 1574.0, 3218.0, 7855.0, 24748.0, 888202.0, 93343.0, 16556.0, 5688.0, 2476.0, 1178.0, 661.0, 373.0, 228.0, 138.0, 100.0, 61.0, 43.0, 33.0, 24.0, 10.0, 9.0, 16.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.36058807373046875, -0.3471527099609375, -0.33371734619140625, -0.320281982421875, -0.30684661865234375, -0.2934112548828125, -0.27997589111328125, -0.26654052734375, -0.25310516357421875, -0.2396697998046875, -0.22623443603515625, -0.212799072265625, -0.19936370849609375, -0.1859283447265625, -0.17249298095703125, -0.1590576171875, -0.14562225341796875, -0.1321868896484375, -0.11875152587890625, -0.105316162109375, -0.09188079833984375, -0.0784454345703125, -0.06501007080078125, -0.05157470703125, -0.03813934326171875, -0.0247039794921875, -0.01126861572265625, 0.002166748046875, 0.01560211181640625, 0.0290374755859375, 0.04247283935546875, 0.055908203125, 0.06934356689453125, 0.0827789306640625, 0.09621429443359375, 0.109649658203125, 0.12308502197265625, 0.1365203857421875, 0.14995574951171875, 0.16339111328125, 0.17682647705078125, 0.1902618408203125, 0.20369720458984375, 0.217132568359375, 0.23056793212890625, 0.2440032958984375, 0.25743865966796875, 0.2708740234375, 0.28430938720703125, 0.2977447509765625, 0.31118011474609375, 0.324615478515625, 0.33805084228515625, 0.3514862060546875, 0.36492156982421875, 0.37835693359375, 0.39179229736328125, 0.4052276611328125, 0.41866302490234375, 0.432098388671875, 0.44553375244140625, 0.4589691162109375, 0.47240447998046875, 0.48583984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 5.0, 5.0, 4.0, 14.0, 12.0, 20.0, 17.0, 10.0, 20.0, 33.0, 23.0, 33.0, 40.0, 47.0, 52.0, 45.0, 52.0, 42.0, 56.0, 41.0, 49.0, 32.0, 43.0, 34.0, 36.0, 22.0, 28.0, 30.0, 26.0, 18.0, 21.0, 13.0, 5.0, 11.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-3.552436828613281e-05, -3.449525684118271e-05, -3.3466145396232605e-05, -3.24370339512825e-05, -3.14079225063324e-05, -3.0378811061382294e-05, -2.934969961643219e-05, -2.8320588171482086e-05, -2.7291476726531982e-05, -2.626236528158188e-05, -2.5233253836631775e-05, -2.420414239168167e-05, -2.3175030946731567e-05, -2.2145919501781464e-05, -2.111680805683136e-05, -2.0087696611881256e-05, -1.9058585166931152e-05, -1.802947372198105e-05, -1.7000362277030945e-05, -1.597125083208084e-05, -1.4942139387130737e-05, -1.3913027942180634e-05, -1.288391649723053e-05, -1.1854805052280426e-05, -1.0825693607330322e-05, -9.796582162380219e-06, -8.767470717430115e-06, -7.738359272480011e-06, -6.709247827529907e-06, -5.6801363825798035e-06, -4.6510249376297e-06, -3.621913492679596e-06, -2.592802047729492e-06, -1.5636906027793884e-06, -5.345791578292847e-07, 4.945322871208191e-07, 1.5236437320709229e-06, 2.5527551770210266e-06, 3.5818666219711304e-06, 4.610978066921234e-06, 5.640089511871338e-06, 6.669200956821442e-06, 7.698312401771545e-06, 8.72742384672165e-06, 9.756535291671753e-06, 1.0785646736621857e-05, 1.181475818157196e-05, 1.2843869626522064e-05, 1.3872981071472168e-05, 1.4902092516422272e-05, 1.5931203961372375e-05, 1.696031540632248e-05, 1.7989426851272583e-05, 1.9018538296222687e-05, 2.004764974117279e-05, 2.1076761186122894e-05, 2.2105872631072998e-05, 2.3134984076023102e-05, 2.4164095520973206e-05, 2.519320696592331e-05, 2.6222318410873413e-05, 2.7251429855823517e-05, 2.828054130077362e-05, 2.9309652745723724e-05, 3.0338764190673828e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 9.0, 10.0, 19.0, 17.0, 34.0, 40.0, 53.0, 88.0, 149.0, 160.0, 290.0, 409.0, 618.0, 961.0, 1615.0, 2530.0, 4381.0, 7540.0, 13486.0, 24816.0, 47368.0, 90314.0, 165173.0, 237697.0, 200850.0, 116604.0, 61069.0, 31787.0, 17113.0, 9409.0, 5472.0, 3112.0, 1890.0, 1208.0, 767.0, 506.0, 322.0, 198.0, 132.0, 116.0, 67.0, 37.0, 34.0, 19.0, 18.0, 12.0, 4.0, 6.0, 5.0, 9.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.082763671875, -0.08006763458251953, -0.07737159729003906, -0.0746755599975586, -0.07197952270507812, -0.06928348541259766, -0.06658744812011719, -0.06389141082763672, -0.06119537353515625, -0.05849933624267578, -0.05580329895019531, -0.053107261657714844, -0.050411224365234375, -0.047715187072753906, -0.04501914978027344, -0.04232311248779297, -0.0396270751953125, -0.03693103790283203, -0.03423500061035156, -0.031538963317871094, -0.028842926025390625, -0.026146888732910156, -0.023450851440429688, -0.02075481414794922, -0.01805877685546875, -0.015362739562988281, -0.012666702270507812, -0.009970664978027344, -0.007274627685546875, -0.004578590393066406, -0.0018825531005859375, 0.0008134841918945312, 0.003509521484375, 0.006205558776855469, 0.008901596069335938, 0.011597633361816406, 0.014293670654296875, 0.016989707946777344, 0.019685745239257812, 0.02238178253173828, 0.02507781982421875, 0.02777385711669922, 0.030469894409179688, 0.033165931701660156, 0.035861968994140625, 0.038558006286621094, 0.04125404357910156, 0.04395008087158203, 0.0466461181640625, 0.04934215545654297, 0.05203819274902344, 0.054734230041503906, 0.057430267333984375, 0.060126304626464844, 0.06282234191894531, 0.06551837921142578, 0.06821441650390625, 0.07091045379638672, 0.07360649108886719, 0.07630252838134766, 0.07899856567382812, 0.0816946029663086, 0.08439064025878906, 0.08708667755126953, 0.08978271484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 8.0, 9.0, 10.0, 17.0, 30.0, 26.0, 33.0, 39.0, 56.0, 67.0, 69.0, 88.0, 79.0, 95.0, 79.0, 70.0, 49.0, 30.0, 35.0, 16.0, 33.0, 5.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0224761962890625, -0.021753787994384766, -0.02103137969970703, -0.020308971405029297, -0.019586563110351562, -0.018864154815673828, -0.018141746520996094, -0.01741933822631836, -0.016696929931640625, -0.01597452163696289, -0.015252113342285156, -0.014529705047607422, -0.013807296752929688, -0.013084888458251953, -0.012362480163574219, -0.011640071868896484, -0.01091766357421875, -0.010195255279541016, -0.009472846984863281, -0.008750438690185547, -0.008028030395507812, -0.007305622100830078, -0.006583213806152344, -0.005860805511474609, -0.005138397216796875, -0.004415988922119141, -0.0036935806274414062, -0.002971172332763672, -0.0022487640380859375, -0.0015263557434082031, -0.0008039474487304688, -8.153915405273438e-05, 0.000640869140625, 0.0013632774353027344, 0.0020856857299804688, 0.002808094024658203, 0.0035305023193359375, 0.004252910614013672, 0.004975318908691406, 0.005697727203369141, 0.006420135498046875, 0.007142543792724609, 0.007864952087402344, 0.008587360382080078, 0.009309768676757812, 0.010032176971435547, 0.010754585266113281, 0.011476993560791016, 0.01219940185546875, 0.012921810150146484, 0.013644218444824219, 0.014366626739501953, 0.015089035034179688, 0.015811443328857422, 0.016533851623535156, 0.01725625991821289, 0.017978668212890625, 0.01870107650756836, 0.019423484802246094, 0.020145893096923828, 0.020868301391601562, 0.021590709686279297, 0.02231311798095703, 0.023035526275634766, 0.0237579345703125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 10.0, 10.0, 16.0, 19.0, 20.0, 35.0, 50.0, 63.0, 71.0, 95.0, 79.0, 86.0, 92.0, 76.0, 53.0, 60.0, 44.0, 25.0, 23.0, 20.0, 12.0, 9.0, 6.0, 7.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.76797342300415, -7.5797271728515625, -7.391481399536133, -7.203235149383545, -7.014988899230957, -6.826742649078369, -6.638496398925781, -6.450250625610352, -6.262004375457764, -6.073758125305176, -5.885512351989746, -5.697266101837158, -5.50901985168457, -5.320773601531982, -5.1325273513793945, -4.944281578063965, -4.756035327911377, -4.567789077758789, -4.379543304443359, -4.1912970542907715, -4.003050804138184, -3.8148045539855957, -3.626558542251587, -3.438312530517578, -3.2500662803649902, -3.0618200302124023, -2.8735740184783936, -2.6853280067443848, -2.497081756591797, -2.308835506439209, -2.1205894947052, -1.9323433637619019, -1.7440977096557617, -1.5558515787124634, -1.367605447769165, -1.1793593168258667, -0.9911131858825684, -0.80286705493927, -0.6146209239959717, -0.42637479305267334, -0.238128662109375, -0.04988253116607666, 0.13836359977722168, 0.32660973072052, 0.5148558616638184, 0.7031019926071167, 0.891348123550415, 1.0795942544937134, 1.2678403854370117, 1.45608651638031, 1.6443326473236084, 1.8325787782669067, 2.020824909210205, 2.209071159362793, 2.3973171710968018, 2.5855631828308105, 2.7738094329833984, 2.9620556831359863, 3.150301694869995, 3.338547706604004, 3.526793956756592, 3.7150402069091797, 3.9032862186431885, 4.091532230377197, 4.279778480529785]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 8.0, 6.0, 14.0, 12.0, 14.0, 23.0, 23.0, 18.0, 24.0, 22.0, 29.0, 32.0, 28.0, 44.0, 41.0, 36.0, 37.0, 47.0, 43.0, 40.0, 34.0, 32.0, 46.0, 43.0, 36.0, 41.0, 30.0, 28.0, 21.0, 21.0, 21.0, 13.0, 18.0, 14.0, 8.0, 13.0, 10.0, 5.0, 4.0, 8.0, 2.0, 6.0, 3.0, 0.0, 3.0, 2.0], "bins": [-2.200934886932373, -2.141292095184326, -2.0816493034362793, -2.0220065116882324, -1.962363839149475, -1.9027210474014282, -1.8430782556533813, -1.7834354639053345, -1.7237927913665771, -1.6641499996185303, -1.6045072078704834, -1.5448644161224365, -1.4852217435836792, -1.4255789518356323, -1.3659361600875854, -1.3062933683395386, -1.2466505765914917, -1.1870077848434448, -1.127364993095398, -1.0677223205566406, -1.0080795288085938, -0.9484367370605469, -0.8887939453125, -0.8291511535644531, -0.769508421421051, -0.7098656296730042, -0.650222897529602, -0.5905801057815552, -0.5309373140335083, -0.4712945818901062, -0.4116517901420593, -0.35200902819633484, -0.2923663854598999, -0.23272362351417542, -0.17308084666728973, -0.11343806982040405, -0.053795307874679565, 0.005847454071044922, 0.0654902458190918, 0.12513300776481628, 0.18477576971054077, 0.24441853165626526, 0.30406129360198975, 0.3637040853500366, 0.4233468472957611, 0.4829896092414856, 0.5426324009895325, 0.6022751331329346, 0.6619179248809814, 0.7215607166290283, 0.7812034487724304, 0.8408462405204773, 0.9004889726638794, 0.9601317644119263, 1.0197745561599731, 1.07941734790802, 1.1390600204467773, 1.1987028121948242, 1.258345603942871, 1.317988395690918, 1.3776310682296753, 1.4372738599777222, 1.496916651725769, 1.556559443473816, 1.6162022352218628]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 18.0, 22.0, 26.0, 30.0, 56.0, 108.0, 183.0, 315.0, 472.0, 717.0, 1156.0, 1993.0, 3203.0, 5447.0, 8809.0, 14767.0, 24315.0, 39148.0, 61162.0, 90567.0, 122147.0, 143693.0, 145157.0, 123860.0, 92996.0, 63414.0, 40142.0, 25287.0, 15660.0, 9342.0, 5619.0, 3415.0, 2149.0, 1272.0, 708.0, 406.0, 270.0, 182.0, 121.0, 75.0, 39.0, 21.0, 22.0, 15.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.24609375, -2.175994873046875, -2.10589599609375, -2.035797119140625, -1.9656982421875, -1.895599365234375, -1.82550048828125, -1.755401611328125, -1.685302734375, -1.615203857421875, -1.54510498046875, -1.475006103515625, -1.4049072265625, -1.334808349609375, -1.26470947265625, -1.194610595703125, -1.12451171875, -1.054412841796875, -0.98431396484375, -0.914215087890625, -0.8441162109375, -0.774017333984375, -0.70391845703125, -0.633819580078125, -0.563720703125, -0.493621826171875, -0.42352294921875, -0.353424072265625, -0.2833251953125, -0.213226318359375, -0.14312744140625, -0.073028564453125, -0.0029296875, 0.067169189453125, 0.13726806640625, 0.207366943359375, 0.2774658203125, 0.347564697265625, 0.41766357421875, 0.487762451171875, 0.557861328125, 0.627960205078125, 0.69805908203125, 0.768157958984375, 0.8382568359375, 0.908355712890625, 0.97845458984375, 1.048553466796875, 1.11865234375, 1.188751220703125, 1.25885009765625, 1.328948974609375, 1.3990478515625, 1.469146728515625, 1.53924560546875, 1.609344482421875, 1.679443359375, 1.749542236328125, 1.81964111328125, 1.889739990234375, 1.9598388671875, 2.029937744140625, 2.10003662109375, 2.170135498046875, 2.240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 11.0, 8.0, 13.0, 12.0, 11.0, 9.0, 11.0, 24.0, 17.0, 25.0, 33.0, 30.0, 42.0, 24.0, 36.0, 29.0, 40.0, 32.0, 49.0, 45.0, 39.0, 46.0, 39.0, 49.0, 42.0, 32.0, 32.0, 26.0, 24.0, 32.0, 19.0, 18.0, 17.0, 14.0, 15.0, 9.0, 9.0, 7.0, 7.0, 2.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.341796875, -2.27349853515625, -2.2052001953125, -2.13690185546875, -2.068603515625, -2.00030517578125, -1.9320068359375, -1.86370849609375, -1.79541015625, -1.72711181640625, -1.6588134765625, -1.59051513671875, -1.522216796875, -1.45391845703125, -1.3856201171875, -1.31732177734375, -1.2490234375, -1.18072509765625, -1.1124267578125, -1.04412841796875, -0.975830078125, -0.90753173828125, -0.8392333984375, -0.77093505859375, -0.70263671875, -0.63433837890625, -0.5660400390625, -0.49774169921875, -0.429443359375, -0.36114501953125, -0.2928466796875, -0.22454833984375, -0.15625, -0.08795166015625, -0.0196533203125, 0.04864501953125, 0.116943359375, 0.18524169921875, 0.2535400390625, 0.32183837890625, 0.39013671875, 0.45843505859375, 0.5267333984375, 0.59503173828125, 0.663330078125, 0.73162841796875, 0.7999267578125, 0.86822509765625, 0.9365234375, 1.00482177734375, 1.0731201171875, 1.14141845703125, 1.209716796875, 1.27801513671875, 1.3463134765625, 1.41461181640625, 1.48291015625, 1.55120849609375, 1.6195068359375, 1.68780517578125, 1.756103515625, 1.82440185546875, 1.8927001953125, 1.96099853515625, 2.029296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 11.0, 24.0, 25.0, 37.0, 66.0, 108.0, 194.0, 271.0, 498.0, 773.0, 1300.0, 2156.0, 3589.0, 5979.0, 9990.0, 17235.0, 28268.0, 45354.0, 71001.0, 104484.0, 136716.0, 152765.0, 142265.0, 113275.0, 79743.0, 52043.0, 32112.0, 19446.0, 11701.0, 6750.0, 4192.0, 2370.0, 1476.0, 914.0, 555.0, 326.0, 198.0, 105.0, 78.0, 55.0, 37.0, 24.0, 15.0, 12.0, 4.0, 1.0, 4.0, 3.0], "bins": [-2.876953125, -2.800506591796875, -2.72406005859375, -2.647613525390625, -2.5711669921875, -2.494720458984375, -2.41827392578125, -2.341827392578125, -2.265380859375, -2.188934326171875, -2.11248779296875, -2.036041259765625, -1.9595947265625, -1.883148193359375, -1.80670166015625, -1.730255126953125, -1.65380859375, -1.577362060546875, -1.50091552734375, -1.424468994140625, -1.3480224609375, -1.271575927734375, -1.19512939453125, -1.118682861328125, -1.042236328125, -0.965789794921875, -0.88934326171875, -0.812896728515625, -0.7364501953125, -0.660003662109375, -0.58355712890625, -0.507110595703125, -0.4306640625, -0.354217529296875, -0.27777099609375, -0.201324462890625, -0.1248779296875, -0.048431396484375, 0.02801513671875, 0.104461669921875, 0.180908203125, 0.257354736328125, 0.33380126953125, 0.410247802734375, 0.4866943359375, 0.563140869140625, 0.63958740234375, 0.716033935546875, 0.79248046875, 0.868927001953125, 0.94537353515625, 1.021820068359375, 1.0982666015625, 1.174713134765625, 1.25115966796875, 1.327606201171875, 1.404052734375, 1.480499267578125, 1.55694580078125, 1.633392333984375, 1.7098388671875, 1.786285400390625, 1.86273193359375, 1.939178466796875, 2.015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 8.0, 13.0, 11.0, 17.0, 21.0, 15.0, 32.0, 27.0, 24.0, 29.0, 42.0, 36.0, 43.0, 36.0, 27.0, 43.0, 54.0, 48.0, 38.0, 52.0, 42.0, 39.0, 35.0, 26.0, 34.0, 25.0, 25.0, 31.0, 27.0, 20.0, 12.0, 10.0, 10.0, 3.0, 10.0, 6.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5126953125, -1.4666748046875, -1.420654296875, -1.3746337890625, -1.32861328125, -1.2825927734375, -1.236572265625, -1.1905517578125, -1.14453125, -1.0985107421875, -1.052490234375, -1.0064697265625, -0.96044921875, -0.9144287109375, -0.868408203125, -0.8223876953125, -0.7763671875, -0.7303466796875, -0.684326171875, -0.6383056640625, -0.59228515625, -0.5462646484375, -0.500244140625, -0.4542236328125, -0.408203125, -0.3621826171875, -0.316162109375, -0.2701416015625, -0.22412109375, -0.1781005859375, -0.132080078125, -0.0860595703125, -0.0400390625, 0.0059814453125, 0.052001953125, 0.0980224609375, 0.14404296875, 0.1900634765625, 0.236083984375, 0.2821044921875, 0.328125, 0.3741455078125, 0.420166015625, 0.4661865234375, 0.51220703125, 0.5582275390625, 0.604248046875, 0.6502685546875, 0.6962890625, 0.7423095703125, 0.788330078125, 0.8343505859375, 0.88037109375, 0.9263916015625, 0.972412109375, 1.0184326171875, 1.064453125, 1.1104736328125, 1.156494140625, 1.2025146484375, 1.24853515625, 1.2945556640625, 1.340576171875, 1.3865966796875, 1.4326171875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 18.0, 22.0, 19.0, 44.0, 56.0, 77.0, 137.0, 182.0, 253.0, 404.0, 559.0, 915.0, 1305.0, 2045.0, 3171.0, 5291.0, 8580.0, 14272.0, 24335.0, 42283.0, 71904.0, 116646.0, 163621.0, 181668.0, 153042.0, 103390.0, 62840.0, 37000.0, 21404.0, 12633.0, 7488.0, 4469.0, 2871.0, 1857.0, 1222.0, 862.0, 528.0, 381.0, 219.0, 188.0, 119.0, 65.0, 50.0, 37.0, 28.0, 12.0, 11.0, 7.0, 6.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4015045166015625, -1.353790283203125, -1.3060760498046875, -1.25836181640625, -1.2106475830078125, -1.162933349609375, -1.1152191162109375, -1.0675048828125, -1.0197906494140625, -0.972076416015625, -0.9243621826171875, -0.87664794921875, -0.8289337158203125, -0.781219482421875, -0.7335052490234375, -0.685791015625, -0.6380767822265625, -0.590362548828125, -0.5426483154296875, -0.49493408203125, -0.4472198486328125, -0.399505615234375, -0.3517913818359375, -0.3040771484375, -0.2563629150390625, -0.208648681640625, -0.1609344482421875, -0.11322021484375, -0.0655059814453125, -0.017791748046875, 0.0299224853515625, 0.07763671875, 0.1253509521484375, 0.173065185546875, 0.2207794189453125, 0.26849365234375, 0.3162078857421875, 0.363922119140625, 0.4116363525390625, 0.4593505859375, 0.5070648193359375, 0.554779052734375, 0.6024932861328125, 0.65020751953125, 0.6979217529296875, 0.745635986328125, 0.7933502197265625, 0.841064453125, 0.8887786865234375, 0.936492919921875, 0.9842071533203125, 1.03192138671875, 1.0796356201171875, 1.127349853515625, 1.1750640869140625, 1.2227783203125, 1.2704925537109375, 1.318206787109375, 1.3659210205078125, 1.41363525390625, 1.4613494873046875, 1.509063720703125, 1.5567779541015625, 1.6044921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 6.0, 21.0, 13.0, 25.0, 32.0, 37.0, 50.0, 50.0, 62.0, 63.0, 56.0, 79.0, 73.0, 71.0, 62.0, 42.0, 48.0, 41.0, 38.0, 24.0, 25.0, 11.0, 10.0, 7.0, 11.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015425682067871094, -0.0001490432769060135, -0.00014382973313331604, -0.0001386161893606186, -0.00013340264558792114, -0.0001281891018152237, -0.00012297555804252625, -0.0001177620142698288, -0.00011254847049713135, -0.0001073349267244339, -0.00010212138295173645, -9.6907839179039e-05, -9.169429540634155e-05, -8.64807516336441e-05, -8.126720786094666e-05, -7.60536640882492e-05, -7.084012031555176e-05, -6.562657654285431e-05, -6.041303277015686e-05, -5.519948899745941e-05, -4.998594522476196e-05, -4.4772401452064514e-05, -3.9558857679367065e-05, -3.434531390666962e-05, -2.9131770133972168e-05, -2.391822636127472e-05, -1.870468258857727e-05, -1.3491138815879822e-05, -8.277595043182373e-06, -3.0640512704849243e-06, 2.1494925022125244e-06, 7.363036274909973e-06, 1.2576580047607422e-05, 1.779012382030487e-05, 2.300366759300232e-05, 2.8217211365699768e-05, 3.343075513839722e-05, 3.8644298911094666e-05, 4.3857842683792114e-05, 4.907138645648956e-05, 5.428493022918701e-05, 5.949847400188446e-05, 6.471201777458191e-05, 6.992556154727936e-05, 7.51391053199768e-05, 8.035264909267426e-05, 8.55661928653717e-05, 9.077973663806915e-05, 9.59932804107666e-05, 0.00010120682418346405, 0.0001064203679561615, 0.00011163391172885895, 0.0001168474555015564, 0.00012206099927425385, 0.0001272745430469513, 0.00013248808681964874, 0.0001377016305923462, 0.00014291517436504364, 0.0001481287181377411, 0.00015334226191043854, 0.00015855580568313599, 0.00016376934945583344, 0.00016898289322853088, 0.00017419643700122833, 0.00017940998077392578]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 28.0, 21.0, 50.0, 65.0, 89.0, 170.0, 259.0, 365.0, 624.0, 937.0, 1558.0, 2574.0, 4229.0, 7426.0, 13417.0, 24421.0, 43942.0, 78330.0, 128056.0, 178636.0, 190180.0, 150247.0, 96743.0, 55915.0, 30554.0, 16522.0, 9376.0, 5512.0, 3145.0, 1929.0, 1162.0, 710.0, 469.0, 298.0, 205.0, 104.0, 91.0, 56.0, 34.0, 18.0, 12.0, 13.0, 10.0, 9.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4453125, -1.39898681640625, -1.3526611328125, -1.30633544921875, -1.260009765625, -1.21368408203125, -1.1673583984375, -1.12103271484375, -1.07470703125, -1.02838134765625, -0.9820556640625, -0.93572998046875, -0.889404296875, -0.84307861328125, -0.7967529296875, -0.75042724609375, -0.7041015625, -0.65777587890625, -0.6114501953125, -0.56512451171875, -0.518798828125, -0.47247314453125, -0.4261474609375, -0.37982177734375, -0.33349609375, -0.28717041015625, -0.2408447265625, -0.19451904296875, -0.148193359375, -0.10186767578125, -0.0555419921875, -0.00921630859375, 0.037109375, 0.08343505859375, 0.1297607421875, 0.17608642578125, 0.222412109375, 0.26873779296875, 0.3150634765625, 0.36138916015625, 0.40771484375, 0.45404052734375, 0.5003662109375, 0.54669189453125, 0.593017578125, 0.63934326171875, 0.6856689453125, 0.73199462890625, 0.7783203125, 0.82464599609375, 0.8709716796875, 0.91729736328125, 0.963623046875, 1.00994873046875, 1.0562744140625, 1.10260009765625, 1.14892578125, 1.19525146484375, 1.2415771484375, 1.28790283203125, 1.334228515625, 1.38055419921875, 1.4268798828125, 1.47320556640625, 1.51953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 3.0, 9.0, 10.0, 15.0, 14.0, 16.0, 15.0, 25.0, 33.0, 20.0, 45.0, 40.0, 72.0, 68.0, 52.0, 62.0, 77.0, 68.0, 55.0, 46.0, 51.0, 44.0, 31.0, 24.0, 23.0, 18.0, 7.0, 12.0, 7.0, 3.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.4009056091308594, -0.38823699951171875, -0.3755683898925781, -0.3628997802734375, -0.3502311706542969, -0.33756256103515625, -0.3248939514160156, -0.312225341796875, -0.2995567321777344, -0.28688812255859375, -0.2742195129394531, -0.2615509033203125, -0.24888229370117188, -0.23621368408203125, -0.22354507446289062, -0.21087646484375, -0.19820785522460938, -0.18553924560546875, -0.17287063598632812, -0.1602020263671875, -0.14753341674804688, -0.13486480712890625, -0.12219619750976562, -0.109527587890625, -0.09685897827148438, -0.08419036865234375, -0.07152175903320312, -0.0588531494140625, -0.046184539794921875, -0.03351593017578125, -0.020847320556640625, -0.0081787109375, 0.004489898681640625, 0.01715850830078125, 0.029827117919921875, 0.0424957275390625, 0.055164337158203125, 0.06783294677734375, 0.08050155639648438, 0.093170166015625, 0.10583877563476562, 0.11850738525390625, 0.13117599487304688, 0.1438446044921875, 0.15651321411132812, 0.16918182373046875, 0.18185043334960938, 0.19451904296875, 0.20718765258789062, 0.21985626220703125, 0.23252487182617188, 0.2451934814453125, 0.2578620910644531, 0.27053070068359375, 0.2831993103027344, 0.295867919921875, 0.3085365295410156, 0.32120513916015625, 0.3338737487792969, 0.3465423583984375, 0.3592109680175781, 0.37187957763671875, 0.3845481872558594, 0.397216796875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 8.0, 27.0, 19.0, 37.0, 32.0, 51.0, 69.0, 80.0, 92.0, 104.0, 77.0, 83.0, 72.0, 65.0, 35.0, 32.0, 28.0, 17.0, 21.0, 13.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.787813186645508, -7.59655237197876, -7.40529203414917, -7.214031219482422, -7.022770881652832, -6.831510066986084, -6.640249252319336, -6.448988914489746, -6.257728576660156, -6.066467761993408, -5.875207424163818, -5.68394660949707, -5.4926862716674805, -5.301425457000732, -5.110164642333984, -4.9189043045043945, -4.7276434898376465, -4.536382675170898, -4.345122337341309, -4.1538615226745605, -3.9626011848449707, -3.7713403701782227, -3.5800797939300537, -3.3888192176818848, -3.197558641433716, -3.006298065185547, -2.815037488937378, -2.623776912689209, -2.432516098022461, -2.241255760192871, -2.049994945526123, -1.858734369277954, -1.667473316192627, -1.476212739944458, -1.284952163696289, -1.0936914682388306, -0.9024308919906616, -0.7111703157424927, -0.5199096202850342, -0.32864904403686523, -0.1373884677886963, 0.053872138261795044, 0.24513274431228638, 0.4363933801651001, 0.627653956413269, 0.818914532661438, 1.0101752281188965, 1.2014358043670654, 1.3926963806152344, 1.5839569568634033, 1.7752175331115723, 1.9664782285690308, 2.15773868560791, 2.348999500274658, 2.540260076522827, 2.731520652770996, 2.922781229019165, 3.114041805267334, 3.305302381515503, 3.496562957763672, 3.68782377243042, 3.8790841102600098, 4.070344924926758, 4.261605262756348, 4.452866077423096]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 11.0, 10.0, 10.0, 13.0, 17.0, 17.0, 19.0, 18.0, 21.0, 33.0, 34.0, 29.0, 30.0, 37.0, 25.0, 37.0, 36.0, 42.0, 46.0, 46.0, 35.0, 39.0, 33.0, 33.0, 34.0, 22.0, 33.0, 16.0, 28.0, 27.0, 18.0, 23.0, 14.0, 16.0, 9.0, 19.0, 10.0, 17.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-2.103912353515625, -2.04496431350708, -1.9860161542892456, -1.9270681142807007, -1.8681199550628662, -1.8091719150543213, -1.7502238750457764, -1.6912758350372314, -1.632327675819397, -1.573379635810852, -1.5144314765930176, -1.4554834365844727, -1.3965353965759277, -1.3375872373580933, -1.2786391973495483, -1.2196910381317139, -1.160742998123169, -1.101794958114624, -1.0428467988967896, -0.9838987588882446, -0.9249506592750549, -0.8660025596618652, -0.8070545196533203, -0.7481064200401306, -0.6891583204269409, -0.6302102208137512, -0.5712621212005615, -0.5123140811920166, -0.4533659815788269, -0.3944178819656372, -0.3354698121547699, -0.2765217423439026, -0.21757376194000244, -0.15862567722797394, -0.09967759251594543, -0.04072950780391693, 0.018218576908111572, 0.07716667652130127, 0.13611474633216858, 0.1950628161430359, 0.2540109157562256, 0.3129590153694153, 0.3719070851802826, 0.4308551549911499, 0.4898032546043396, 0.5487513542175293, 0.6076993942260742, 0.6666474938392639, 0.7255955934524536, 0.7845436930656433, 0.843491792678833, 0.9024398326873779, 0.9613879323005676, 1.0203360319137573, 1.0792840719223022, 1.1382322311401367, 1.1971802711486816, 1.2561283111572266, 1.315076470375061, 1.374024510383606, 1.4329726696014404, 1.4919207096099854, 1.5508687496185303, 1.6098167896270752, 1.6687649488449097]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 10.0, 22.0, 25.0, 44.0, 76.0, 117.0, 191.0, 276.0, 462.0, 806.0, 1383.0, 2191.0, 3634.0, 6327.0, 11467.0, 20756.0, 39748.0, 81050.0, 178953.0, 436498.0, 997004.0, 1223554.0, 672831.0, 278304.0, 120663.0, 57059.0, 28288.0, 14712.0, 7811.0, 4306.0, 2382.0, 1377.0, 806.0, 441.0, 278.0, 170.0, 98.0, 50.0, 36.0, 25.0, 23.0, 5.0, 5.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.26519775390625, -4.1241455078125, -3.98309326171875, -3.842041015625, -3.70098876953125, -3.5599365234375, -3.41888427734375, -3.27783203125, -3.13677978515625, -2.9957275390625, -2.85467529296875, -2.713623046875, -2.57257080078125, -2.4315185546875, -2.29046630859375, -2.1494140625, -2.00836181640625, -1.8673095703125, -1.72625732421875, -1.585205078125, -1.44415283203125, -1.3031005859375, -1.16204833984375, -1.02099609375, -0.87994384765625, -0.7388916015625, -0.59783935546875, -0.456787109375, -0.31573486328125, -0.1746826171875, -0.03363037109375, 0.107421875, 0.24847412109375, 0.3895263671875, 0.53057861328125, 0.671630859375, 0.81268310546875, 0.9537353515625, 1.09478759765625, 1.23583984375, 1.37689208984375, 1.5179443359375, 1.65899658203125, 1.800048828125, 1.94110107421875, 2.0821533203125, 2.22320556640625, 2.3642578125, 2.50531005859375, 2.6463623046875, 2.78741455078125, 2.928466796875, 3.06951904296875, 3.2105712890625, 3.35162353515625, 3.49267578125, 3.63372802734375, 3.7747802734375, 3.91583251953125, 4.056884765625, 4.19793701171875, 4.3389892578125, 4.48004150390625, 4.62109375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 4.0, 5.0, 6.0, 22.0, 12.0, 19.0, 27.0, 25.0, 29.0, 26.0, 39.0, 38.0, 36.0, 43.0, 31.0, 44.0, 35.0, 36.0, 54.0, 35.0, 52.0, 49.0, 40.0, 23.0, 38.0, 37.0, 30.0, 21.0, 21.0, 35.0, 15.0, 9.0, 10.0, 6.0, 12.0, 6.0, 6.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.078125, -2.019866943359375, -1.96160888671875, -1.903350830078125, -1.8450927734375, -1.786834716796875, -1.72857666015625, -1.670318603515625, -1.612060546875, -1.553802490234375, -1.49554443359375, -1.437286376953125, -1.3790283203125, -1.320770263671875, -1.26251220703125, -1.204254150390625, -1.14599609375, -1.087738037109375, -1.02947998046875, -0.971221923828125, -0.9129638671875, -0.854705810546875, -0.79644775390625, -0.738189697265625, -0.679931640625, -0.621673583984375, -0.56341552734375, -0.505157470703125, -0.4468994140625, -0.388641357421875, -0.33038330078125, -0.272125244140625, -0.2138671875, -0.155609130859375, -0.09735107421875, -0.039093017578125, 0.0191650390625, 0.077423095703125, 0.13568115234375, 0.193939208984375, 0.252197265625, 0.310455322265625, 0.36871337890625, 0.426971435546875, 0.4852294921875, 0.543487548828125, 0.60174560546875, 0.660003662109375, 0.71826171875, 0.776519775390625, 0.83477783203125, 0.893035888671875, 0.9512939453125, 1.009552001953125, 1.06781005859375, 1.126068115234375, 1.184326171875, 1.242584228515625, 1.30084228515625, 1.359100341796875, 1.4173583984375, 1.475616455078125, 1.53387451171875, 1.592132568359375, 1.650390625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 11.0, 14.0, 27.0, 40.0, 45.0, 85.0, 134.0, 227.0, 335.0, 582.0, 967.0, 1473.0, 2510.0, 4315.0, 7428.0, 13143.0, 24089.0, 44776.0, 86996.0, 171692.0, 352864.0, 693910.0, 1039472.0, 840922.0, 451720.0, 221802.0, 110664.0, 56175.0, 29964.0, 16329.0, 9061.0, 4959.0, 3030.0, 1818.0, 1090.0, 646.0, 337.0, 231.0, 144.0, 103.0, 64.0, 32.0, 28.0, 10.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.16015625, -4.0245361328125, -3.888916015625, -3.7532958984375, -3.61767578125, -3.4820556640625, -3.346435546875, -3.2108154296875, -3.0751953125, -2.9395751953125, -2.803955078125, -2.6683349609375, -2.53271484375, -2.3970947265625, -2.261474609375, -2.1258544921875, -1.990234375, -1.8546142578125, -1.718994140625, -1.5833740234375, -1.44775390625, -1.3121337890625, -1.176513671875, -1.0408935546875, -0.9052734375, -0.7696533203125, -0.634033203125, -0.4984130859375, -0.36279296875, -0.2271728515625, -0.091552734375, 0.0440673828125, 0.1796875, 0.3153076171875, 0.450927734375, 0.5865478515625, 0.72216796875, 0.8577880859375, 0.993408203125, 1.1290283203125, 1.2646484375, 1.4002685546875, 1.535888671875, 1.6715087890625, 1.80712890625, 1.9427490234375, 2.078369140625, 2.2139892578125, 2.349609375, 2.4852294921875, 2.620849609375, 2.7564697265625, 2.89208984375, 3.0277099609375, 3.163330078125, 3.2989501953125, 3.4345703125, 3.5701904296875, 3.705810546875, 3.8414306640625, 3.97705078125, 4.1126708984375, 4.248291015625, 4.3839111328125, 4.51953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 11.0, 11.0, 14.0, 20.0, 32.0, 33.0, 47.0, 68.0, 81.0, 97.0, 99.0, 135.0, 137.0, 181.0, 201.0, 219.0, 245.0, 230.0, 285.0, 258.0, 215.0, 241.0, 199.0, 165.0, 136.0, 137.0, 100.0, 87.0, 84.0, 71.0, 52.0, 40.0, 23.0, 15.0, 23.0, 17.0, 6.0, 9.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.99072265625, -0.9569778442382812, -0.9232330322265625, -0.8894882202148438, -0.855743408203125, -0.8219985961914062, -0.7882537841796875, -0.7545089721679688, -0.72076416015625, -0.6870193481445312, -0.6532745361328125, -0.6195297241210938, -0.585784912109375, -0.5520401000976562, -0.5182952880859375, -0.48455047607421875, -0.4508056640625, -0.41706085205078125, -0.3833160400390625, -0.34957122802734375, -0.315826416015625, -0.28208160400390625, -0.2483367919921875, -0.21459197998046875, -0.18084716796875, -0.14710235595703125, -0.1133575439453125, -0.07961273193359375, -0.045867919921875, -0.01212310791015625, 0.0216217041015625, 0.05536651611328125, 0.089111328125, 0.12285614013671875, 0.1566009521484375, 0.19034576416015625, 0.224090576171875, 0.25783538818359375, 0.2915802001953125, 0.32532501220703125, 0.35906982421875, 0.39281463623046875, 0.4265594482421875, 0.46030426025390625, 0.494049072265625, 0.5277938842773438, 0.5615386962890625, 0.5952835083007812, 0.6290283203125, 0.6627731323242188, 0.6965179443359375, 0.7302627563476562, 0.764007568359375, 0.7977523803710938, 0.8314971923828125, 0.8652420043945312, 0.89898681640625, 0.9327316284179688, 0.9664764404296875, 1.0002212524414062, 1.033966064453125, 1.0677108764648438, 1.1014556884765625, 1.1352005004882812, 1.1689453125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 14.0, 12.0, 16.0, 16.0, 25.0, 49.0, 47.0, 55.0, 70.0, 64.0, 74.0, 84.0, 74.0, 80.0, 68.0, 57.0, 26.0, 30.0, 21.0, 25.0, 19.0, 8.0, 13.0, 14.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.886803150177002, -6.720529079437256, -6.554255485534668, -6.387981414794922, -6.221707344055176, -6.05543327331543, -5.889159202575684, -5.722885608673096, -5.55661153793335, -5.3903374671936035, -5.224063873291016, -5.0577898025512695, -4.891515731811523, -4.725241661071777, -4.558967590332031, -4.392693996429443, -4.226419925689697, -4.060145854949951, -3.893872022628784, -3.727598190307617, -3.561324119567871, -3.395050048828125, -3.228776216506958, -3.062502384185791, -2.896228313446045, -2.729954242706299, -2.563680410385132, -2.397406578063965, -2.2311325073242188, -2.0648584365844727, -1.8985846042633057, -1.7323106527328491, -1.5660364627838135, -1.399762511253357, -1.2334885597229004, -1.0672146081924438, -0.9009406566619873, -0.7346667051315308, -0.5683927536010742, -0.4021188020706177, -0.23584485054016113, -0.06957089900970459, 0.09670305252075195, 0.2629770040512085, 0.42925095558166504, 0.5955249071121216, 0.7617988586425781, 0.9280728101730347, 1.0943467617034912, 1.2606207132339478, 1.4268946647644043, 1.5931686162948608, 1.7594425678253174, 1.925716519355774, 2.0919904708862305, 2.2582645416259766, 2.4245383739471436, 2.5908122062683105, 2.7570862770080566, 2.9233603477478027, 3.0896341800689697, 3.2559080123901367, 3.422182083129883, 3.588456153869629, 3.754729986190796]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 5.0, 8.0, 4.0, 12.0, 20.0, 12.0, 25.0, 15.0, 20.0, 19.0, 26.0, 31.0, 31.0, 35.0, 33.0, 38.0, 50.0, 40.0, 32.0, 44.0, 44.0, 31.0, 42.0, 34.0, 29.0, 29.0, 20.0, 32.0, 25.0, 20.0, 19.0, 26.0, 20.0, 17.0, 14.0, 18.0, 11.0, 11.0, 8.0, 5.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8708324432373047, -1.8121438026428223, -1.7534551620483398, -1.6947665214538574, -1.636077880859375, -1.5773892402648926, -1.5187007188796997, -1.4600120782852173, -1.4013234376907349, -1.3426347970962524, -1.28394615650177, -1.2252575159072876, -1.1665689945220947, -1.1078803539276123, -1.0491917133331299, -0.9905030727386475, -0.931814432144165, -0.8731257915496826, -0.8144371509552002, -0.7557485699653625, -0.6970599293708801, -0.6383712887763977, -0.5796827077865601, -0.5209940671920776, -0.4623054265975952, -0.4036167860031128, -0.34492817521095276, -0.2862395644187927, -0.2275509238243103, -0.16886228322982788, -0.11017367243766785, -0.05148506164550781, 0.00720369815826416, 0.06589232385158539, 0.12458094954490662, 0.18326957523822784, 0.24195820093154907, 0.3006468415260315, 0.35933545231819153, 0.41802406311035156, 0.476712703704834, 0.5354013442993164, 0.5940899848937988, 0.6527785658836365, 0.7114672064781189, 0.7701558470726013, 0.828844428062439, 0.8875330686569214, 0.9462217092514038, 1.0049103498458862, 1.0635989904403687, 1.122287631034851, 1.180976152420044, 1.2396647930145264, 1.2983534336090088, 1.3570420742034912, 1.4157307147979736, 1.474419355392456, 1.5331079959869385, 1.591796636581421, 1.6504852771759033, 1.7091739177703857, 1.7678624391555786, 1.826551079750061, 1.8852397203445435]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 15.0, 22.0, 37.0, 46.0, 98.0, 126.0, 216.0, 317.0, 495.0, 790.0, 1301.0, 2005.0, 3435.0, 5767.0, 10168.0, 18038.0, 32493.0, 58886.0, 105221.0, 169738.0, 210826.0, 175578.0, 111063.0, 62661.0, 34362.0, 19025.0, 10695.0, 5939.0, 3474.0, 2229.0, 1299.0, 751.0, 529.0, 307.0, 216.0, 148.0, 79.0, 44.0, 35.0, 17.0, 16.0, 12.0, 14.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.328125, -0.31862640380859375, -0.3091278076171875, -0.29962921142578125, -0.290130615234375, -0.28063201904296875, -0.2711334228515625, -0.26163482666015625, -0.25213623046875, -0.24263763427734375, -0.2331390380859375, -0.22364044189453125, -0.214141845703125, -0.20464324951171875, -0.1951446533203125, -0.18564605712890625, -0.1761474609375, -0.16664886474609375, -0.1571502685546875, -0.14765167236328125, -0.138153076171875, -0.12865447998046875, -0.1191558837890625, -0.10965728759765625, -0.10015869140625, -0.09066009521484375, -0.0811614990234375, -0.07166290283203125, -0.062164306640625, -0.05266571044921875, -0.0431671142578125, -0.03366851806640625, -0.024169921875, -0.01467132568359375, -0.0051727294921875, 0.00432586669921875, 0.013824462890625, 0.02332305908203125, 0.0328216552734375, 0.04232025146484375, 0.05181884765625, 0.06131744384765625, 0.0708160400390625, 0.08031463623046875, 0.089813232421875, 0.09931182861328125, 0.1088104248046875, 0.11830902099609375, 0.1278076171875, 0.13730621337890625, 0.1468048095703125, 0.15630340576171875, 0.165802001953125, 0.17530059814453125, 0.1847991943359375, 0.19429779052734375, 0.20379638671875, 0.21329498291015625, 0.2227935791015625, 0.23229217529296875, 0.241790771484375, 0.25128936767578125, 0.2607879638671875, 0.27028656005859375, 0.27978515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 7.0, 4.0, 9.0, 10.0, 6.0, 14.0, 8.0, 16.0, 17.0, 18.0, 21.0, 26.0, 26.0, 31.0, 30.0, 46.0, 27.0, 45.0, 34.0, 48.0, 27.0, 43.0, 38.0, 37.0, 30.0, 39.0, 32.0, 36.0, 30.0, 31.0, 24.0, 19.0, 13.0, 19.0, 22.0, 21.0, 12.0, 11.0, 15.0, 12.0, 6.0, 8.0, 6.0, 6.0, 7.0, 6.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.296875, -2.228546142578125, -2.16021728515625, -2.091888427734375, -2.0235595703125, -1.955230712890625, -1.88690185546875, -1.818572998046875, -1.750244140625, -1.681915283203125, -1.61358642578125, -1.545257568359375, -1.4769287109375, -1.408599853515625, -1.34027099609375, -1.271942138671875, -1.20361328125, -1.135284423828125, -1.06695556640625, -0.998626708984375, -0.9302978515625, -0.861968994140625, -0.79364013671875, -0.725311279296875, -0.656982421875, -0.588653564453125, -0.52032470703125, -0.451995849609375, -0.3836669921875, -0.315338134765625, -0.24700927734375, -0.178680419921875, -0.1103515625, -0.042022705078125, 0.02630615234375, 0.094635009765625, 0.1629638671875, 0.231292724609375, 0.29962158203125, 0.367950439453125, 0.436279296875, 0.504608154296875, 0.57293701171875, 0.641265869140625, 0.7095947265625, 0.777923583984375, 0.84625244140625, 0.914581298828125, 0.98291015625, 1.051239013671875, 1.11956787109375, 1.187896728515625, 1.2562255859375, 1.324554443359375, 1.39288330078125, 1.461212158203125, 1.529541015625, 1.597869873046875, 1.66619873046875, 1.734527587890625, 1.8028564453125, 1.871185302734375, 1.93951416015625, 2.007843017578125, 2.076171875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 5.0, 9.0, 11.0, 27.0, 29.0, 48.0, 71.0, 70.0, 132.0, 185.0, 259.0, 443.0, 791.0, 1316.0, 2533.0, 5318.0, 12331.0, 33200.0, 741366.0, 206411.0, 24797.0, 9747.0, 4332.0, 2118.0, 1162.0, 620.0, 423.0, 244.0, 185.0, 110.0, 73.0, 44.0, 39.0, 25.0, 23.0, 14.0, 9.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.060546875, -1.0272674560546875, -0.993988037109375, -0.9607086181640625, -0.92742919921875, -0.8941497802734375, -0.860870361328125, -0.8275909423828125, -0.7943115234375, -0.7610321044921875, -0.727752685546875, -0.6944732666015625, -0.66119384765625, -0.6279144287109375, -0.594635009765625, -0.5613555908203125, -0.528076171875, -0.4947967529296875, -0.461517333984375, -0.4282379150390625, -0.39495849609375, -0.3616790771484375, -0.328399658203125, -0.2951202392578125, -0.2618408203125, -0.2285614013671875, -0.195281982421875, -0.1620025634765625, -0.12872314453125, -0.0954437255859375, -0.062164306640625, -0.0288848876953125, 0.00439453125, 0.0376739501953125, 0.070953369140625, 0.1042327880859375, 0.13751220703125, 0.1707916259765625, 0.204071044921875, 0.2373504638671875, 0.2706298828125, 0.3039093017578125, 0.337188720703125, 0.3704681396484375, 0.40374755859375, 0.4370269775390625, 0.470306396484375, 0.5035858154296875, 0.536865234375, 0.5701446533203125, 0.603424072265625, 0.6367034912109375, 0.66998291015625, 0.7032623291015625, 0.736541748046875, 0.7698211669921875, 0.8031005859375, 0.8363800048828125, 0.869659423828125, 0.9029388427734375, 0.93621826171875, 0.9694976806640625, 1.002777099609375, 1.0360565185546875, 1.0693359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 9.0, 10.0, 22.0, 21.0, 20.0, 27.0, 28.0, 25.0, 27.0, 26.0, 33.0, 33.0, 46.0, 38.0, 47.0, 46.0, 45.0, 35.0, 45.0, 43.0, 42.0, 55.0, 46.0, 29.0, 18.0, 30.0, 12.0, 24.0, 21.0, 16.0, 17.0, 9.0, 11.0, 7.0, 2.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8232421875, -1.772857666015625, -1.72247314453125, -1.672088623046875, -1.6217041015625, -1.571319580078125, -1.52093505859375, -1.470550537109375, -1.420166015625, -1.369781494140625, -1.31939697265625, -1.269012451171875, -1.2186279296875, -1.168243408203125, -1.11785888671875, -1.067474365234375, -1.01708984375, -0.966705322265625, -0.91632080078125, -0.865936279296875, -0.8155517578125, -0.765167236328125, -0.71478271484375, -0.664398193359375, -0.614013671875, -0.563629150390625, -0.51324462890625, -0.462860107421875, -0.4124755859375, -0.362091064453125, -0.31170654296875, -0.261322021484375, -0.2109375, -0.160552978515625, -0.11016845703125, -0.059783935546875, -0.0093994140625, 0.040985107421875, 0.09136962890625, 0.141754150390625, 0.192138671875, 0.242523193359375, 0.29290771484375, 0.343292236328125, 0.3936767578125, 0.444061279296875, 0.49444580078125, 0.544830322265625, 0.59521484375, 0.645599365234375, 0.69598388671875, 0.746368408203125, 0.7967529296875, 0.847137451171875, 0.89752197265625, 0.947906494140625, 0.998291015625, 1.048675537109375, 1.09906005859375, 1.149444580078125, 1.1998291015625, 1.250213623046875, 1.30059814453125, 1.350982666015625, 1.4013671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 14.0, 18.0, 27.0, 28.0, 28.0, 43.0, 54.0, 91.0, 151.0, 257.0, 448.0, 792.0, 1420.0, 2747.0, 5786.0, 13103.0, 36279.0, 903133.0, 53276.0, 16635.0, 6940.0, 3262.0, 1708.0, 913.0, 529.0, 292.0, 185.0, 119.0, 75.0, 51.0, 32.0, 31.0, 20.0, 15.0, 5.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0], "bins": [-0.338623046875, -0.3296241760253906, -0.32062530517578125, -0.3116264343261719, -0.3026275634765625, -0.2936286926269531, -0.28462982177734375, -0.2756309509277344, -0.266632080078125, -0.2576332092285156, -0.24863433837890625, -0.23963546752929688, -0.2306365966796875, -0.22163772583007812, -0.21263885498046875, -0.20363998413085938, -0.19464111328125, -0.18564224243164062, -0.17664337158203125, -0.16764450073242188, -0.1586456298828125, -0.14964675903320312, -0.14064788818359375, -0.13164901733398438, -0.122650146484375, -0.11365127563476562, -0.10465240478515625, -0.09565353393554688, -0.0866546630859375, -0.07765579223632812, -0.06865692138671875, -0.059658050537109375, -0.0506591796875, -0.041660308837890625, -0.03266143798828125, -0.023662567138671875, -0.0146636962890625, -0.005664825439453125, 0.00333404541015625, 0.012332916259765625, 0.021331787109375, 0.030330657958984375, 0.03932952880859375, 0.048328399658203125, 0.0573272705078125, 0.06632614135742188, 0.07532501220703125, 0.08432388305664062, 0.09332275390625, 0.10232162475585938, 0.11132049560546875, 0.12031936645507812, 0.1293182373046875, 0.13831710815429688, 0.14731597900390625, 0.15631484985351562, 0.165313720703125, 0.17431259155273438, 0.18331146240234375, 0.19231033325195312, 0.2013092041015625, 0.21030807495117188, 0.21930694580078125, 0.22830581665039062, 0.2373046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 4.0, 5.0, 10.0, 8.0, 17.0, 21.0, 18.0, 26.0, 20.0, 30.0, 40.0, 43.0, 37.0, 48.0, 47.0, 37.0, 56.0, 58.0, 51.0, 53.0, 54.0, 42.0, 45.0, 35.0, 30.0, 23.0, 18.0, 22.0, 9.0, 18.0, 14.0, 13.0, 7.0, 8.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.719329833984375e-05, -3.612879663705826e-05, -3.5064294934272766e-05, -3.3999793231487274e-05, -3.293529152870178e-05, -3.187078982591629e-05, -3.08062881231308e-05, -2.9741786420345306e-05, -2.8677284717559814e-05, -2.7612783014774323e-05, -2.654828131198883e-05, -2.548377960920334e-05, -2.4419277906417847e-05, -2.3354776203632355e-05, -2.2290274500846863e-05, -2.122577279806137e-05, -2.016127109527588e-05, -1.9096769392490387e-05, -1.8032267689704895e-05, -1.6967765986919403e-05, -1.590326428413391e-05, -1.483876258134842e-05, -1.3774260878562927e-05, -1.2709759175777435e-05, -1.1645257472991943e-05, -1.0580755770206451e-05, -9.51625406742096e-06, -8.451752364635468e-06, -7.387250661849976e-06, -6.322748959064484e-06, -5.258247256278992e-06, -4.1937455534935e-06, -3.129243850708008e-06, -2.064742147922516e-06, -1.000240445137024e-06, 6.426125764846802e-08, 1.12876296043396e-06, 2.193264663219452e-06, 3.257766366004944e-06, 4.322268068790436e-06, 5.386769771575928e-06, 6.45127147436142e-06, 7.515773177146912e-06, 8.580274879932404e-06, 9.644776582717896e-06, 1.0709278285503387e-05, 1.177377998828888e-05, 1.2838281691074371e-05, 1.3902783393859863e-05, 1.4967285096645355e-05, 1.6031786799430847e-05, 1.709628850221634e-05, 1.816079020500183e-05, 1.9225291907787323e-05, 2.0289793610572815e-05, 2.1354295313358307e-05, 2.24187970161438e-05, 2.348329871892929e-05, 2.4547800421714783e-05, 2.5612302124500275e-05, 2.6676803827285767e-05, 2.774130553007126e-05, 2.880580723285675e-05, 2.9870308935642242e-05, 3.0934810638427734e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 12.0, 13.0, 26.0, 37.0, 44.0, 55.0, 83.0, 94.0, 138.0, 230.0, 340.0, 451.0, 632.0, 1040.0, 1523.0, 2276.0, 3626.0, 5991.0, 9577.0, 16396.0, 28144.0, 49759.0, 89647.0, 150337.0, 208660.0, 189692.0, 123210.0, 70081.0, 39741.0, 22222.0, 12958.0, 7688.0, 4773.0, 2958.0, 1933.0, 1293.0, 934.0, 623.0, 409.0, 259.0, 188.0, 161.0, 86.0, 63.0, 48.0, 28.0, 21.0, 19.0, 9.0, 10.0, 9.0, 2.0, 2.0, 2.0], "bins": [-0.07452392578125, -0.07238197326660156, -0.07024002075195312, -0.06809806823730469, -0.06595611572265625, -0.06381416320800781, -0.061672210693359375, -0.05953025817871094, -0.0573883056640625, -0.05524635314941406, -0.053104400634765625, -0.05096244812011719, -0.04882049560546875, -0.04667854309082031, -0.044536590576171875, -0.04239463806152344, -0.040252685546875, -0.03811073303222656, -0.035968780517578125, -0.03382682800292969, -0.03168487548828125, -0.029542922973632812, -0.027400970458984375, -0.025259017944335938, -0.0231170654296875, -0.020975112915039062, -0.018833160400390625, -0.016691207885742188, -0.01454925537109375, -0.012407302856445312, -0.010265350341796875, -0.008123397827148438, -0.0059814453125, -0.0038394927978515625, -0.001697540283203125, 0.0004444122314453125, 0.00258636474609375, 0.0047283172607421875, 0.006870269775390625, 0.009012222290039062, 0.0111541748046875, 0.013296127319335938, 0.015438079833984375, 0.017580032348632812, 0.01972198486328125, 0.021863937377929688, 0.024005889892578125, 0.026147842407226562, 0.028289794921875, 0.030431747436523438, 0.032573699951171875, 0.03471565246582031, 0.03685760498046875, 0.03899955749511719, 0.041141510009765625, 0.04328346252441406, 0.0454254150390625, 0.04756736755371094, 0.049709320068359375, 0.05185127258300781, 0.05399322509765625, 0.05613517761230469, 0.058277130126953125, 0.06041908264160156, 0.06256103515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 12.0, 21.0, 22.0, 21.0, 32.0, 56.0, 74.0, 79.0, 79.0, 70.0, 78.0, 76.0, 73.0, 60.0, 57.0, 35.0, 32.0, 23.0, 20.0, 14.0, 12.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020233154296875, -0.01952052116394043, -0.01880788803100586, -0.01809525489807129, -0.01738262176513672, -0.01666998863220215, -0.015957355499267578, -0.015244722366333008, -0.014532089233398438, -0.013819456100463867, -0.013106822967529297, -0.012394189834594727, -0.011681556701660156, -0.010968923568725586, -0.010256290435791016, -0.009543657302856445, -0.008831024169921875, -0.008118391036987305, -0.007405757904052734, -0.006693124771118164, -0.005980491638183594, -0.0052678585052490234, -0.004555225372314453, -0.003842592239379883, -0.0031299591064453125, -0.002417325973510742, -0.0017046928405761719, -0.0009920597076416016, -0.00027942657470703125, 0.00043320655822753906, 0.0011458396911621094, 0.0018584728240966797, 0.00257110595703125, 0.0032837390899658203, 0.003996372222900391, 0.004709005355834961, 0.005421638488769531, 0.0061342716217041016, 0.006846904754638672, 0.007559537887573242, 0.008272171020507812, 0.008984804153442383, 0.009697437286376953, 0.010410070419311523, 0.011122703552246094, 0.011835336685180664, 0.012547969818115234, 0.013260602951049805, 0.013973236083984375, 0.014685869216918945, 0.015398502349853516, 0.016111135482788086, 0.016823768615722656, 0.017536401748657227, 0.018249034881591797, 0.018961668014526367, 0.019674301147460938, 0.020386934280395508, 0.021099567413330078, 0.02181220054626465, 0.02252483367919922, 0.02323746681213379, 0.02395009994506836, 0.02466273307800293, 0.0253753662109375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 11.0, 16.0, 8.0, 19.0, 16.0, 27.0, 45.0, 48.0, 55.0, 71.0, 65.0, 71.0, 84.0, 83.0, 81.0, 66.0, 47.0, 29.0, 31.0, 23.0, 19.0, 22.0, 12.0, 9.0, 14.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.85531759262085, -6.689630031585693, -6.523942470550537, -6.358254432678223, -6.192566871643066, -6.02687931060791, -5.861191749572754, -5.695504188537598, -5.529816627502441, -5.364129066467285, -5.198441505432129, -5.0327534675598145, -4.867065906524658, -4.701378345489502, -4.535690784454346, -4.3700032234191895, -4.204315185546875, -4.038627624511719, -3.8729398250579834, -3.707252264022827, -3.541564464569092, -3.3758769035339355, -3.2101893424987793, -3.044501781463623, -2.8788139820098877, -2.7131264209747314, -2.547438621520996, -2.38175106048584, -2.2160634994506836, -2.0503756999969482, -1.884688138961792, -1.7190004587173462, -1.5533127784729004, -1.3876250982284546, -1.2219374179840088, -1.0562498569488525, -0.8905621767044067, -0.7248744964599609, -0.5591868758201599, -0.3934992551803589, -0.22781157493591309, -0.06212392449378967, 0.10356372594833374, 0.26925137639045715, 0.43493902683258057, 0.6006267070770264, 0.7663143277168274, 0.9320019483566284, 1.0976896286010742, 1.26337730884552, 1.4290649890899658, 1.594752550125122, 1.7604402303695679, 1.9261279106140137, 2.09181547164917, 2.257503032684326, 2.4231908321380615, 2.5888783931732178, 2.754566192626953, 2.9202537536621094, 3.0859413146972656, 3.251629114151001, 3.4173166751861572, 3.5830044746398926, 3.748692035675049]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 9.0, 6.0, 10.0, 16.0, 16.0, 20.0, 18.0, 18.0, 18.0, 27.0, 26.0, 36.0, 33.0, 35.0, 39.0, 46.0, 45.0, 29.0, 42.0, 45.0, 35.0, 40.0, 36.0, 28.0, 32.0, 22.0, 30.0, 22.0, 22.0, 22.0, 26.0, 21.0, 14.0, 15.0, 18.0, 10.0, 13.0, 6.0, 7.0, 5.0, 8.0, 2.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8758937120437622, -1.8173400163650513, -1.7587863206863403, -1.7002326250076294, -1.6416789293289185, -1.5831252336502075, -1.524571418762207, -1.466017723083496, -1.4074640274047852, -1.3489103317260742, -1.2903566360473633, -1.2318029403686523, -1.1732492446899414, -1.1146955490112305, -1.0561418533325195, -0.9975880980491638, -0.9390344619750977, -0.8804807662963867, -0.8219270706176758, -0.7633733749389648, -0.7048196792602539, -0.646265983581543, -0.5877122282981873, -0.5291585326194763, -0.4706048369407654, -0.41205114126205444, -0.3534974455833435, -0.2949437201023102, -0.23639002442359924, -0.1778363287448883, -0.11928260326385498, -0.06072890758514404, -0.0021750926971435547, 0.05637861043214798, 0.11493231356143951, 0.17348602414131165, 0.23203971982002258, 0.2905934154987335, 0.34914714097976685, 0.4077008366584778, 0.4662545323371887, 0.5248082280158997, 0.5833619236946106, 0.6419156789779663, 0.7004693746566772, 0.7590230703353882, 0.8175767660140991, 0.8761304616928101, 0.934684157371521, 0.9932378530502319, 1.0517915487289429, 1.1103452444076538, 1.1688989400863647, 1.2274526357650757, 1.2860064506530762, 1.344560146331787, 1.403113842010498, 1.461667537689209, 1.52022123336792, 1.5787749290466309, 1.6373286247253418, 1.6958823204040527, 1.7544360160827637, 1.8129897117614746, 1.8715434074401855]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 16.0, 23.0, 29.0, 52.0, 57.0, 75.0, 154.0, 233.0, 299.0, 463.0, 734.0, 1185.0, 1680.0, 2687.0, 4302.0, 6911.0, 10312.0, 16105.0, 24830.0, 37831.0, 55167.0, 77715.0, 102431.0, 123341.0, 131028.0, 120995.0, 99998.0, 75064.0, 52509.0, 35529.0, 23661.0, 15383.0, 9850.0, 6387.0, 4089.0, 2581.0, 1668.0, 1122.0, 721.0, 458.0, 312.0, 194.0, 120.0, 84.0, 55.0, 41.0, 26.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-2.22265625, -2.15618896484375, -2.0897216796875, -2.02325439453125, -1.956787109375, -1.89031982421875, -1.8238525390625, -1.75738525390625, -1.69091796875, -1.62445068359375, -1.5579833984375, -1.49151611328125, -1.425048828125, -1.35858154296875, -1.2921142578125, -1.22564697265625, -1.1591796875, -1.09271240234375, -1.0262451171875, -0.95977783203125, -0.893310546875, -0.82684326171875, -0.7603759765625, -0.69390869140625, -0.62744140625, -0.56097412109375, -0.4945068359375, -0.42803955078125, -0.361572265625, -0.29510498046875, -0.2286376953125, -0.16217041015625, -0.095703125, -0.02923583984375, 0.0372314453125, 0.10369873046875, 0.170166015625, 0.23663330078125, 0.3031005859375, 0.36956787109375, 0.43603515625, 0.50250244140625, 0.5689697265625, 0.63543701171875, 0.701904296875, 0.76837158203125, 0.8348388671875, 0.90130615234375, 0.9677734375, 1.03424072265625, 1.1007080078125, 1.16717529296875, 1.233642578125, 1.30010986328125, 1.3665771484375, 1.43304443359375, 1.49951171875, 1.56597900390625, 1.6324462890625, 1.69891357421875, 1.765380859375, 1.83184814453125, 1.8983154296875, 1.96478271484375, 2.03125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 6.0, 11.0, 20.0, 19.0, 21.0, 29.0, 31.0, 33.0, 31.0, 41.0, 42.0, 47.0, 39.0, 46.0, 38.0, 48.0, 53.0, 33.0, 44.0, 39.0, 34.0, 37.0, 30.0, 29.0, 22.0, 24.0, 20.0, 27.0, 10.0, 8.0, 13.0, 10.0, 10.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.3851318359375, -2.307373046875, -2.2296142578125, -2.15185546875, -2.0740966796875, -1.996337890625, -1.9185791015625, -1.8408203125, -1.7630615234375, -1.685302734375, -1.6075439453125, -1.52978515625, -1.4520263671875, -1.374267578125, -1.2965087890625, -1.21875, -1.1409912109375, -1.063232421875, -0.9854736328125, -0.90771484375, -0.8299560546875, -0.752197265625, -0.6744384765625, -0.5966796875, -0.5189208984375, -0.441162109375, -0.3634033203125, -0.28564453125, -0.2078857421875, -0.130126953125, -0.0523681640625, 0.025390625, 0.1031494140625, 0.180908203125, 0.2586669921875, 0.33642578125, 0.4141845703125, 0.491943359375, 0.5697021484375, 0.6474609375, 0.7252197265625, 0.802978515625, 0.8807373046875, 0.95849609375, 1.0362548828125, 1.114013671875, 1.1917724609375, 1.26953125, 1.3472900390625, 1.425048828125, 1.5028076171875, 1.58056640625, 1.6583251953125, 1.736083984375, 1.8138427734375, 1.8916015625, 1.9693603515625, 2.047119140625, 2.1248779296875, 2.20263671875, 2.2803955078125, 2.358154296875, 2.4359130859375, 2.513671875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 9.0, 11.0, 16.0, 22.0, 26.0, 56.0, 73.0, 121.0, 157.0, 250.0, 365.0, 621.0, 908.0, 1485.0, 2326.0, 3771.0, 6130.0, 10011.0, 16425.0, 26272.0, 42704.0, 65500.0, 95190.0, 125552.0, 144413.0, 141825.0, 118613.0, 87730.0, 58910.0, 37881.0, 23420.0, 14468.0, 8731.0, 5496.0, 3274.0, 2123.0, 1328.0, 848.0, 496.0, 368.0, 226.0, 143.0, 85.0, 66.0, 34.0, 27.0, 21.0, 13.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.4375, -2.358551025390625, -2.27960205078125, -2.200653076171875, -2.1217041015625, -2.042755126953125, -1.96380615234375, -1.884857177734375, -1.805908203125, -1.726959228515625, -1.64801025390625, -1.569061279296875, -1.4901123046875, -1.411163330078125, -1.33221435546875, -1.253265380859375, -1.17431640625, -1.095367431640625, -1.01641845703125, -0.937469482421875, -0.8585205078125, -0.779571533203125, -0.70062255859375, -0.621673583984375, -0.542724609375, -0.463775634765625, -0.38482666015625, -0.305877685546875, -0.2269287109375, -0.147979736328125, -0.06903076171875, 0.009918212890625, 0.0888671875, 0.167816162109375, 0.24676513671875, 0.325714111328125, 0.4046630859375, 0.483612060546875, 0.56256103515625, 0.641510009765625, 0.720458984375, 0.799407958984375, 0.87835693359375, 0.957305908203125, 1.0362548828125, 1.115203857421875, 1.19415283203125, 1.273101806640625, 1.35205078125, 1.430999755859375, 1.50994873046875, 1.588897705078125, 1.6678466796875, 1.746795654296875, 1.82574462890625, 1.904693603515625, 1.983642578125, 2.062591552734375, 2.14154052734375, 2.220489501953125, 2.2994384765625, 2.378387451171875, 2.45733642578125, 2.536285400390625, 2.615234375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 11.0, 10.0, 5.0, 7.0, 13.0, 12.0, 15.0, 22.0, 17.0, 20.0, 30.0, 25.0, 23.0, 37.0, 40.0, 32.0, 37.0, 28.0, 38.0, 35.0, 30.0, 39.0, 39.0, 36.0, 36.0, 31.0, 31.0, 23.0, 16.0, 34.0, 25.0, 20.0, 22.0, 14.0, 18.0, 16.0, 12.0, 11.0, 15.0, 7.0, 8.0, 6.0, 4.0, 9.0, 6.0, 0.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-1.3134765625, -1.274261474609375, -1.23504638671875, -1.195831298828125, -1.1566162109375, -1.117401123046875, -1.07818603515625, -1.038970947265625, -0.999755859375, -0.960540771484375, -0.92132568359375, -0.882110595703125, -0.8428955078125, -0.803680419921875, -0.76446533203125, -0.725250244140625, -0.68603515625, -0.646820068359375, -0.60760498046875, -0.568389892578125, -0.5291748046875, -0.489959716796875, -0.45074462890625, -0.411529541015625, -0.372314453125, -0.333099365234375, -0.29388427734375, -0.254669189453125, -0.2154541015625, -0.176239013671875, -0.13702392578125, -0.097808837890625, -0.05859375, -0.019378662109375, 0.01983642578125, 0.059051513671875, 0.0982666015625, 0.137481689453125, 0.17669677734375, 0.215911865234375, 0.255126953125, 0.294342041015625, 0.33355712890625, 0.372772216796875, 0.4119873046875, 0.451202392578125, 0.49041748046875, 0.529632568359375, 0.56884765625, 0.608062744140625, 0.64727783203125, 0.686492919921875, 0.7257080078125, 0.764923095703125, 0.80413818359375, 0.843353271484375, 0.882568359375, 0.921783447265625, 0.96099853515625, 1.000213623046875, 1.0394287109375, 1.078643798828125, 1.11785888671875, 1.157073974609375, 1.1962890625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 15.0, 29.0, 29.0, 40.0, 68.0, 96.0, 153.0, 235.0, 319.0, 577.0, 766.0, 1248.0, 1835.0, 2983.0, 4741.0, 7500.0, 12007.0, 19857.0, 33435.0, 55280.0, 89246.0, 133294.0, 168881.0, 167382.0, 128911.0, 85325.0, 52502.0, 31508.0, 18947.0, 11711.0, 7032.0, 4514.0, 2878.0, 1771.0, 1191.0, 783.0, 499.0, 297.0, 216.0, 148.0, 93.0, 69.0, 52.0, 25.0, 13.0, 13.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.3737030029296875, -1.324554443359375, -1.2754058837890625, -1.22625732421875, -1.1771087646484375, -1.127960205078125, -1.0788116455078125, -1.0296630859375, -0.9805145263671875, -0.931365966796875, -0.8822174072265625, -0.83306884765625, -0.7839202880859375, -0.734771728515625, -0.6856231689453125, -0.636474609375, -0.5873260498046875, -0.538177490234375, -0.4890289306640625, -0.43988037109375, -0.3907318115234375, -0.341583251953125, -0.2924346923828125, -0.2432861328125, -0.1941375732421875, -0.144989013671875, -0.0958404541015625, -0.04669189453125, 0.0024566650390625, 0.051605224609375, 0.1007537841796875, 0.14990234375, 0.1990509033203125, 0.248199462890625, 0.2973480224609375, 0.34649658203125, 0.3956451416015625, 0.444793701171875, 0.4939422607421875, 0.5430908203125, 0.5922393798828125, 0.641387939453125, 0.6905364990234375, 0.73968505859375, 0.7888336181640625, 0.837982177734375, 0.8871307373046875, 0.936279296875, 0.9854278564453125, 1.034576416015625, 1.0837249755859375, 1.13287353515625, 1.1820220947265625, 1.231170654296875, 1.2803192138671875, 1.3294677734375, 1.3786163330078125, 1.427764892578125, 1.4769134521484375, 1.52606201171875, 1.5752105712890625, 1.624359130859375, 1.6735076904296875, 1.72265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 6.0, 14.0, 11.0, 9.0, 20.0, 27.0, 26.0, 31.0, 42.0, 63.0, 50.0, 52.0, 61.0, 77.0, 64.0, 56.0, 52.0, 56.0, 42.0, 43.0, 39.0, 24.0, 20.0, 16.0, 20.0, 15.0, 11.0, 11.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019168853759765625, -0.0001863911747932434, -0.00018109381198883057, -0.00017579644918441772, -0.00017049908638000488, -0.00016520172357559204, -0.0001599043607711792, -0.00015460699796676636, -0.00014930963516235352, -0.00014401227235794067, -0.00013871490955352783, -0.000133417546749115, -0.00012812018394470215, -0.0001228228211402893, -0.00011752545833587646, -0.00011222809553146362, -0.00010693073272705078, -0.00010163336992263794, -9.63360071182251e-05, -9.103864431381226e-05, -8.574128150939941e-05, -8.044391870498657e-05, -7.514655590057373e-05, -6.984919309616089e-05, -6.455183029174805e-05, -5.9254467487335205e-05, -5.395710468292236e-05, -4.865974187850952e-05, -4.336237907409668e-05, -3.806501626968384e-05, -3.2767653465270996e-05, -2.7470290660858154e-05, -2.2172927856445312e-05, -1.687556505203247e-05, -1.1578202247619629e-05, -6.280839443206787e-06, -9.834766387939453e-07, 4.3138861656188965e-06, 9.611248970031738e-06, 1.490861177444458e-05, 2.0205974578857422e-05, 2.5503337383270264e-05, 3.0800700187683105e-05, 3.609806299209595e-05, 4.139542579650879e-05, 4.669278860092163e-05, 5.199015140533447e-05, 5.7287514209747314e-05, 6.258487701416016e-05, 6.7882239818573e-05, 7.317960262298584e-05, 7.847696542739868e-05, 8.377432823181152e-05, 8.907169103622437e-05, 9.436905384063721e-05, 9.966641664505005e-05, 0.00010496377944946289, 0.00011026114225387573, 0.00011555850505828857, 0.00012085586786270142, 0.00012615323066711426, 0.0001314505934715271, 0.00013674795627593994, 0.00014204531908035278, 0.00014734268188476562]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 3.0, 8.0, 9.0, 14.0, 34.0, 32.0, 45.0, 69.0, 93.0, 172.0, 243.0, 457.0, 735.0, 1195.0, 2130.0, 3774.0, 6844.0, 12355.0, 22021.0, 39530.0, 68820.0, 112243.0, 162020.0, 184841.0, 161134.0, 112501.0, 68200.0, 39165.0, 21908.0, 12127.0, 6843.0, 3727.0, 2162.0, 1235.0, 689.0, 452.0, 278.0, 164.0, 108.0, 53.0, 30.0, 35.0, 18.0, 16.0, 11.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.609375, -1.5613250732421875, -1.513275146484375, -1.4652252197265625, -1.41717529296875, -1.3691253662109375, -1.321075439453125, -1.2730255126953125, -1.2249755859375, -1.1769256591796875, -1.128875732421875, -1.0808258056640625, -1.03277587890625, -0.9847259521484375, -0.936676025390625, -0.8886260986328125, -0.840576171875, -0.7925262451171875, -0.744476318359375, -0.6964263916015625, -0.64837646484375, -0.6003265380859375, -0.552276611328125, -0.5042266845703125, -0.4561767578125, -0.4081268310546875, -0.360076904296875, -0.3120269775390625, -0.26397705078125, -0.2159271240234375, -0.167877197265625, -0.1198272705078125, -0.07177734375, -0.0237274169921875, 0.024322509765625, 0.0723724365234375, 0.12042236328125, 0.1684722900390625, 0.216522216796875, 0.2645721435546875, 0.3126220703125, 0.3606719970703125, 0.408721923828125, 0.4567718505859375, 0.50482177734375, 0.5528717041015625, 0.600921630859375, 0.6489715576171875, 0.697021484375, 0.7450714111328125, 0.793121337890625, 0.8411712646484375, 0.88922119140625, 0.9372711181640625, 0.985321044921875, 1.0333709716796875, 1.0814208984375, 1.1294708251953125, 1.177520751953125, 1.2255706787109375, 1.27362060546875, 1.3216705322265625, 1.369720458984375, 1.4177703857421875, 1.4658203125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 12.0, 15.0, 21.0, 28.0, 23.0, 30.0, 50.0, 50.0, 72.0, 59.0, 71.0, 71.0, 74.0, 59.0, 55.0, 45.0, 64.0, 46.0, 42.0, 31.0, 24.0, 18.0, 10.0, 3.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5576171875, -0.5405807495117188, -0.5235443115234375, -0.5065078735351562, -0.489471435546875, -0.47243499755859375, -0.4553985595703125, -0.43836212158203125, -0.42132568359375, -0.40428924560546875, -0.3872528076171875, -0.37021636962890625, -0.353179931640625, -0.33614349365234375, -0.3191070556640625, -0.30207061767578125, -0.2850341796875, -0.26799774169921875, -0.2509613037109375, -0.23392486572265625, -0.216888427734375, -0.19985198974609375, -0.1828155517578125, -0.16577911376953125, -0.14874267578125, -0.13170623779296875, -0.1146697998046875, -0.09763336181640625, -0.080596923828125, -0.06356048583984375, -0.0465240478515625, -0.02948760986328125, -0.012451171875, 0.00458526611328125, 0.0216217041015625, 0.03865814208984375, 0.055694580078125, 0.07273101806640625, 0.0897674560546875, 0.10680389404296875, 0.12384033203125, 0.14087677001953125, 0.1579132080078125, 0.17494964599609375, 0.191986083984375, 0.20902252197265625, 0.2260589599609375, 0.24309539794921875, 0.2601318359375, 0.27716827392578125, 0.2942047119140625, 0.31124114990234375, 0.328277587890625, 0.34531402587890625, 0.3623504638671875, 0.37938690185546875, 0.39642333984375, 0.41345977783203125, 0.4304962158203125, 0.44753265380859375, 0.464569091796875, 0.48160552978515625, 0.4986419677734375, 0.5156784057617188, 0.53271484375]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 13.0, 11.0, 11.0, 18.0, 21.0, 24.0, 26.0, 41.0, 40.0, 61.0, 62.0, 75.0, 79.0, 75.0, 82.0, 49.0, 76.0, 41.0, 48.0, 19.0, 24.0, 20.0, 22.0, 14.0, 16.0, 14.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.6054840087890625, -6.44195032119751, -6.278416633605957, -6.1148834228515625, -5.95134973526001, -5.787816047668457, -5.624282360076904, -5.460748672485352, -5.297215461730957, -5.133681774139404, -4.970148086547852, -4.806614875793457, -4.643081188201904, -4.479547500610352, -4.316013813018799, -4.152480125427246, -3.9889466762542725, -3.8254129886627197, -3.661879539489746, -3.4983458518981934, -3.3348124027252197, -3.171278715133667, -3.0077452659606934, -2.8442115783691406, -2.680677890777588, -2.517144203186035, -2.3536107540130615, -2.190077066421509, -2.026543617248535, -1.8630099296569824, -1.6994763612747192, -1.535942792892456, -1.3724095821380615, -1.2088760137557983, -1.0453424453735352, -0.8818088173866272, -0.718275249004364, -0.5547416806221008, -0.39120805263519287, -0.2276744842529297, -0.0641409158706665, 0.09939266741275787, 0.26292625069618225, 0.4264598488807678, 0.589993417263031, 0.7535269856452942, 0.9170606136322021, 1.0805941820144653, 1.2441277503967285, 1.4076613187789917, 1.5711948871612549, 1.7347285747528076, 1.8982620239257812, 2.061795711517334, 2.2253293991088867, 2.3888628482818604, 2.552396297454834, 2.7159299850463867, 2.8794634342193604, 3.042997121810913, 3.2065305709838867, 3.3700642585754395, 3.533597946166992, 3.697131395339966, 3.8606650829315186]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 2.0, 7.0, 12.0, 16.0, 11.0, 17.0, 17.0, 16.0, 26.0, 24.0, 19.0, 20.0, 30.0, 33.0, 19.0, 29.0, 35.0, 33.0, 32.0, 49.0, 39.0, 36.0, 35.0, 35.0, 39.0, 27.0, 34.0, 24.0, 17.0, 32.0, 21.0, 25.0, 21.0, 23.0, 13.0, 19.0, 14.0, 18.0, 14.0, 5.0, 10.0, 7.0, 10.0, 6.0, 2.0, 8.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.917460560798645, -1.8577678203582764, -1.7980751991271973, -1.7383824586868286, -1.67868971824646, -1.6189970970153809, -1.5593043565750122, -1.4996116161346436, -1.4399189949035645, -1.3802262544631958, -1.3205336332321167, -1.260840892791748, -1.2011481523513794, -1.1414554119110107, -1.0817627906799316, -1.022070050239563, -0.9623773097991943, -0.9026846289634705, -0.8429918885231018, -0.7832992076873779, -0.7236064672470093, -0.6639137864112854, -0.6042211055755615, -0.5445283651351929, -0.484835684299469, -0.42514297366142273, -0.36545026302337646, -0.3057575821876526, -0.24606487154960632, -0.18637216091156006, -0.12667948007583618, -0.06698676943778992, -0.007294178009033203, 0.052398525178432465, 0.11209122836589813, 0.1717839241027832, 0.23147663474082947, 0.29116934537887573, 0.3508620262145996, 0.4105547368526459, 0.47024744749069214, 0.529940128326416, 0.5896328687667847, 0.6493255496025085, 0.7090182304382324, 0.7687109708786011, 0.828403651714325, 0.8880963325500488, 0.9477890729904175, 1.0074818134307861, 1.0671744346618652, 1.1268671751022339, 1.1865599155426025, 1.2462525367736816, 1.3059452772140503, 1.365638017654419, 1.425330638885498, 1.4850233793258667, 1.5447160005569458, 1.6044087409973145, 1.664101481437683, 1.7237942218780518, 1.7834868431091309, 1.8431795835494995, 1.9028723239898682]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 8.0, 15.0, 26.0, 44.0, 60.0, 100.0, 166.0, 224.0, 320.0, 479.0, 768.0, 1343.0, 2017.0, 3275.0, 5534.0, 9909.0, 17397.0, 32985.0, 65687.0, 141046.0, 332614.0, 793353.0, 1249471.0, 856099.0, 369269.0, 158618.0, 73510.0, 36634.0, 19020.0, 10270.0, 5696.0, 3384.0, 1934.0, 1102.0, 692.0, 422.0, 281.0, 169.0, 113.0, 72.0, 44.0, 21.0, 27.0, 10.0, 12.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.41015625, -4.26092529296875, -4.1116943359375, -3.96246337890625, -3.813232421875, -3.66400146484375, -3.5147705078125, -3.36553955078125, -3.21630859375, -3.06707763671875, -2.9178466796875, -2.76861572265625, -2.619384765625, -2.47015380859375, -2.3209228515625, -2.17169189453125, -2.0224609375, -1.87322998046875, -1.7239990234375, -1.57476806640625, -1.425537109375, -1.27630615234375, -1.1270751953125, -0.97784423828125, -0.82861328125, -0.67938232421875, -0.5301513671875, -0.38092041015625, -0.231689453125, -0.08245849609375, 0.0667724609375, 0.21600341796875, 0.365234375, 0.51446533203125, 0.6636962890625, 0.81292724609375, 0.962158203125, 1.11138916015625, 1.2606201171875, 1.40985107421875, 1.55908203125, 1.70831298828125, 1.8575439453125, 2.00677490234375, 2.156005859375, 2.30523681640625, 2.4544677734375, 2.60369873046875, 2.7529296875, 2.90216064453125, 3.0513916015625, 3.20062255859375, 3.349853515625, 3.49908447265625, 3.6483154296875, 3.79754638671875, 3.94677734375, 4.09600830078125, 4.2452392578125, 4.39447021484375, 4.543701171875, 4.69293212890625, 4.8421630859375, 4.99139404296875, 5.140625]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 7.0, 18.0, 20.0, 22.0, 21.0, 18.0, 25.0, 18.0, 24.0, 28.0, 44.0, 31.0, 35.0, 38.0, 37.0, 26.0, 36.0, 35.0, 42.0, 32.0, 36.0, 33.0, 37.0, 28.0, 24.0, 37.0, 29.0, 15.0, 28.0, 27.0, 15.0, 14.0, 18.0, 14.0, 9.0, 4.0, 15.0, 6.0, 8.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7802734375, -1.7282562255859375, -1.676239013671875, -1.6242218017578125, -1.57220458984375, -1.5201873779296875, -1.468170166015625, -1.4161529541015625, -1.3641357421875, -1.3121185302734375, -1.260101318359375, -1.2080841064453125, -1.15606689453125, -1.1040496826171875, -1.052032470703125, -1.0000152587890625, -0.947998046875, -0.8959808349609375, -0.843963623046875, -0.7919464111328125, -0.73992919921875, -0.6879119873046875, -0.635894775390625, -0.5838775634765625, -0.5318603515625, -0.4798431396484375, -0.427825927734375, -0.3758087158203125, -0.32379150390625, -0.2717742919921875, -0.219757080078125, -0.1677398681640625, -0.11572265625, -0.0637054443359375, -0.011688232421875, 0.0403289794921875, 0.09234619140625, 0.1443634033203125, 0.196380615234375, 0.2483978271484375, 0.3004150390625, 0.3524322509765625, 0.404449462890625, 0.4564666748046875, 0.50848388671875, 0.5605010986328125, 0.612518310546875, 0.6645355224609375, 0.716552734375, 0.7685699462890625, 0.820587158203125, 0.8726043701171875, 0.92462158203125, 0.9766387939453125, 1.028656005859375, 1.0806732177734375, 1.1326904296875, 1.1847076416015625, 1.236724853515625, 1.2887420654296875, 1.34075927734375, 1.3927764892578125, 1.444793701171875, 1.4968109130859375, 1.548828125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 3.0, 11.0, 19.0, 26.0, 35.0, 63.0, 93.0, 155.0, 196.0, 322.0, 534.0, 826.0, 1419.0, 2301.0, 4004.0, 6839.0, 12235.0, 22022.0, 40720.0, 78965.0, 152623.0, 302319.0, 587283.0, 952865.0, 915299.0, 540664.0, 275901.0, 138908.0, 72020.0, 37760.0, 20745.0, 11339.0, 6498.0, 3679.0, 2098.0, 1331.0, 795.0, 512.0, 324.0, 207.0, 118.0, 69.0, 50.0, 34.0, 16.0, 16.0, 8.0, 8.0, 1.0, 2.0, 3.0], "bins": [-5.29296875, -5.149658203125, -5.00634765625, -4.863037109375, -4.7197265625, -4.576416015625, -4.43310546875, -4.289794921875, -4.146484375, -4.003173828125, -3.85986328125, -3.716552734375, -3.5732421875, -3.429931640625, -3.28662109375, -3.143310546875, -3.0, -2.856689453125, -2.71337890625, -2.570068359375, -2.4267578125, -2.283447265625, -2.14013671875, -1.996826171875, -1.853515625, -1.710205078125, -1.56689453125, -1.423583984375, -1.2802734375, -1.136962890625, -0.99365234375, -0.850341796875, -0.70703125, -0.563720703125, -0.42041015625, -0.277099609375, -0.1337890625, 0.009521484375, 0.15283203125, 0.296142578125, 0.439453125, 0.582763671875, 0.72607421875, 0.869384765625, 1.0126953125, 1.156005859375, 1.29931640625, 1.442626953125, 1.5859375, 1.729248046875, 1.87255859375, 2.015869140625, 2.1591796875, 2.302490234375, 2.44580078125, 2.589111328125, 2.732421875, 2.875732421875, 3.01904296875, 3.162353515625, 3.3056640625, 3.448974609375, 3.59228515625, 3.735595703125, 3.87890625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 12.0, 14.0, 20.0, 27.0, 35.0, 52.0, 52.0, 70.0, 92.0, 112.0, 122.0, 153.0, 190.0, 215.0, 242.0, 252.0, 278.0, 304.0, 265.0, 256.0, 234.0, 176.0, 178.0, 144.0, 101.0, 98.0, 87.0, 66.0, 40.0, 48.0, 40.0, 20.0, 15.0, 16.0, 7.0, 6.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.86334228515625, -0.8243408203125, -0.78533935546875, -0.746337890625, -0.70733642578125, -0.6683349609375, -0.62933349609375, -0.59033203125, -0.55133056640625, -0.5123291015625, -0.47332763671875, -0.434326171875, -0.39532470703125, -0.3563232421875, -0.31732177734375, -0.2783203125, -0.23931884765625, -0.2003173828125, -0.16131591796875, -0.122314453125, -0.08331298828125, -0.0443115234375, -0.00531005859375, 0.03369140625, 0.07269287109375, 0.1116943359375, 0.15069580078125, 0.189697265625, 0.22869873046875, 0.2677001953125, 0.30670166015625, 0.345703125, 0.38470458984375, 0.4237060546875, 0.46270751953125, 0.501708984375, 0.54071044921875, 0.5797119140625, 0.61871337890625, 0.65771484375, 0.69671630859375, 0.7357177734375, 0.77471923828125, 0.813720703125, 0.85272216796875, 0.8917236328125, 0.93072509765625, 0.9697265625, 1.00872802734375, 1.0477294921875, 1.08673095703125, 1.125732421875, 1.16473388671875, 1.2037353515625, 1.24273681640625, 1.28173828125, 1.32073974609375, 1.3597412109375, 1.39874267578125, 1.437744140625, 1.47674560546875, 1.5157470703125, 1.55474853515625, 1.59375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 17.0, 12.0, 19.0, 21.0, 23.0, 23.0, 33.0, 40.0, 46.0, 36.0, 49.0, 55.0, 60.0, 72.0, 52.0, 68.0, 42.0, 55.0, 42.0, 28.0, 33.0, 26.0, 22.0, 15.0, 21.0, 15.0, 10.0, 7.0, 11.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.709427356719971, -4.573078155517578, -4.4367289543151855, -4.300380229949951, -4.164031028747559, -4.027681827545166, -3.8913326263427734, -3.75498366355896, -3.6186347007751465, -3.482285499572754, -3.3459365367889404, -3.209587335586548, -3.0732383728027344, -2.936889171600342, -2.800539970397949, -2.6641910076141357, -2.527841806411743, -2.3914926052093506, -2.255143642425537, -2.1187944412231445, -1.982445478439331, -1.8460962772369385, -1.7097471952438354, -1.5733981132507324, -1.4370490312576294, -1.3006999492645264, -1.1643508672714233, -1.0280017852783203, -0.8916526436805725, -0.7553035616874695, -0.6189544200897217, -0.48260533809661865, -0.3462562561035156, -0.2099071592092514, -0.07355806231498718, 0.06279104948043823, 0.19914013147354126, 0.3354892134666443, 0.4718383550643921, 0.6081874370574951, 0.7445365190505981, 0.8808856010437012, 1.0172346830368042, 1.1535837650299072, 1.2899329662322998, 1.4262819290161133, 1.5626311302185059, 1.6989802122116089, 1.835329294204712, 1.971678376197815, 2.108027458190918, 2.2443766593933105, 2.380725622177124, 2.5170748233795166, 2.65342378616333, 2.7897729873657227, 2.9261221885681152, 3.062471389770508, 3.1988203525543213, 3.335169553756714, 3.4715185165405273, 3.60786771774292, 3.7442169189453125, 3.880565881729126, 4.0169148445129395]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 4.0, 10.0, 16.0, 20.0, 12.0, 18.0, 14.0, 22.0, 26.0, 18.0, 27.0, 35.0, 30.0, 45.0, 36.0, 41.0, 48.0, 44.0, 41.0, 48.0, 28.0, 39.0, 35.0, 27.0, 31.0, 27.0, 30.0, 29.0, 28.0, 31.0, 16.0, 19.0, 13.0, 10.0, 10.0, 17.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.2914984226226807, -2.2230279445648193, -2.154557704925537, -2.086087226867676, -2.0176169872283936, -1.9491465091705322, -1.8806761503219604, -1.8122057914733887, -1.7437353134155273, -1.6752649545669556, -1.6067945957183838, -1.5383241176605225, -1.4698537588119507, -1.401383399963379, -1.3329130411148071, -1.2644426822662354, -1.1959723234176636, -1.1275019645690918, -1.05903160572052, -0.9905611872673035, -0.9220907688140869, -0.8536204099655151, -0.7851500511169434, -0.7166796922683716, -0.648209273815155, -0.5797389149665833, -0.5112684965133667, -0.4427981376647949, -0.37432774901390076, -0.3058573603630066, -0.23738700151443481, -0.16891661286354065, -0.10044622421264648, -0.031975843012332916, 0.03649453818798065, 0.10496491193771362, 0.1734353005886078, 0.24190568923950195, 0.31037604808807373, 0.3788464367389679, 0.44731682538986206, 0.5157871842384338, 0.5842576026916504, 0.6527279615402222, 0.721198320388794, 0.7896687388420105, 0.8581390976905823, 0.9266095161437988, 0.9950798749923706, 1.0635502338409424, 1.1320205926895142, 1.200490951538086, 1.2689614295959473, 1.337431788444519, 1.4059021472930908, 1.4743725061416626, 1.5428428649902344, 1.6113132238388062, 1.679783582687378, 1.7482540607452393, 1.816724419593811, 1.8851947784423828, 1.9536651372909546, 2.0221354961395264, 2.0906059741973877]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 14.0, 8.0, 9.0, 19.0, 22.0, 41.0, 89.0, 108.0, 185.0, 356.0, 575.0, 941.0, 1618.0, 2973.0, 5166.0, 9340.0, 17459.0, 31990.0, 59581.0, 108846.0, 174694.0, 213955.0, 176805.0, 110523.0, 61422.0, 32451.0, 17742.0, 9366.0, 5227.0, 2963.0, 1671.0, 995.0, 552.0, 340.0, 205.0, 111.0, 74.0, 40.0, 32.0, 16.0, 11.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.3935546875, -0.38306427001953125, -0.3725738525390625, -0.36208343505859375, -0.351593017578125, -0.34110260009765625, -0.3306121826171875, -0.32012176513671875, -0.30963134765625, -0.29914093017578125, -0.2886505126953125, -0.27816009521484375, -0.267669677734375, -0.25717926025390625, -0.2466888427734375, -0.23619842529296875, -0.2257080078125, -0.21521759033203125, -0.2047271728515625, -0.19423675537109375, -0.183746337890625, -0.17325592041015625, -0.1627655029296875, -0.15227508544921875, -0.14178466796875, -0.13129425048828125, -0.1208038330078125, -0.11031341552734375, -0.099822998046875, -0.08933258056640625, -0.0788421630859375, -0.06835174560546875, -0.057861328125, -0.04737091064453125, -0.0368804931640625, -0.02639007568359375, -0.015899658203125, -0.00540924072265625, 0.0050811767578125, 0.01557159423828125, 0.02606201171875, 0.03655242919921875, 0.0470428466796875, 0.05753326416015625, 0.068023681640625, 0.07851409912109375, 0.0890045166015625, 0.09949493408203125, 0.1099853515625, 0.12047576904296875, 0.1309661865234375, 0.14145660400390625, 0.151947021484375, 0.16243743896484375, 0.1729278564453125, 0.18341827392578125, 0.19390869140625, 0.20439910888671875, 0.2148895263671875, 0.22537994384765625, 0.235870361328125, 0.24636077880859375, 0.2568511962890625, 0.26734161376953125, 0.27783203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 5.0, 7.0, 6.0, 13.0, 12.0, 11.0, 13.0, 19.0, 12.0, 25.0, 16.0, 22.0, 34.0, 34.0, 41.0, 45.0, 50.0, 29.0, 46.0, 34.0, 36.0, 29.0, 39.0, 32.0, 28.0, 30.0, 26.0, 33.0, 29.0, 26.0, 28.0, 39.0, 27.0, 20.0, 16.0, 19.0, 10.0, 9.0, 8.0, 9.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-2.609375, -2.532440185546875, -2.45550537109375, -2.378570556640625, -2.3016357421875, -2.224700927734375, -2.14776611328125, -2.070831298828125, -1.993896484375, -1.916961669921875, -1.84002685546875, -1.763092041015625, -1.6861572265625, -1.609222412109375, -1.53228759765625, -1.455352783203125, -1.37841796875, -1.301483154296875, -1.22454833984375, -1.147613525390625, -1.0706787109375, -0.993743896484375, -0.91680908203125, -0.839874267578125, -0.762939453125, -0.686004638671875, -0.60906982421875, -0.532135009765625, -0.4552001953125, -0.378265380859375, -0.30133056640625, -0.224395751953125, -0.1474609375, -0.070526123046875, 0.00640869140625, 0.083343505859375, 0.1602783203125, 0.237213134765625, 0.31414794921875, 0.391082763671875, 0.468017578125, 0.544952392578125, 0.62188720703125, 0.698822021484375, 0.7757568359375, 0.852691650390625, 0.92962646484375, 1.006561279296875, 1.08349609375, 1.160430908203125, 1.23736572265625, 1.314300537109375, 1.3912353515625, 1.468170166015625, 1.54510498046875, 1.622039794921875, 1.698974609375, 1.775909423828125, 1.85284423828125, 1.929779052734375, 2.0067138671875, 2.083648681640625, 2.16058349609375, 2.237518310546875, 2.314453125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 4.0, 11.0, 28.0, 13.0, 31.0, 39.0, 80.0, 98.0, 145.0, 261.0, 375.0, 625.0, 1033.0, 1892.0, 3760.0, 8173.0, 20007.0, 75853.0, 859439.0, 46672.0, 15879.0, 6871.0, 3249.0, 1599.0, 880.0, 563.0, 323.0, 209.0, 119.0, 90.0, 69.0, 41.0, 39.0, 31.0, 16.0, 9.0, 5.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2973480224609375, -1.261688232421875, -1.2260284423828125, -1.19036865234375, -1.1547088623046875, -1.119049072265625, -1.0833892822265625, -1.0477294921875, -1.0120697021484375, -0.976409912109375, -0.9407501220703125, -0.90509033203125, -0.8694305419921875, -0.833770751953125, -0.7981109619140625, -0.762451171875, -0.7267913818359375, -0.691131591796875, -0.6554718017578125, -0.61981201171875, -0.5841522216796875, -0.548492431640625, -0.5128326416015625, -0.4771728515625, -0.4415130615234375, -0.405853271484375, -0.3701934814453125, -0.33453369140625, -0.2988739013671875, -0.263214111328125, -0.2275543212890625, -0.19189453125, -0.1562347412109375, -0.120574951171875, -0.0849151611328125, -0.04925537109375, -0.0135955810546875, 0.022064208984375, 0.0577239990234375, 0.0933837890625, 0.1290435791015625, 0.164703369140625, 0.2003631591796875, 0.23602294921875, 0.2716827392578125, 0.307342529296875, 0.3430023193359375, 0.378662109375, 0.4143218994140625, 0.449981689453125, 0.4856414794921875, 0.52130126953125, 0.5569610595703125, 0.592620849609375, 0.6282806396484375, 0.6639404296875, 0.6996002197265625, 0.735260009765625, 0.7709197998046875, 0.80657958984375, 0.8422393798828125, 0.877899169921875, 0.9135589599609375, 0.94921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 8.0, 13.0, 12.0, 14.0, 17.0, 20.0, 20.0, 26.0, 25.0, 29.0, 30.0, 32.0, 30.0, 39.0, 31.0, 31.0, 38.0, 43.0, 33.0, 49.0, 38.0, 31.0, 28.0, 43.0, 26.0, 35.0, 35.0, 24.0, 36.0, 20.0, 19.0, 26.0, 18.0, 5.0, 10.0, 9.0, 14.0, 12.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6064453125, -1.558135986328125, -1.50982666015625, -1.461517333984375, -1.4132080078125, -1.364898681640625, -1.31658935546875, -1.268280029296875, -1.219970703125, -1.171661376953125, -1.12335205078125, -1.075042724609375, -1.0267333984375, -0.978424072265625, -0.93011474609375, -0.881805419921875, -0.83349609375, -0.785186767578125, -0.73687744140625, -0.688568115234375, -0.6402587890625, -0.591949462890625, -0.54364013671875, -0.495330810546875, -0.447021484375, -0.398712158203125, -0.35040283203125, -0.302093505859375, -0.2537841796875, -0.205474853515625, -0.15716552734375, -0.108856201171875, -0.060546875, -0.012237548828125, 0.03607177734375, 0.084381103515625, 0.1326904296875, 0.180999755859375, 0.22930908203125, 0.277618408203125, 0.325927734375, 0.374237060546875, 0.42254638671875, 0.470855712890625, 0.5191650390625, 0.567474365234375, 0.61578369140625, 0.664093017578125, 0.71240234375, 0.760711669921875, 0.80902099609375, 0.857330322265625, 0.9056396484375, 0.953948974609375, 1.00225830078125, 1.050567626953125, 1.098876953125, 1.147186279296875, 1.19549560546875, 1.243804931640625, 1.2921142578125, 1.340423583984375, 1.38873291015625, 1.437042236328125, 1.4853515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 9.0, 18.0, 14.0, 23.0, 39.0, 51.0, 76.0, 83.0, 137.0, 165.0, 300.0, 489.0, 799.0, 1275.0, 2336.0, 4387.0, 8698.0, 18496.0, 54712.0, 886998.0, 38410.0, 15121.0, 7190.0, 3663.0, 1967.0, 1105.0, 685.0, 432.0, 266.0, 179.0, 123.0, 70.0, 49.0, 40.0, 23.0, 20.0, 21.0, 13.0, 10.0, 8.0, 7.0, 8.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.275146484375, -0.2669029235839844, -0.25865936279296875, -0.2504158020019531, -0.2421722412109375, -0.23392868041992188, -0.22568511962890625, -0.21744155883789062, -0.209197998046875, -0.20095443725585938, -0.19271087646484375, -0.18446731567382812, -0.1762237548828125, -0.16798019409179688, -0.15973663330078125, -0.15149307250976562, -0.14324951171875, -0.13500595092773438, -0.12676239013671875, -0.11851882934570312, -0.1102752685546875, -0.10203170776367188, -0.09378814697265625, -0.08554458618164062, -0.077301025390625, -0.06905746459960938, -0.06081390380859375, -0.052570343017578125, -0.0443267822265625, -0.036083221435546875, -0.02783966064453125, -0.019596099853515625, -0.0113525390625, -0.003108978271484375, 0.00513458251953125, 0.013378143310546875, 0.0216217041015625, 0.029865264892578125, 0.03810882568359375, 0.046352386474609375, 0.054595947265625, 0.06283950805664062, 0.07108306884765625, 0.07932662963867188, 0.0875701904296875, 0.09581375122070312, 0.10405731201171875, 0.11230087280273438, 0.12054443359375, 0.12878799438476562, 0.13703155517578125, 0.14527511596679688, 0.1535186767578125, 0.16176223754882812, 0.17000579833984375, 0.17824935913085938, 0.186492919921875, 0.19473648071289062, 0.20298004150390625, 0.21122360229492188, 0.2194671630859375, 0.22771072387695312, 0.23595428466796875, 0.24419784545898438, 0.25244140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 8.0, 9.0, 10.0, 19.0, 21.0, 21.0, 34.0, 30.0, 41.0, 33.0, 52.0, 39.0, 53.0, 51.0, 63.0, 64.0, 57.0, 57.0, 38.0, 52.0, 36.0, 34.0, 29.0, 27.0, 24.0, 12.0, 18.0, 11.0, 10.0, 9.0, 10.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1961669921875e-05, -4.06922772526741e-05, -3.9422884583473206e-05, -3.815349191427231e-05, -3.688409924507141e-05, -3.5614706575870514e-05, -3.434531390666962e-05, -3.307592123746872e-05, -3.180652856826782e-05, -3.0537135899066925e-05, -2.9267743229866028e-05, -2.799835056066513e-05, -2.6728957891464233e-05, -2.5459565222263336e-05, -2.419017255306244e-05, -2.2920779883861542e-05, -2.1651387214660645e-05, -2.0381994545459747e-05, -1.911260187625885e-05, -1.7843209207057953e-05, -1.6573816537857056e-05, -1.530442386865616e-05, -1.4035031199455261e-05, -1.2765638530254364e-05, -1.1496245861053467e-05, -1.022685319185257e-05, -8.957460522651672e-06, -7.688067853450775e-06, -6.418675184249878e-06, -5.149282515048981e-06, -3.8798898458480835e-06, -2.6104971766471863e-06, -1.341104507446289e-06, -7.171183824539185e-08, 1.1976808309555054e-06, 2.4670735001564026e-06, 3.7364661693573e-06, 5.005858838558197e-06, 6.275251507759094e-06, 7.5446441769599915e-06, 8.814036846160889e-06, 1.0083429515361786e-05, 1.1352822184562683e-05, 1.262221485376358e-05, 1.3891607522964478e-05, 1.5161000192165375e-05, 1.6430392861366272e-05, 1.769978553056717e-05, 1.8969178199768066e-05, 2.0238570868968964e-05, 2.150796353816986e-05, 2.2777356207370758e-05, 2.4046748876571655e-05, 2.5316141545772552e-05, 2.658553421497345e-05, 2.7854926884174347e-05, 2.9124319553375244e-05, 3.039371222257614e-05, 3.166310489177704e-05, 3.2932497560977936e-05, 3.420189023017883e-05, 3.547128289937973e-05, 3.674067556858063e-05, 3.8010068237781525e-05, 3.927946090698242e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 6.0, 13.0, 13.0, 21.0, 22.0, 28.0, 41.0, 50.0, 69.0, 78.0, 142.0, 211.0, 273.0, 384.0, 579.0, 862.0, 1117.0, 1807.0, 2723.0, 4531.0, 7361.0, 12519.0, 22290.0, 39328.0, 70702.0, 123129.0, 189927.0, 208815.0, 151944.0, 90199.0, 50321.0, 28339.0, 15918.0, 9122.0, 5512.0, 3421.0, 2218.0, 1374.0, 921.0, 594.0, 413.0, 362.0, 223.0, 163.0, 139.0, 86.0, 77.0, 56.0, 32.0, 20.0, 19.0, 17.0, 12.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07623291015625, -0.0737905502319336, -0.07134819030761719, -0.06890583038330078, -0.06646347045898438, -0.06402111053466797, -0.06157875061035156, -0.059136390686035156, -0.05669403076171875, -0.054251670837402344, -0.05180931091308594, -0.04936695098876953, -0.046924591064453125, -0.04448223114013672, -0.04203987121582031, -0.039597511291503906, -0.0371551513671875, -0.034712791442871094, -0.03227043151855469, -0.02982807159423828, -0.027385711669921875, -0.02494335174560547, -0.022500991821289062, -0.020058631896972656, -0.01761627197265625, -0.015173912048339844, -0.012731552124023438, -0.010289192199707031, -0.007846832275390625, -0.005404472351074219, -0.0029621124267578125, -0.0005197525024414062, 0.001922607421875, 0.004364967346191406, 0.0068073272705078125, 0.009249687194824219, 0.011692047119140625, 0.014134407043457031, 0.016576766967773438, 0.019019126892089844, 0.02146148681640625, 0.023903846740722656, 0.026346206665039062, 0.02878856658935547, 0.031230926513671875, 0.03367328643798828, 0.03611564636230469, 0.038558006286621094, 0.0410003662109375, 0.043442726135253906, 0.04588508605957031, 0.04832744598388672, 0.050769805908203125, 0.05321216583251953, 0.05565452575683594, 0.058096885681152344, 0.06053924560546875, 0.06298160552978516, 0.06542396545410156, 0.06786632537841797, 0.07030868530273438, 0.07275104522705078, 0.07519340515136719, 0.0776357650756836, 0.080078125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 7.0, 6.0, 15.0, 15.0, 16.0, 26.0, 19.0, 32.0, 27.0, 48.0, 50.0, 50.0, 66.0, 68.0, 52.0, 75.0, 74.0, 57.0, 59.0, 47.0, 44.0, 29.0, 28.0, 21.0, 13.0, 16.0, 9.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0164947509765625, -0.015921354293823242, -0.015347957611083984, -0.014774560928344727, -0.014201164245605469, -0.013627767562866211, -0.013054370880126953, -0.012480974197387695, -0.011907577514648438, -0.01133418083190918, -0.010760784149169922, -0.010187387466430664, -0.009613990783691406, -0.009040594100952148, -0.00846719741821289, -0.007893800735473633, -0.007320404052734375, -0.006747007369995117, -0.006173610687255859, -0.0056002140045166016, -0.005026817321777344, -0.004453420639038086, -0.003880023956298828, -0.0033066272735595703, -0.0027332305908203125, -0.0021598339080810547, -0.0015864372253417969, -0.001013040542602539, -0.00043964385986328125, 0.00013375282287597656, 0.0007071495056152344, 0.0012805461883544922, 0.00185394287109375, 0.002427339553833008, 0.0030007362365722656, 0.0035741329193115234, 0.004147529602050781, 0.004720926284790039, 0.005294322967529297, 0.005867719650268555, 0.0064411163330078125, 0.00701451301574707, 0.007587909698486328, 0.008161306381225586, 0.008734703063964844, 0.009308099746704102, 0.00988149642944336, 0.010454893112182617, 0.011028289794921875, 0.011601686477661133, 0.01217508316040039, 0.012748479843139648, 0.013321876525878906, 0.013895273208618164, 0.014468669891357422, 0.01504206657409668, 0.015615463256835938, 0.016188859939575195, 0.016762256622314453, 0.01733565330505371, 0.01790904998779297, 0.018482446670532227, 0.019055843353271484, 0.019629240036010742, 0.02020263671875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 17.0, 11.0, 17.0, 23.0, 26.0, 23.0, 29.0, 37.0, 50.0, 36.0, 47.0, 51.0, 62.0, 77.0, 56.0, 62.0, 42.0, 47.0, 51.0, 29.0, 33.0, 24.0, 21.0, 19.0, 18.0, 16.0, 11.0, 5.0, 14.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.703352451324463, -4.567334175109863, -4.431316375732422, -4.295298099517822, -4.159279823303223, -4.023262023925781, -3.8872437477111816, -3.751225709915161, -3.6152076721191406, -3.47918963432312, -3.3431715965270996, -3.2071533203125, -3.0711352825164795, -2.935117244720459, -2.7990989685058594, -2.663080930709839, -2.5270628929138184, -2.391044855117798, -2.2550268173217773, -2.1190085411071777, -1.9829905033111572, -1.8469724655151367, -1.7109543085098267, -1.5749361515045166, -1.438918113708496, -1.3029000759124756, -1.1668819189071655, -1.0308637619018555, -0.894845724105835, -0.7588276267051697, -0.6228095293045044, -0.4867914319038391, -0.35077333450317383, -0.21475523710250854, -0.07873713970184326, 0.05728095769882202, 0.1932990550994873, 0.3293171525001526, 0.46533524990081787, 0.6013533473014832, 0.7373714447021484, 0.8733895421028137, 1.009407639503479, 1.145425796508789, 1.2814438343048096, 1.41746187210083, 1.5534800291061401, 1.6894981861114502, 1.8255162239074707, 1.9615342617034912, 2.0975522994995117, 2.2335705757141113, 2.369588613510132, 2.5056066513061523, 2.641624927520752, 2.7776429653167725, 2.913661003112793, 3.0496790409088135, 3.185697078704834, 3.3217153549194336, 3.457733392715454, 3.5937514305114746, 3.729769706726074, 3.8657877445220947, 4.001805782318115]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 1.0, 1.0, 10.0, 10.0, 2.0, 6.0, 21.0, 17.0, 14.0, 14.0, 19.0, 21.0, 24.0, 22.0, 23.0, 38.0, 30.0, 47.0, 35.0, 34.0, 49.0, 51.0, 42.0, 41.0, 31.0, 41.0, 34.0, 26.0, 31.0, 29.0, 31.0, 29.0, 27.0, 30.0, 18.0, 15.0, 15.0, 11.0, 8.0, 18.0, 13.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3029496669769287, -2.2345986366271973, -2.1662473678588867, -2.0978963375091553, -2.0295450687408447, -1.9611940383911133, -1.8928428888320923, -1.8244917392730713, -1.7561405897140503, -1.6877894401550293, -1.6194382905960083, -1.5510871410369873, -1.4827361106872559, -1.4143848419189453, -1.3460338115692139, -1.2776826620101929, -1.2093315124511719, -1.1409803628921509, -1.0726292133331299, -1.0042780637741089, -0.9359269738197327, -0.8675758242607117, -0.7992247343063354, -0.7308735847473145, -0.6625224351882935, -0.5941712856292725, -0.5258201360702515, -0.45746904611587524, -0.38911789655685425, -0.32076674699783325, -0.25241562724113464, -0.18406450748443604, -0.11571335792541504, -0.04736222326755524, 0.020988911390304565, 0.08934004604816437, 0.15769118070602417, 0.22604233026504517, 0.2943934500217438, 0.3627445697784424, 0.4310957193374634, 0.4994468688964844, 0.5677980184555054, 0.6361491084098816, 0.7045002579689026, 0.7728514075279236, 0.8412024974822998, 0.9095536470413208, 0.9779047966003418, 1.0462559461593628, 1.1146070957183838, 1.1829582452774048, 1.2513093948364258, 1.3196604251861572, 1.3880115747451782, 1.4563627243041992, 1.5247138738632202, 1.5930650234222412, 1.6614161729812622, 1.7297673225402832, 1.7981183528900146, 1.8664696216583252, 1.9348206520080566, 2.003171920776367, 2.0715229511260986]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 16.0, 20.0, 33.0, 52.0, 104.0, 145.0, 233.0, 400.0, 685.0, 1169.0, 1926.0, 3260.0, 5428.0, 9318.0, 15524.0, 25828.0, 42270.0, 65918.0, 95814.0, 126941.0, 145913.0, 143131.0, 120443.0, 88683.0, 59615.0, 38254.0, 23097.0, 14061.0, 8248.0, 4847.0, 2863.0, 1707.0, 1088.0, 605.0, 349.0, 234.0, 107.0, 83.0, 60.0, 28.0, 19.0, 10.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.77349853515625, -2.6837158203125, -2.59393310546875, -2.504150390625, -2.41436767578125, -2.3245849609375, -2.23480224609375, -2.14501953125, -2.05523681640625, -1.9654541015625, -1.87567138671875, -1.785888671875, -1.69610595703125, -1.6063232421875, -1.51654052734375, -1.4267578125, -1.33697509765625, -1.2471923828125, -1.15740966796875, -1.067626953125, -0.97784423828125, -0.8880615234375, -0.79827880859375, -0.70849609375, -0.61871337890625, -0.5289306640625, -0.43914794921875, -0.349365234375, -0.25958251953125, -0.1697998046875, -0.08001708984375, 0.009765625, 0.09954833984375, 0.1893310546875, 0.27911376953125, 0.368896484375, 0.45867919921875, 0.5484619140625, 0.63824462890625, 0.72802734375, 0.81781005859375, 0.9075927734375, 0.99737548828125, 1.087158203125, 1.17694091796875, 1.2667236328125, 1.35650634765625, 1.4462890625, 1.53607177734375, 1.6258544921875, 1.71563720703125, 1.805419921875, 1.89520263671875, 1.9849853515625, 2.07476806640625, 2.16455078125, 2.25433349609375, 2.3441162109375, 2.43389892578125, 2.523681640625, 2.61346435546875, 2.7032470703125, 2.79302978515625, 2.8828125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 2.0, 6.0, 8.0, 11.0, 13.0, 7.0, 9.0, 12.0, 21.0, 17.0, 24.0, 30.0, 30.0, 28.0, 35.0, 30.0, 40.0, 54.0, 51.0, 47.0, 39.0, 52.0, 52.0, 32.0, 41.0, 43.0, 32.0, 36.0, 33.0, 24.0, 22.0, 16.0, 27.0, 17.0, 11.0, 12.0, 7.0, 7.0, 8.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.783203125, -2.69830322265625, -2.6134033203125, -2.52850341796875, -2.443603515625, -2.35870361328125, -2.2738037109375, -2.18890380859375, -2.10400390625, -2.01910400390625, -1.9342041015625, -1.84930419921875, -1.764404296875, -1.67950439453125, -1.5946044921875, -1.50970458984375, -1.4248046875, -1.33990478515625, -1.2550048828125, -1.17010498046875, -1.085205078125, -1.00030517578125, -0.9154052734375, -0.83050537109375, -0.74560546875, -0.66070556640625, -0.5758056640625, -0.49090576171875, -0.406005859375, -0.32110595703125, -0.2362060546875, -0.15130615234375, -0.06640625, 0.01849365234375, 0.1033935546875, 0.18829345703125, 0.273193359375, 0.35809326171875, 0.4429931640625, 0.52789306640625, 0.61279296875, 0.69769287109375, 0.7825927734375, 0.86749267578125, 0.952392578125, 1.03729248046875, 1.1221923828125, 1.20709228515625, 1.2919921875, 1.37689208984375, 1.4617919921875, 1.54669189453125, 1.631591796875, 1.71649169921875, 1.8013916015625, 1.88629150390625, 1.97119140625, 2.05609130859375, 2.1409912109375, 2.22589111328125, 2.310791015625, 2.39569091796875, 2.4805908203125, 2.56549072265625, 2.650390625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [7.0, 4.0, 10.0, 7.0, 9.0, 17.0, 24.0, 31.0, 47.0, 73.0, 103.0, 185.0, 257.0, 328.0, 540.0, 869.0, 1343.0, 1948.0, 3217.0, 4800.0, 7691.0, 11740.0, 18029.0, 26917.0, 39656.0, 56290.0, 76811.0, 98115.0, 115070.0, 121740.0, 115073.0, 98111.0, 76621.0, 56326.0, 39183.0, 26356.0, 17872.0, 11873.0, 7636.0, 4804.0, 3134.0, 1936.0, 1287.0, 846.0, 551.0, 377.0, 236.0, 157.0, 111.0, 56.0, 53.0, 30.0, 19.0, 13.0, 7.0, 7.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.353515625, -2.273712158203125, -2.19390869140625, -2.114105224609375, -2.0343017578125, -1.954498291015625, -1.87469482421875, -1.794891357421875, -1.715087890625, -1.635284423828125, -1.55548095703125, -1.475677490234375, -1.3958740234375, -1.316070556640625, -1.23626708984375, -1.156463623046875, -1.07666015625, -0.996856689453125, -0.91705322265625, -0.837249755859375, -0.7574462890625, -0.677642822265625, -0.59783935546875, -0.518035888671875, -0.438232421875, -0.358428955078125, -0.27862548828125, -0.198822021484375, -0.1190185546875, -0.039215087890625, 0.04058837890625, 0.120391845703125, 0.2001953125, 0.279998779296875, 0.35980224609375, 0.439605712890625, 0.5194091796875, 0.599212646484375, 0.67901611328125, 0.758819580078125, 0.838623046875, 0.918426513671875, 0.99822998046875, 1.078033447265625, 1.1578369140625, 1.237640380859375, 1.31744384765625, 1.397247314453125, 1.47705078125, 1.556854248046875, 1.63665771484375, 1.716461181640625, 1.7962646484375, 1.876068115234375, 1.95587158203125, 2.035675048828125, 2.115478515625, 2.195281982421875, 2.27508544921875, 2.354888916015625, 2.4346923828125, 2.514495849609375, 2.59429931640625, 2.674102783203125, 2.75390625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 8.0, 11.0, 12.0, 12.0, 27.0, 18.0, 25.0, 27.0, 25.0, 23.0, 32.0, 38.0, 41.0, 45.0, 49.0, 57.0, 38.0, 38.0, 42.0, 47.0, 33.0, 43.0, 30.0, 30.0, 32.0, 40.0, 23.0, 29.0, 14.0, 14.0, 9.0, 16.0, 14.0, 15.0, 12.0, 8.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341796875, -1.4817047119140625, -1.429229736328125, -1.3767547607421875, -1.32427978515625, -1.2718048095703125, -1.219329833984375, -1.1668548583984375, -1.1143798828125, -1.0619049072265625, -1.009429931640625, -0.9569549560546875, -0.90447998046875, -0.8520050048828125, -0.799530029296875, -0.7470550537109375, -0.694580078125, -0.6421051025390625, -0.589630126953125, -0.5371551513671875, -0.48468017578125, -0.4322052001953125, -0.379730224609375, -0.3272552490234375, -0.2747802734375, -0.2223052978515625, -0.169830322265625, -0.1173553466796875, -0.06488037109375, -0.0124053955078125, 0.040069580078125, 0.0925445556640625, 0.14501953125, 0.1974945068359375, 0.249969482421875, 0.3024444580078125, 0.35491943359375, 0.4073944091796875, 0.459869384765625, 0.5123443603515625, 0.5648193359375, 0.6172943115234375, 0.669769287109375, 0.7222442626953125, 0.77471923828125, 0.8271942138671875, 0.879669189453125, 0.9321441650390625, 0.984619140625, 1.0370941162109375, 1.089569091796875, 1.1420440673828125, 1.19451904296875, 1.2469940185546875, 1.299468994140625, 1.3519439697265625, 1.4044189453125, 1.4568939208984375, 1.509368896484375, 1.5618438720703125, 1.61431884765625, 1.6667938232421875, 1.719268798828125, 1.7717437744140625, 1.82421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 12.0, 13.0, 19.0, 19.0, 38.0, 58.0, 101.0, 138.0, 169.0, 271.0, 376.0, 576.0, 891.0, 1442.0, 2243.0, 3948.0, 7350.0, 14212.0, 29975.0, 67393.0, 149151.0, 262970.0, 252250.0, 136940.0, 60883.0, 27424.0, 13226.0, 6649.0, 3808.0, 2159.0, 1301.0, 831.0, 587.0, 356.0, 223.0, 182.0, 117.0, 91.0, 45.0, 40.0, 24.0, 21.0, 9.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.65234375, -3.5343017578125, -3.416259765625, -3.2982177734375, -3.18017578125, -3.0621337890625, -2.944091796875, -2.8260498046875, -2.7080078125, -2.5899658203125, -2.471923828125, -2.3538818359375, -2.23583984375, -2.1177978515625, -1.999755859375, -1.8817138671875, -1.763671875, -1.6456298828125, -1.527587890625, -1.4095458984375, -1.29150390625, -1.1734619140625, -1.055419921875, -0.9373779296875, -0.8193359375, -0.7012939453125, -0.583251953125, -0.4652099609375, -0.34716796875, -0.2291259765625, -0.111083984375, 0.0069580078125, 0.125, 0.2430419921875, 0.361083984375, 0.4791259765625, 0.59716796875, 0.7152099609375, 0.833251953125, 0.9512939453125, 1.0693359375, 1.1873779296875, 1.305419921875, 1.4234619140625, 1.54150390625, 1.6595458984375, 1.777587890625, 1.8956298828125, 2.013671875, 2.1317138671875, 2.249755859375, 2.3677978515625, 2.48583984375, 2.6038818359375, 2.721923828125, 2.8399658203125, 2.9580078125, 3.0760498046875, 3.194091796875, 3.3121337890625, 3.43017578125, 3.5482177734375, 3.666259765625, 3.7843017578125, 3.90234375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 6.0, 12.0, 12.0, 19.0, 41.0, 75.0, 86.0, 126.0, 133.0, 142.0, 125.0, 68.0, 43.0, 32.0, 15.0, 13.0, 14.0, 8.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006952285766601562, -0.0006757825613021851, -0.0006563365459442139, -0.0006368905305862427, -0.0006174445152282715, -0.0005979984998703003, -0.0005785524845123291, -0.0005591064691543579, -0.0005396604537963867, -0.0005202144384384155, -0.0005007684230804443, -0.00048132240772247314, -0.00046187639236450195, -0.00044243037700653076, -0.00042298436164855957, -0.0004035383462905884, -0.0003840923309326172, -0.000364646315574646, -0.0003452003002166748, -0.0003257542848587036, -0.0003063082695007324, -0.00028686225414276123, -0.00026741623878479004, -0.00024797022342681885, -0.00022852420806884766, -0.00020907819271087646, -0.00018963217735290527, -0.00017018616199493408, -0.0001507401466369629, -0.0001312941312789917, -0.00011184811592102051, -9.240210056304932e-05, -7.295608520507812e-05, -5.3510069847106934e-05, -3.406405448913574e-05, -1.461803913116455e-05, 4.827976226806641e-06, 2.4273991584777832e-05, 4.3720006942749023e-05, 6.316602230072021e-05, 8.26120376586914e-05, 0.0001020580530166626, 0.00012150406837463379, 0.00014095008373260498, 0.00016039609909057617, 0.00017984211444854736, 0.00019928812980651855, 0.00021873414516448975, 0.00023818016052246094, 0.00025762617588043213, 0.0002770721912384033, 0.0002965182065963745, 0.0003159642219543457, 0.0003354102373123169, 0.0003548562526702881, 0.0003743022680282593, 0.00039374828338623047, 0.00041319429874420166, 0.00043264031410217285, 0.00045208632946014404, 0.00047153234481811523, 0.0004909783601760864, 0.0005104243755340576, 0.0005298703908920288, 0.00054931640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 7.0, 4.0, 9.0, 9.0, 13.0, 18.0, 28.0, 51.0, 43.0, 68.0, 108.0, 156.0, 252.0, 335.0, 451.0, 677.0, 1043.0, 1639.0, 2499.0, 4097.0, 6827.0, 11936.0, 21632.0, 39723.0, 73011.0, 129017.0, 193036.0, 207174.0, 152723.0, 89910.0, 49047.0, 26647.0, 14712.0, 8121.0, 4901.0, 3002.0, 1853.0, 1173.0, 828.0, 538.0, 386.0, 267.0, 170.0, 127.0, 87.0, 62.0, 50.0, 22.0, 31.0, 11.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.431640625, -2.3536376953125, -2.275634765625, -2.1976318359375, -2.11962890625, -2.0416259765625, -1.963623046875, -1.8856201171875, -1.8076171875, -1.7296142578125, -1.651611328125, -1.5736083984375, -1.49560546875, -1.4176025390625, -1.339599609375, -1.2615966796875, -1.18359375, -1.1055908203125, -1.027587890625, -0.9495849609375, -0.87158203125, -0.7935791015625, -0.715576171875, -0.6375732421875, -0.5595703125, -0.4815673828125, -0.403564453125, -0.3255615234375, -0.24755859375, -0.1695556640625, -0.091552734375, -0.0135498046875, 0.064453125, 0.1424560546875, 0.220458984375, 0.2984619140625, 0.37646484375, 0.4544677734375, 0.532470703125, 0.6104736328125, 0.6884765625, 0.7664794921875, 0.844482421875, 0.9224853515625, 1.00048828125, 1.0784912109375, 1.156494140625, 1.2344970703125, 1.3125, 1.3905029296875, 1.468505859375, 1.5465087890625, 1.62451171875, 1.7025146484375, 1.780517578125, 1.8585205078125, 1.9365234375, 2.0145263671875, 2.092529296875, 2.1705322265625, 2.24853515625, 2.3265380859375, 2.404541015625, 2.4825439453125, 2.560546875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 0.0, 8.0, 10.0, 11.0, 17.0, 16.0, 27.0, 33.0, 38.0, 49.0, 44.0, 54.0, 58.0, 60.0, 79.0, 72.0, 66.0, 59.0, 55.0, 52.0, 23.0, 28.0, 23.0, 16.0, 14.0, 11.0, 11.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.71875, -0.696044921875, -0.67333984375, -0.650634765625, -0.6279296875, -0.605224609375, -0.58251953125, -0.559814453125, -0.537109375, -0.514404296875, -0.49169921875, -0.468994140625, -0.4462890625, -0.423583984375, -0.40087890625, -0.378173828125, -0.35546875, -0.332763671875, -0.31005859375, -0.287353515625, -0.2646484375, -0.241943359375, -0.21923828125, -0.196533203125, -0.173828125, -0.151123046875, -0.12841796875, -0.105712890625, -0.0830078125, -0.060302734375, -0.03759765625, -0.014892578125, 0.0078125, 0.030517578125, 0.05322265625, 0.075927734375, 0.0986328125, 0.121337890625, 0.14404296875, 0.166748046875, 0.189453125, 0.212158203125, 0.23486328125, 0.257568359375, 0.2802734375, 0.302978515625, 0.32568359375, 0.348388671875, 0.37109375, 0.393798828125, 0.41650390625, 0.439208984375, 0.4619140625, 0.484619140625, 0.50732421875, 0.530029296875, 0.552734375, 0.575439453125, 0.59814453125, 0.620849609375, 0.6435546875, 0.666259765625, 0.68896484375, 0.711669921875, 0.734375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 10.0, 13.0, 14.0, 16.0, 12.0, 29.0, 17.0, 30.0, 33.0, 34.0, 48.0, 37.0, 61.0, 58.0, 61.0, 57.0, 66.0, 66.0, 46.0, 49.0, 38.0, 35.0, 27.0, 19.0, 22.0, 23.0, 7.0, 7.0, 13.0, 4.0, 11.0, 11.0, 7.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.617569446563721, -4.47745418548584, -4.337339401245117, -4.197224140167236, -4.0571088790893555, -3.9169936180114746, -3.776878595352173, -3.636763572692871, -3.4966483116149902, -3.3565330505371094, -3.2164180278778076, -3.076303005218506, -2.936187744140625, -2.796072483062744, -2.6559574604034424, -2.5158424377441406, -2.3757271766662598, -2.235611915588379, -2.095496892929077, -1.9553817510604858, -1.8152666091918945, -1.6751514673233032, -1.535036325454712, -1.3949211835861206, -1.2548060417175293, -1.114690899848938, -0.9745757579803467, -0.8344606161117554, -0.6943454742431641, -0.5542303323745728, -0.41411519050598145, -0.27400004863739014, -0.13388490676879883, 0.0062302350997924805, 0.1463453769683838, 0.2864605188369751, 0.4265756607055664, 0.5666908025741577, 0.706805944442749, 0.8469210863113403, 0.9870362281799316, 1.127151370048523, 1.2672665119171143, 1.4073816537857056, 1.5474967956542969, 1.6876119375228882, 1.8277270793914795, 1.9678422212600708, 2.107957363128662, 2.248072624206543, 2.3881876468658447, 2.5283026695251465, 2.6684179306030273, 2.808533191680908, 2.94864821434021, 3.0887632369995117, 3.2288784980773926, 3.3689937591552734, 3.509108781814575, 3.649223804473877, 3.789339065551758, 3.9294543266296387, 4.0695695877075195, 4.209684371948242, 4.349799633026123]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 9.0, 9.0, 10.0, 13.0, 17.0, 10.0, 18.0, 21.0, 33.0, 14.0, 33.0, 31.0, 38.0, 31.0, 33.0, 33.0, 43.0, 30.0, 39.0, 41.0, 38.0, 34.0, 34.0, 30.0, 40.0, 28.0, 33.0, 28.0, 31.0, 39.0, 14.0, 20.0, 15.0, 24.0, 6.0, 19.0, 11.0, 8.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-2.5560855865478516, -2.4842679500579834, -2.412450075149536, -2.340632438659668, -2.2688148021698, -2.1969971656799316, -2.1251792907714844, -2.053361654281616, -1.9815438985824585, -1.9097261428833008, -1.8379085063934326, -1.766090750694275, -1.6942729949951172, -1.622455358505249, -1.5506376028060913, -1.4788198471069336, -1.4070022106170654, -1.3351844549179077, -1.2633668184280396, -1.1915490627288818, -1.1197314262390137, -1.047913670539856, -0.9760959148406982, -0.9042782187461853, -0.8324605226516724, -0.7606428265571594, -0.6888251304626465, -0.6170073747634888, -0.5451896786689758, -0.4733719825744629, -0.40155425667762756, -0.32973653078079224, -0.2579185962677002, -0.18610088527202606, -0.11428317427635193, -0.042465463280677795, 0.029352247714996338, 0.10116994380950928, 0.1729876697063446, 0.24480539560317993, 0.31662309169769287, 0.3884407877922058, 0.46025851368904114, 0.5320762395858765, 0.6038939356803894, 0.6757116317749023, 0.7475293874740601, 0.819347083568573, 0.8911647796630859, 0.9629824757575989, 1.0348001718521118, 1.1066179275512695, 1.1784355640411377, 1.2502533197402954, 1.3220710754394531, 1.3938887119293213, 1.465706467628479, 1.5375242233276367, 1.6093418598175049, 1.6811596155166626, 1.7529773712158203, 1.8247950077056885, 1.8966127634048462, 1.968430519104004, 2.040248155593872]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 17.0, 17.0, 30.0, 26.0, 41.0, 84.0, 134.0, 181.0, 324.0, 457.0, 765.0, 1264.0, 2062.0, 3540.0, 6323.0, 11072.0, 20599.0, 39078.0, 77915.0, 164238.0, 369744.0, 805057.0, 1157518.0, 819576.0, 379241.0, 168429.0, 79440.0, 39743.0, 21030.0, 11352.0, 6233.0, 3606.0, 2044.0, 1215.0, 753.0, 441.0, 255.0, 153.0, 98.0, 72.0, 41.0, 29.0, 17.0, 7.0, 6.0, 9.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.9453125, -4.793212890625, -4.64111328125, -4.489013671875, -4.3369140625, -4.184814453125, -4.03271484375, -3.880615234375, -3.728515625, -3.576416015625, -3.42431640625, -3.272216796875, -3.1201171875, -2.968017578125, -2.81591796875, -2.663818359375, -2.51171875, -2.359619140625, -2.20751953125, -2.055419921875, -1.9033203125, -1.751220703125, -1.59912109375, -1.447021484375, -1.294921875, -1.142822265625, -0.99072265625, -0.838623046875, -0.6865234375, -0.534423828125, -0.38232421875, -0.230224609375, -0.078125, 0.073974609375, 0.22607421875, 0.378173828125, 0.5302734375, 0.682373046875, 0.83447265625, 0.986572265625, 1.138671875, 1.290771484375, 1.44287109375, 1.594970703125, 1.7470703125, 1.899169921875, 2.05126953125, 2.203369140625, 2.35546875, 2.507568359375, 2.65966796875, 2.811767578125, 2.9638671875, 3.115966796875, 3.26806640625, 3.420166015625, 3.572265625, 3.724365234375, 3.87646484375, 4.028564453125, 4.1806640625, 4.332763671875, 4.48486328125, 4.636962890625, 4.7890625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 5.0, 9.0, 16.0, 17.0, 14.0, 20.0, 23.0, 29.0, 24.0, 32.0, 35.0, 42.0, 45.0, 33.0, 35.0, 42.0, 50.0, 35.0, 45.0, 49.0, 44.0, 35.0, 31.0, 29.0, 24.0, 33.0, 22.0, 26.0, 24.0, 24.0, 15.0, 12.0, 18.0, 9.0, 7.0, 6.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.353515625, -2.2865753173828125, -2.219635009765625, -2.1526947021484375, -2.08575439453125, -2.0188140869140625, -1.951873779296875, -1.8849334716796875, -1.8179931640625, -1.7510528564453125, -1.684112548828125, -1.6171722412109375, -1.55023193359375, -1.4832916259765625, -1.416351318359375, -1.3494110107421875, -1.282470703125, -1.2155303955078125, -1.148590087890625, -1.0816497802734375, -1.01470947265625, -0.9477691650390625, -0.880828857421875, -0.8138885498046875, -0.7469482421875, -0.6800079345703125, -0.613067626953125, -0.5461273193359375, -0.47918701171875, -0.4122467041015625, -0.345306396484375, -0.2783660888671875, -0.21142578125, -0.1444854736328125, -0.077545166015625, -0.0106048583984375, 0.05633544921875, 0.1232757568359375, 0.190216064453125, 0.2571563720703125, 0.3240966796875, 0.3910369873046875, 0.457977294921875, 0.5249176025390625, 0.59185791015625, 0.6587982177734375, 0.725738525390625, 0.7926788330078125, 0.859619140625, 0.9265594482421875, 0.993499755859375, 1.0604400634765625, 1.12738037109375, 1.1943206787109375, 1.261260986328125, 1.3282012939453125, 1.3951416015625, 1.4620819091796875, 1.529022216796875, 1.5959625244140625, 1.66290283203125, 1.7298431396484375, 1.796783447265625, 1.8637237548828125, 1.9306640625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 15.0, 18.0, 15.0, 34.0, 57.0, 99.0, 138.0, 227.0, 335.0, 570.0, 937.0, 1575.0, 2800.0, 4571.0, 8458.0, 15048.0, 27894.0, 52572.0, 102349.0, 205976.0, 416428.0, 775062.0, 1021311.0, 750665.0, 398872.0, 198723.0, 98801.0, 50510.0, 26396.0, 14582.0, 7974.0, 4599.0, 2648.0, 1580.0, 907.0, 577.0, 345.0, 212.0, 132.0, 91.0, 61.0, 44.0, 21.0, 18.0, 12.0, 7.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.3359375, -5.176513671875, -5.01708984375, -4.857666015625, -4.6982421875, -4.538818359375, -4.37939453125, -4.219970703125, -4.060546875, -3.901123046875, -3.74169921875, -3.582275390625, -3.4228515625, -3.263427734375, -3.10400390625, -2.944580078125, -2.78515625, -2.625732421875, -2.46630859375, -2.306884765625, -2.1474609375, -1.988037109375, -1.82861328125, -1.669189453125, -1.509765625, -1.350341796875, -1.19091796875, -1.031494140625, -0.8720703125, -0.712646484375, -0.55322265625, -0.393798828125, -0.234375, -0.074951171875, 0.08447265625, 0.243896484375, 0.4033203125, 0.562744140625, 0.72216796875, 0.881591796875, 1.041015625, 1.200439453125, 1.35986328125, 1.519287109375, 1.6787109375, 1.838134765625, 1.99755859375, 2.156982421875, 2.31640625, 2.475830078125, 2.63525390625, 2.794677734375, 2.9541015625, 3.113525390625, 3.27294921875, 3.432373046875, 3.591796875, 3.751220703125, 3.91064453125, 4.070068359375, 4.2294921875, 4.388916015625, 4.54833984375, 4.707763671875, 4.8671875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 6.0, 6.0, 15.0, 19.0, 24.0, 30.0, 40.0, 55.0, 57.0, 52.0, 81.0, 81.0, 110.0, 121.0, 165.0, 164.0, 185.0, 219.0, 219.0, 253.0, 261.0, 255.0, 232.0, 201.0, 179.0, 186.0, 147.0, 119.0, 103.0, 81.0, 66.0, 67.0, 61.0, 39.0, 33.0, 34.0, 19.0, 16.0, 10.0, 10.0, 10.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 3.0], "bins": [-1.19921875, -1.161041259765625, -1.12286376953125, -1.084686279296875, -1.0465087890625, -1.008331298828125, -0.97015380859375, -0.931976318359375, -0.893798828125, -0.855621337890625, -0.81744384765625, -0.779266357421875, -0.7410888671875, -0.702911376953125, -0.66473388671875, -0.626556396484375, -0.58837890625, -0.550201416015625, -0.51202392578125, -0.473846435546875, -0.4356689453125, -0.397491455078125, -0.35931396484375, -0.321136474609375, -0.282958984375, -0.244781494140625, -0.20660400390625, -0.168426513671875, -0.1302490234375, -0.092071533203125, -0.05389404296875, -0.015716552734375, 0.0224609375, 0.060638427734375, 0.09881591796875, 0.136993408203125, 0.1751708984375, 0.213348388671875, 0.25152587890625, 0.289703369140625, 0.327880859375, 0.366058349609375, 0.40423583984375, 0.442413330078125, 0.4805908203125, 0.518768310546875, 0.55694580078125, 0.595123291015625, 0.63330078125, 0.671478271484375, 0.70965576171875, 0.747833251953125, 0.7860107421875, 0.824188232421875, 0.86236572265625, 0.900543212890625, 0.938720703125, 0.976898193359375, 1.01507568359375, 1.053253173828125, 1.0914306640625, 1.129608154296875, 1.16778564453125, 1.205963134765625, 1.244140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 9.0, 9.0, 8.0, 8.0, 12.0, 10.0, 16.0, 23.0, 17.0, 28.0, 34.0, 34.0, 38.0, 49.0, 52.0, 56.0, 39.0, 49.0, 56.0, 46.0, 49.0, 48.0, 45.0, 46.0, 35.0, 37.0, 29.0, 15.0, 14.0, 16.0, 13.0, 15.0, 11.0, 8.0, 6.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-4.763072967529297, -4.624141216278076, -4.485208988189697, -4.346277236938477, -4.207345008850098, -4.068413257598877, -3.9294815063476562, -3.7905495166778564, -3.6516175270080566, -3.512685537338257, -3.373753547668457, -3.2348217964172363, -3.0958898067474365, -2.9569578170776367, -2.818026065826416, -2.679094076156616, -2.5401620864868164, -2.4012300968170166, -2.262298107147217, -2.123366355895996, -1.9844343662261963, -1.8455023765563965, -1.7065705060958862, -1.567638635635376, -1.4287066459655762, -1.2897746562957764, -1.1508427858352661, -1.0119109153747559, -0.872978925704956, -0.734046995639801, -0.595115065574646, -0.45618313550949097, -0.31725120544433594, -0.1783192753791809, -0.03938734531402588, 0.09954458475112915, 0.23847651481628418, 0.3774084448814392, 0.5163403749465942, 0.6552723050117493, 0.7942042350769043, 0.9331361651420593, 1.0720680952072144, 1.2109999656677246, 1.3499319553375244, 1.4888639450073242, 1.6277958154678345, 1.7667276859283447, 1.9056596755981445, 2.0445916652679443, 2.183523654937744, 2.322455406188965, 2.4613873958587646, 2.6003193855285645, 2.739251136779785, 2.878183126449585, 3.0171151161193848, 3.1560471057891846, 3.2949790954589844, 3.433910846710205, 3.572842836380005, 3.7117748260498047, 3.8507065773010254, 3.989638566970825, 4.128570556640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 11.0, 10.0, 15.0, 12.0, 9.0, 12.0, 13.0, 28.0, 28.0, 29.0, 30.0, 38.0, 38.0, 35.0, 28.0, 44.0, 49.0, 32.0, 39.0, 37.0, 32.0, 35.0, 41.0, 48.0, 37.0, 30.0, 28.0, 24.0, 20.0, 21.0, 21.0, 20.0, 15.0, 11.0, 21.0, 11.0, 9.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4725818634033203, -2.394728183746338, -2.3168742656707764, -2.239020586013794, -2.1611669063568115, -2.08331298828125, -2.0054593086242676, -1.9276056289672852, -1.8497518301010132, -1.7718980312347412, -1.6940443515777588, -1.6161905527114868, -1.5383367538452148, -1.4604830741882324, -1.3826292753219604, -1.3047754764556885, -1.226921796798706, -1.149067997932434, -1.0712143182754517, -0.9933605194091797, -0.9155067801475525, -0.8376530408859253, -0.7597992420196533, -0.6819455027580261, -0.6040917634963989, -0.5262380242347717, -0.44838425517082214, -0.37053048610687256, -0.29267674684524536, -0.21482300758361816, -0.13696923851966858, -0.059115469455718994, 0.0187380313873291, 0.09659178555011749, 0.17444553971290588, 0.25229930877685547, 0.33015304803848267, 0.40800678730010986, 0.48586055636405945, 0.563714325428009, 0.6415680646896362, 0.7194218039512634, 0.7972755432128906, 0.8751293420791626, 0.9529830813407898, 1.030836820602417, 1.108690619468689, 1.186544418334961, 1.2643980979919434, 1.3422518968582153, 1.4201055765151978, 1.4979593753814697, 1.5758130550384521, 1.6536668539047241, 1.731520652770996, 1.8093743324279785, 1.8872281312942505, 1.9650819301605225, 2.042935609817505, 2.1207892894744873, 2.198643207550049, 2.2764968872070312, 2.3543505668640137, 2.432204484939575, 2.5100581645965576]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 13.0, 14.0, 24.0, 43.0, 54.0, 93.0, 148.0, 222.0, 315.0, 506.0, 850.0, 1292.0, 1911.0, 3270.0, 4887.0, 8554.0, 14897.0, 27116.0, 50646.0, 97522.0, 178512.0, 246931.0, 186547.0, 103047.0, 53550.0, 28704.0, 15543.0, 9175.0, 5243.0, 3185.0, 2096.0, 1256.0, 808.0, 536.0, 365.0, 234.0, 146.0, 103.0, 65.0, 53.0, 24.0, 23.0, 12.0, 9.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.65673828125, -0.637725830078125, -0.61871337890625, -0.599700927734375, -0.5806884765625, -0.561676025390625, -0.54266357421875, -0.523651123046875, -0.504638671875, -0.485626220703125, -0.46661376953125, -0.447601318359375, -0.4285888671875, -0.409576416015625, -0.39056396484375, -0.371551513671875, -0.3525390625, -0.333526611328125, -0.31451416015625, -0.295501708984375, -0.2764892578125, -0.257476806640625, -0.23846435546875, -0.219451904296875, -0.200439453125, -0.181427001953125, -0.16241455078125, -0.143402099609375, -0.1243896484375, -0.105377197265625, -0.08636474609375, -0.067352294921875, -0.04833984375, -0.029327392578125, -0.01031494140625, 0.008697509765625, 0.0277099609375, 0.046722412109375, 0.06573486328125, 0.084747314453125, 0.103759765625, 0.122772216796875, 0.14178466796875, 0.160797119140625, 0.1798095703125, 0.198822021484375, 0.21783447265625, 0.236846923828125, 0.255859375, 0.274871826171875, 0.29388427734375, 0.312896728515625, 0.3319091796875, 0.350921630859375, 0.36993408203125, 0.388946533203125, 0.407958984375, 0.426971435546875, 0.44598388671875, 0.464996337890625, 0.4840087890625, 0.503021240234375, 0.52203369140625, 0.541046142578125, 0.56005859375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 12.0, 11.0, 10.0, 17.0, 17.0, 26.0, 26.0, 32.0, 43.0, 36.0, 41.0, 39.0, 50.0, 50.0, 46.0, 41.0, 43.0, 38.0, 46.0, 44.0, 36.0, 33.0, 27.0, 23.0, 32.0, 25.0, 21.0, 24.0, 14.0, 11.0, 13.0, 15.0, 6.0, 9.0, 8.0, 5.0, 7.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.34375, -3.24462890625, -3.1455078125, -3.04638671875, -2.947265625, -2.84814453125, -2.7490234375, -2.64990234375, -2.55078125, -2.45166015625, -2.3525390625, -2.25341796875, -2.154296875, -2.05517578125, -1.9560546875, -1.85693359375, -1.7578125, -1.65869140625, -1.5595703125, -1.46044921875, -1.361328125, -1.26220703125, -1.1630859375, -1.06396484375, -0.96484375, -0.86572265625, -0.7666015625, -0.66748046875, -0.568359375, -0.46923828125, -0.3701171875, -0.27099609375, -0.171875, -0.07275390625, 0.0263671875, 0.12548828125, 0.224609375, 0.32373046875, 0.4228515625, 0.52197265625, 0.62109375, 0.72021484375, 0.8193359375, 0.91845703125, 1.017578125, 1.11669921875, 1.2158203125, 1.31494140625, 1.4140625, 1.51318359375, 1.6123046875, 1.71142578125, 1.810546875, 1.90966796875, 2.0087890625, 2.10791015625, 2.20703125, 2.30615234375, 2.4052734375, 2.50439453125, 2.603515625, 2.70263671875, 2.8017578125, 2.90087890625, 3.0]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 9.0, 7.0, 9.0, 13.0, 23.0, 24.0, 20.0, 39.0, 53.0, 93.0, 101.0, 183.0, 288.0, 442.0, 749.0, 1208.0, 2079.0, 4072.0, 8481.0, 20916.0, 143793.0, 813254.0, 30291.0, 10956.0, 5045.0, 2600.0, 1400.0, 872.0, 521.0, 329.0, 214.0, 143.0, 89.0, 66.0, 54.0, 24.0, 35.0, 23.0, 14.0, 9.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.068389892578125, -2.00201416015625, -1.935638427734375, -1.8692626953125, -1.802886962890625, -1.73651123046875, -1.670135498046875, -1.603759765625, -1.537384033203125, -1.47100830078125, -1.404632568359375, -1.3382568359375, -1.271881103515625, -1.20550537109375, -1.139129638671875, -1.07275390625, -1.006378173828125, -0.94000244140625, -0.873626708984375, -0.8072509765625, -0.740875244140625, -0.67449951171875, -0.608123779296875, -0.541748046875, -0.475372314453125, -0.40899658203125, -0.342620849609375, -0.2762451171875, -0.209869384765625, -0.14349365234375, -0.077117919921875, -0.0107421875, 0.055633544921875, 0.12200927734375, 0.188385009765625, 0.2547607421875, 0.321136474609375, 0.38751220703125, 0.453887939453125, 0.520263671875, 0.586639404296875, 0.65301513671875, 0.719390869140625, 0.7857666015625, 0.852142333984375, 0.91851806640625, 0.984893798828125, 1.05126953125, 1.117645263671875, 1.18402099609375, 1.250396728515625, 1.3167724609375, 1.383148193359375, 1.44952392578125, 1.515899658203125, 1.582275390625, 1.648651123046875, 1.71502685546875, 1.781402587890625, 1.8477783203125, 1.914154052734375, 1.98052978515625, 2.046905517578125, 2.11328125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 7.0, 10.0, 9.0, 16.0, 20.0, 19.0, 22.0, 25.0, 24.0, 21.0, 29.0, 37.0, 42.0, 52.0, 53.0, 43.0, 43.0, 51.0, 47.0, 52.0, 33.0, 39.0, 38.0, 42.0, 34.0, 27.0, 20.0, 25.0, 20.0, 18.0, 15.0, 9.0, 13.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.97149658203125, -1.9019775390625, -1.83245849609375, -1.762939453125, -1.69342041015625, -1.6239013671875, -1.55438232421875, -1.48486328125, -1.41534423828125, -1.3458251953125, -1.27630615234375, -1.206787109375, -1.13726806640625, -1.0677490234375, -0.99822998046875, -0.9287109375, -0.85919189453125, -0.7896728515625, -0.72015380859375, -0.650634765625, -0.58111572265625, -0.5115966796875, -0.44207763671875, -0.37255859375, -0.30303955078125, -0.2335205078125, -0.16400146484375, -0.094482421875, -0.02496337890625, 0.0445556640625, 0.11407470703125, 0.18359375, 0.25311279296875, 0.3226318359375, 0.39215087890625, 0.461669921875, 0.53118896484375, 0.6007080078125, 0.67022705078125, 0.73974609375, 0.80926513671875, 0.8787841796875, 0.94830322265625, 1.017822265625, 1.08734130859375, 1.1568603515625, 1.22637939453125, 1.2958984375, 1.36541748046875, 1.4349365234375, 1.50445556640625, 1.573974609375, 1.64349365234375, 1.7130126953125, 1.78253173828125, 1.85205078125, 1.92156982421875, 1.9910888671875, 2.06060791015625, 2.130126953125, 2.19964599609375, 2.2691650390625, 2.33868408203125, 2.408203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 6.0, 9.0, 13.0, 4.0, 16.0, 10.0, 27.0, 43.0, 48.0, 79.0, 86.0, 157.0, 225.0, 315.0, 475.0, 725.0, 1092.0, 1873.0, 3142.0, 6158.0, 14804.0, 57839.0, 905037.0, 32810.0, 11298.0, 5070.0, 2660.0, 1561.0, 936.0, 647.0, 417.0, 301.0, 206.0, 128.0, 97.0, 58.0, 46.0, 37.0, 27.0, 18.0, 13.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6018905639648438, -0.5826873779296875, -0.5634841918945312, -0.544281005859375, -0.5250778198242188, -0.5058746337890625, -0.48667144775390625, -0.46746826171875, -0.44826507568359375, -0.4290618896484375, -0.40985870361328125, -0.390655517578125, -0.37145233154296875, -0.3522491455078125, -0.33304595947265625, -0.3138427734375, -0.29463958740234375, -0.2754364013671875, -0.25623321533203125, -0.237030029296875, -0.21782684326171875, -0.1986236572265625, -0.17942047119140625, -0.16021728515625, -0.14101409912109375, -0.1218109130859375, -0.10260772705078125, -0.083404541015625, -0.06420135498046875, -0.0449981689453125, -0.02579498291015625, -0.006591796875, 0.01261138916015625, 0.0318145751953125, 0.05101776123046875, 0.070220947265625, 0.08942413330078125, 0.1086273193359375, 0.12783050537109375, 0.14703369140625, 0.16623687744140625, 0.1854400634765625, 0.20464324951171875, 0.223846435546875, 0.24304962158203125, 0.2622528076171875, 0.28145599365234375, 0.3006591796875, 0.31986236572265625, 0.3390655517578125, 0.35826873779296875, 0.377471923828125, 0.39667510986328125, 0.4158782958984375, 0.43508148193359375, 0.45428466796875, 0.47348785400390625, 0.4926910400390625, 0.5118942260742188, 0.531097412109375, 0.5503005981445312, 0.5695037841796875, 0.5887069702148438, 0.60791015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 7.0, 2.0, 9.0, 11.0, 15.0, 18.0, 23.0, 22.0, 21.0, 20.0, 40.0, 40.0, 68.0, 75.0, 65.0, 74.0, 61.0, 53.0, 61.0, 50.0, 56.0, 33.0, 39.0, 21.0, 21.0, 14.0, 14.0, 11.0, 7.0, 6.0, 4.0, 8.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6684017181396484e-05, -5.498994141817093e-05, -5.3295865654945374e-05, -5.160178989171982e-05, -4.990771412849426e-05, -4.821363836526871e-05, -4.651956260204315e-05, -4.4825486838817596e-05, -4.313141107559204e-05, -4.1437335312366486e-05, -3.974325954914093e-05, -3.8049183785915375e-05, -3.635510802268982e-05, -3.4661032259464264e-05, -3.296695649623871e-05, -3.127288073301315e-05, -2.9578804969787598e-05, -2.7884729206562042e-05, -2.6190653443336487e-05, -2.449657768011093e-05, -2.2802501916885376e-05, -2.110842615365982e-05, -1.9414350390434265e-05, -1.772027462720871e-05, -1.6026198863983154e-05, -1.4332123100757599e-05, -1.2638047337532043e-05, -1.0943971574306488e-05, -9.249895811080933e-06, -7.555820047855377e-06, -5.861744284629822e-06, -4.167668521404266e-06, -2.473592758178711e-06, -7.795169949531555e-07, 9.145587682723999e-07, 2.6086345314979553e-06, 4.302710294723511e-06, 5.996786057949066e-06, 7.690861821174622e-06, 9.384937584400177e-06, 1.1079013347625732e-05, 1.2773089110851288e-05, 1.4467164874076843e-05, 1.61612406373024e-05, 1.7855316400527954e-05, 1.954939216375351e-05, 2.1243467926979065e-05, 2.293754369020462e-05, 2.4631619453430176e-05, 2.632569521665573e-05, 2.8019770979881287e-05, 2.9713846743106842e-05, 3.14079225063324e-05, 3.310199826955795e-05, 3.479607403278351e-05, 3.6490149796009064e-05, 3.818422555923462e-05, 3.9878301322460175e-05, 4.157237708568573e-05, 4.3266452848911285e-05, 4.496052861213684e-05, 4.6654604375362396e-05, 4.834868013858795e-05, 5.004275590181351e-05, 5.173683166503906e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 5.0, 5.0, 11.0, 15.0, 25.0, 45.0, 68.0, 96.0, 152.0, 199.0, 300.0, 536.0, 798.0, 1264.0, 1904.0, 3070.0, 4864.0, 7931.0, 13622.0, 23944.0, 47753.0, 118924.0, 319582.0, 297300.0, 106111.0, 44387.0, 22404.0, 12769.0, 7663.0, 4668.0, 2899.0, 1861.0, 1164.0, 788.0, 486.0, 276.0, 217.0, 136.0, 83.0, 77.0, 52.0, 31.0, 19.0, 12.0, 9.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.242431640625, -0.23433685302734375, -0.2262420654296875, -0.21814727783203125, -0.210052490234375, -0.20195770263671875, -0.1938629150390625, -0.18576812744140625, -0.17767333984375, -0.16957855224609375, -0.1614837646484375, -0.15338897705078125, -0.145294189453125, -0.13719940185546875, -0.1291046142578125, -0.12100982666015625, -0.1129150390625, -0.10482025146484375, -0.0967254638671875, -0.08863067626953125, -0.080535888671875, -0.07244110107421875, -0.0643463134765625, -0.05625152587890625, -0.04815673828125, -0.04006195068359375, -0.0319671630859375, -0.02387237548828125, -0.015777587890625, -0.00768280029296875, 0.0004119873046875, 0.00850677490234375, 0.0166015625, 0.02469635009765625, 0.0327911376953125, 0.04088592529296875, 0.048980712890625, 0.05707550048828125, 0.0651702880859375, 0.07326507568359375, 0.08135986328125, 0.08945465087890625, 0.0975494384765625, 0.10564422607421875, 0.113739013671875, 0.12183380126953125, 0.1299285888671875, 0.13802337646484375, 0.1461181640625, 0.15421295166015625, 0.1623077392578125, 0.17040252685546875, 0.178497314453125, 0.18659210205078125, 0.1946868896484375, 0.20278167724609375, 0.21087646484375, 0.21897125244140625, 0.2270660400390625, 0.23516082763671875, 0.243255615234375, 0.25135040283203125, 0.2594451904296875, 0.26753997802734375, 0.275634765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 9.0, 6.0, 7.0, 12.0, 8.0, 18.0, 18.0, 21.0, 22.0, 30.0, 35.0, 55.0, 85.0, 61.0, 89.0, 102.0, 81.0, 84.0, 48.0, 36.0, 24.0, 21.0, 24.0, 15.0, 9.0, 13.0, 8.0, 5.0, 4.0, 8.0, 8.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05096435546875, -0.04932594299316406, -0.047687530517578125, -0.04604911804199219, -0.04441070556640625, -0.04277229309082031, -0.041133880615234375, -0.03949546813964844, -0.0378570556640625, -0.03621864318847656, -0.034580230712890625, -0.03294181823730469, -0.03130340576171875, -0.029664993286132812, -0.028026580810546875, -0.026388168334960938, -0.024749755859375, -0.023111343383789062, -0.021472930908203125, -0.019834518432617188, -0.01819610595703125, -0.016557693481445312, -0.014919281005859375, -0.013280868530273438, -0.0116424560546875, -0.010004043579101562, -0.008365631103515625, -0.0067272186279296875, -0.00508880615234375, -0.0034503936767578125, -0.001811981201171875, -0.0001735687255859375, 0.00146484375, 0.0031032562255859375, 0.004741668701171875, 0.0063800811767578125, 0.00801849365234375, 0.009656906127929688, 0.011295318603515625, 0.012933731079101562, 0.0145721435546875, 0.016210556030273438, 0.017848968505859375, 0.019487380981445312, 0.02112579345703125, 0.022764205932617188, 0.024402618408203125, 0.026041030883789062, 0.027679443359375, 0.029317855834960938, 0.030956268310546875, 0.03259468078613281, 0.03423309326171875, 0.03587150573730469, 0.037509918212890625, 0.03914833068847656, 0.0407867431640625, 0.04242515563964844, 0.044063568115234375, 0.04570198059082031, 0.04734039306640625, 0.04897880554199219, 0.050617218017578125, 0.05225563049316406, 0.05389404296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 9.0, 6.0, 11.0, 9.0, 10.0, 17.0, 21.0, 15.0, 22.0, 41.0, 31.0, 37.0, 39.0, 56.0, 54.0, 42.0, 43.0, 52.0, 54.0, 41.0, 47.0, 50.0, 40.0, 39.0, 40.0, 33.0, 25.0, 11.0, 11.0, 14.0, 16.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.538368225097656, -4.402956008911133, -4.267544269561768, -4.132132053375244, -3.996720314025879, -3.8613083362579346, -3.7258963584899902, -3.590484142303467, -3.4550724029541016, -3.3196604251861572, -3.184248447418213, -3.0488364696502686, -2.913424491882324, -2.77801251411438, -2.6426005363464355, -2.507188320159912, -2.3717763423919678, -2.2363643646240234, -2.100952386856079, -1.9655404090881348, -1.8301284313201904, -1.694716453552246, -1.5593043565750122, -1.4238923788070679, -1.2884804010391235, -1.1530684232711792, -1.0176564455032349, -0.8822444081306458, -0.7468324303627014, -0.6114204525947571, -0.47600841522216797, -0.34059643745422363, -0.2051844596862793, -0.06977246701717377, 0.06563952565193176, 0.2010515332221985, 0.3364635109901428, 0.47187548875808716, 0.6072875261306763, 0.7426995038986206, 0.8781114816665649, 1.0135234594345093, 1.1489354372024536, 1.2843475341796875, 1.4197595119476318, 1.5551714897155762, 1.6905834674835205, 1.8259954452514648, 1.9614074230194092, 2.0968194007873535, 2.232231378555298, 2.367643356323242, 2.5030553340911865, 2.638467311859131, 2.7738795280456543, 2.9092912673950195, 3.044703483581543, 3.1801154613494873, 3.3155274391174316, 3.450939416885376, 3.5863513946533203, 3.7217633724212646, 3.857175350189209, 3.9925875663757324, 4.127999305725098]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 12.0, 11.0, 10.0, 15.0, 9.0, 15.0, 7.0, 19.0, 33.0, 25.0, 30.0, 27.0, 40.0, 34.0, 35.0, 31.0, 40.0, 48.0, 41.0, 33.0, 35.0, 35.0, 31.0, 40.0, 50.0, 37.0, 27.0, 27.0, 26.0, 18.0, 23.0, 20.0, 17.0, 14.0, 14.0, 19.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.394810438156128, -2.318641185760498, -2.2424721717834473, -2.1663029193878174, -2.0901339054107666, -2.0139646530151367, -1.9377955198287964, -1.861626386642456, -1.7854571342468262, -1.7092880010604858, -1.6331188678741455, -1.5569496154785156, -1.4807804822921753, -1.404611349105835, -1.3284422159194946, -1.2522730827331543, -1.176103949546814, -1.0999348163604736, -1.0237656831741333, -0.9475964903831482, -0.8714272975921631, -0.7952581644058228, -0.7190890312194824, -0.6429198384284973, -0.566750705242157, -0.49058154225349426, -0.41441237926483154, -0.3382432460784912, -0.2620740830898285, -0.18590492010116577, -0.10973578691482544, -0.03356659412384033, 0.0426025390625, 0.11877169460058212, 0.19494085013866425, 0.27110999822616577, 0.3472791612148285, 0.4234483242034912, 0.49961745738983154, 0.5757866501808167, 0.651955783367157, 0.7281249165534973, 0.8042941093444824, 0.8804632425308228, 0.9566323757171631, 1.032801628112793, 1.1089706420898438, 1.1851398944854736, 1.261309027671814, 1.3374781608581543, 1.4136472940444946, 1.489816427230835, 1.5659856796264648, 1.6421548128128052, 1.7183239459991455, 1.7944931983947754, 1.8706622123718262, 1.9468313455581665, 2.023000478744507, 2.0991697311401367, 2.1753387451171875, 2.2515079975128174, 2.3276772499084473, 2.403846263885498, 2.480015516281128]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 25.0, 30.0, 48.0, 78.0, 86.0, 121.0, 205.0, 309.0, 524.0, 939.0, 1610.0, 2642.0, 4895.0, 8901.0, 16857.0, 31385.0, 58225.0, 100608.0, 154838.0, 189809.0, 176991.0, 127582.0, 77803.0, 43249.0, 22905.0, 12488.0, 6612.0, 3661.0, 2078.0, 1170.0, 689.0, 421.0, 255.0, 169.0, 91.0, 71.0, 59.0, 35.0, 18.0, 11.0, 9.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.265625, -4.13128662109375, -3.9969482421875, -3.86260986328125, -3.728271484375, -3.59393310546875, -3.4595947265625, -3.32525634765625, -3.19091796875, -3.05657958984375, -2.9222412109375, -2.78790283203125, -2.653564453125, -2.51922607421875, -2.3848876953125, -2.25054931640625, -2.1162109375, -1.98187255859375, -1.8475341796875, -1.71319580078125, -1.578857421875, -1.44451904296875, -1.3101806640625, -1.17584228515625, -1.04150390625, -0.90716552734375, -0.7728271484375, -0.63848876953125, -0.504150390625, -0.36981201171875, -0.2354736328125, -0.10113525390625, 0.033203125, 0.16754150390625, 0.3018798828125, 0.43621826171875, 0.570556640625, 0.70489501953125, 0.8392333984375, 0.97357177734375, 1.10791015625, 1.24224853515625, 1.3765869140625, 1.51092529296875, 1.645263671875, 1.77960205078125, 1.9139404296875, 2.04827880859375, 2.1826171875, 2.31695556640625, 2.4512939453125, 2.58563232421875, 2.719970703125, 2.85430908203125, 2.9886474609375, 3.12298583984375, 3.25732421875, 3.39166259765625, 3.5260009765625, 3.66033935546875, 3.794677734375, 3.92901611328125, 4.0633544921875, 4.19769287109375, 4.33203125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 7.0, 9.0, 13.0, 12.0, 13.0, 19.0, 23.0, 27.0, 40.0, 31.0, 42.0, 39.0, 45.0, 49.0, 44.0, 44.0, 41.0, 35.0, 38.0, 40.0, 37.0, 41.0, 42.0, 30.0, 29.0, 40.0, 22.0, 25.0, 20.0, 10.0, 16.0, 12.0, 12.0, 11.0, 8.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.19921875, -3.10540771484375, -3.0115966796875, -2.91778564453125, -2.823974609375, -2.73016357421875, -2.6363525390625, -2.54254150390625, -2.44873046875, -2.35491943359375, -2.2611083984375, -2.16729736328125, -2.073486328125, -1.97967529296875, -1.8858642578125, -1.79205322265625, -1.6982421875, -1.60443115234375, -1.5106201171875, -1.41680908203125, -1.322998046875, -1.22918701171875, -1.1353759765625, -1.04156494140625, -0.94775390625, -0.85394287109375, -0.7601318359375, -0.66632080078125, -0.572509765625, -0.47869873046875, -0.3848876953125, -0.29107666015625, -0.197265625, -0.10345458984375, -0.0096435546875, 0.08416748046875, 0.177978515625, 0.27178955078125, 0.3656005859375, 0.45941162109375, 0.55322265625, 0.64703369140625, 0.7408447265625, 0.83465576171875, 0.928466796875, 1.02227783203125, 1.1160888671875, 1.20989990234375, 1.3037109375, 1.39752197265625, 1.4913330078125, 1.58514404296875, 1.678955078125, 1.77276611328125, 1.8665771484375, 1.96038818359375, 2.05419921875, 2.14801025390625, 2.2418212890625, 2.33563232421875, 2.429443359375, 2.52325439453125, 2.6170654296875, 2.71087646484375, 2.8046875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 17.0, 16.0, 22.0, 29.0, 54.0, 79.0, 142.0, 169.0, 318.0, 479.0, 813.0, 1300.0, 2166.0, 3702.0, 6402.0, 11074.0, 18402.0, 31268.0, 51294.0, 80654.0, 116918.0, 148935.0, 157984.0, 138826.0, 102753.0, 68981.0, 42734.0, 25952.0, 15233.0, 8960.0, 5053.0, 3093.0, 1814.0, 1077.0, 697.0, 417.0, 247.0, 150.0, 116.0, 60.0, 44.0, 31.0, 22.0, 16.0, 10.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.71484375, -3.599884033203125, -3.48492431640625, -3.369964599609375, -3.2550048828125, -3.140045166015625, -3.02508544921875, -2.910125732421875, -2.795166015625, -2.680206298828125, -2.56524658203125, -2.450286865234375, -2.3353271484375, -2.220367431640625, -2.10540771484375, -1.990447998046875, -1.87548828125, -1.760528564453125, -1.64556884765625, -1.530609130859375, -1.4156494140625, -1.300689697265625, -1.18572998046875, -1.070770263671875, -0.955810546875, -0.840850830078125, -0.72589111328125, -0.610931396484375, -0.4959716796875, -0.381011962890625, -0.26605224609375, -0.151092529296875, -0.0361328125, 0.078826904296875, 0.19378662109375, 0.308746337890625, 0.4237060546875, 0.538665771484375, 0.65362548828125, 0.768585205078125, 0.883544921875, 0.998504638671875, 1.11346435546875, 1.228424072265625, 1.3433837890625, 1.458343505859375, 1.57330322265625, 1.688262939453125, 1.80322265625, 1.918182373046875, 2.03314208984375, 2.148101806640625, 2.2630615234375, 2.378021240234375, 2.49298095703125, 2.607940673828125, 2.722900390625, 2.837860107421875, 2.95281982421875, 3.067779541015625, 3.1827392578125, 3.297698974609375, 3.41265869140625, 3.527618408203125, 3.642578125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 11.0, 12.0, 10.0, 13.0, 11.0, 13.0, 15.0, 23.0, 26.0, 26.0, 28.0, 26.0, 35.0, 33.0, 39.0, 34.0, 48.0, 36.0, 43.0, 32.0, 35.0, 31.0, 32.0, 25.0, 33.0, 27.0, 34.0, 27.0, 27.0, 20.0, 23.0, 16.0, 23.0, 14.0, 9.0, 18.0, 14.0, 3.0, 12.0, 2.0, 11.0, 8.0, 1.0, 5.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0], "bins": [-1.66796875, -1.618438720703125, -1.56890869140625, -1.519378662109375, -1.4698486328125, -1.420318603515625, -1.37078857421875, -1.321258544921875, -1.271728515625, -1.222198486328125, -1.17266845703125, -1.123138427734375, -1.0736083984375, -1.024078369140625, -0.97454833984375, -0.925018310546875, -0.87548828125, -0.825958251953125, -0.77642822265625, -0.726898193359375, -0.6773681640625, -0.627838134765625, -0.57830810546875, -0.528778076171875, -0.479248046875, -0.429718017578125, -0.38018798828125, -0.330657958984375, -0.2811279296875, -0.231597900390625, -0.18206787109375, -0.132537841796875, -0.0830078125, -0.033477783203125, 0.01605224609375, 0.065582275390625, 0.1151123046875, 0.164642333984375, 0.21417236328125, 0.263702392578125, 0.313232421875, 0.362762451171875, 0.41229248046875, 0.461822509765625, 0.5113525390625, 0.560882568359375, 0.61041259765625, 0.659942626953125, 0.70947265625, 0.759002685546875, 0.80853271484375, 0.858062744140625, 0.9075927734375, 0.957122802734375, 1.00665283203125, 1.056182861328125, 1.105712890625, 1.155242919921875, 1.20477294921875, 1.254302978515625, 1.3038330078125, 1.353363037109375, 1.40289306640625, 1.452423095703125, 1.501953125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 13.0, 20.0, 31.0, 33.0, 50.0, 55.0, 85.0, 89.0, 140.0, 158.0, 197.0, 271.0, 371.0, 463.0, 612.0, 853.0, 1121.0, 1565.0, 2179.0, 3323.0, 5623.0, 12627.0, 42964.0, 203496.0, 492337.0, 206416.0, 43399.0, 12877.0, 5642.0, 3226.0, 2102.0, 1521.0, 1102.0, 811.0, 670.0, 503.0, 379.0, 294.0, 211.0, 178.0, 146.0, 83.0, 76.0, 59.0, 49.0, 41.0, 22.0, 13.0, 15.0, 12.0, 9.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.8515625, -6.626953125, -6.40234375, -6.177734375, -5.953125, -5.728515625, -5.50390625, -5.279296875, -5.0546875, -4.830078125, -4.60546875, -4.380859375, -4.15625, -3.931640625, -3.70703125, -3.482421875, -3.2578125, -3.033203125, -2.80859375, -2.583984375, -2.359375, -2.134765625, -1.91015625, -1.685546875, -1.4609375, -1.236328125, -1.01171875, -0.787109375, -0.5625, -0.337890625, -0.11328125, 0.111328125, 0.3359375, 0.560546875, 0.78515625, 1.009765625, 1.234375, 1.458984375, 1.68359375, 1.908203125, 2.1328125, 2.357421875, 2.58203125, 2.806640625, 3.03125, 3.255859375, 3.48046875, 3.705078125, 3.9296875, 4.154296875, 4.37890625, 4.603515625, 4.828125, 5.052734375, 5.27734375, 5.501953125, 5.7265625, 5.951171875, 6.17578125, 6.400390625, 6.625, 6.849609375, 7.07421875, 7.298828125, 7.5234375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 25.0, 60.0, 102.0, 197.0, 213.0, 182.0, 96.0, 47.0, 15.0, 12.0, 5.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009016990661621094, -0.0008754655718803406, -0.0008492320775985718, -0.000822998583316803, -0.0007967650890350342, -0.0007705315947532654, -0.0007442981004714966, -0.0007180646061897278, -0.000691831111907959, -0.0006655976176261902, -0.0006393641233444214, -0.0006131306290626526, -0.0005868971347808838, -0.000560663640499115, -0.0005344301462173462, -0.0005081966519355774, -0.0004819631576538086, -0.0004557296633720398, -0.000429496169090271, -0.0004032626748085022, -0.0003770291805267334, -0.0003507956862449646, -0.0003245621919631958, -0.000298328697681427, -0.0002720952033996582, -0.0002458617091178894, -0.0002196282148361206, -0.0001933947205543518, -0.000167161226272583, -0.0001409277319908142, -0.00011469423770904541, -8.846074342727661e-05, -6.222724914550781e-05, -3.5993754863739014e-05, -9.760260581970215e-06, 1.6473233699798584e-05, 4.270672798156738e-05, 6.894022226333618e-05, 9.517371654510498e-05, 0.00012140721082687378, 0.00014764070510864258, 0.00017387419939041138, 0.00020010769367218018, 0.00022634118795394897, 0.0002525746822357178, 0.00027880817651748657, 0.00030504167079925537, 0.00033127516508102417, 0.00035750865936279297, 0.00038374215364456177, 0.00040997564792633057, 0.00043620914220809937, 0.00046244263648986816, 0.000488676130771637, 0.0005149096250534058, 0.0005411431193351746, 0.0005673766136169434, 0.0005936101078987122, 0.000619843602180481, 0.0006460770964622498, 0.0006723105907440186, 0.0006985440850257874, 0.0007247775793075562, 0.000751011073589325, 0.0007772445678710938]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 3.0, 6.0, 13.0, 15.0, 18.0, 32.0, 41.0, 47.0, 60.0, 78.0, 143.0, 179.0, 275.0, 374.0, 533.0, 739.0, 1164.0, 1742.0, 2586.0, 4005.0, 9112.0, 52654.0, 457300.0, 445733.0, 50738.0, 9014.0, 3926.0, 2631.0, 1705.0, 1159.0, 750.0, 530.0, 358.0, 267.0, 187.0, 110.0, 84.0, 73.0, 43.0, 37.0, 25.0, 21.0, 18.0, 5.0, 9.0, 5.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-9.9375, -9.6451416015625, -9.352783203125, -9.0604248046875, -8.76806640625, -8.4757080078125, -8.183349609375, -7.8909912109375, -7.5986328125, -7.3062744140625, -7.013916015625, -6.7215576171875, -6.42919921875, -6.1368408203125, -5.844482421875, -5.5521240234375, -5.259765625, -4.9674072265625, -4.675048828125, -4.3826904296875, -4.09033203125, -3.7979736328125, -3.505615234375, -3.2132568359375, -2.9208984375, -2.6285400390625, -2.336181640625, -2.0438232421875, -1.75146484375, -1.4591064453125, -1.166748046875, -0.8743896484375, -0.58203125, -0.2896728515625, 0.002685546875, 0.2950439453125, 0.58740234375, 0.8797607421875, 1.172119140625, 1.4644775390625, 1.7568359375, 2.0491943359375, 2.341552734375, 2.6339111328125, 2.92626953125, 3.2186279296875, 3.510986328125, 3.8033447265625, 4.095703125, 4.3880615234375, 4.680419921875, 4.9727783203125, 5.26513671875, 5.5574951171875, 5.849853515625, 6.1422119140625, 6.4345703125, 6.7269287109375, 7.019287109375, 7.3116455078125, 7.60400390625, 7.8963623046875, 8.188720703125, 8.4810791015625, 8.7734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 16.0, 36.0, 56.0, 108.0, 173.0, 202.0, 155.0, 113.0, 69.0, 27.0, 17.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9176177978515625, -1.847930908203125, -1.7782440185546875, -1.70855712890625, -1.6388702392578125, -1.569183349609375, -1.4994964599609375, -1.4298095703125, -1.3601226806640625, -1.290435791015625, -1.2207489013671875, -1.15106201171875, -1.0813751220703125, -1.011688232421875, -0.9420013427734375, -0.872314453125, -0.8026275634765625, -0.732940673828125, -0.6632537841796875, -0.59356689453125, -0.5238800048828125, -0.454193115234375, -0.3845062255859375, -0.3148193359375, -0.2451324462890625, -0.175445556640625, -0.1057586669921875, -0.03607177734375, 0.0336151123046875, 0.103302001953125, 0.1729888916015625, 0.24267578125, 0.3123626708984375, 0.382049560546875, 0.4517364501953125, 0.52142333984375, 0.5911102294921875, 0.660797119140625, 0.7304840087890625, 0.8001708984375, 0.8698577880859375, 0.939544677734375, 1.0092315673828125, 1.07891845703125, 1.1486053466796875, 1.218292236328125, 1.2879791259765625, 1.357666015625, 1.4273529052734375, 1.497039794921875, 1.5667266845703125, 1.63641357421875, 1.7061004638671875, 1.775787353515625, 1.8454742431640625, 1.9151611328125, 1.9848480224609375, 2.054534912109375, 2.1242218017578125, 2.19390869140625, 2.2635955810546875, 2.333282470703125, 2.4029693603515625, 2.47265625]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 8.0, 8.0, 12.0, 18.0, 16.0, 17.0, 17.0, 18.0, 35.0, 21.0, 34.0, 42.0, 39.0, 44.0, 37.0, 52.0, 51.0, 74.0, 59.0, 37.0, 35.0, 41.0, 46.0, 38.0, 29.0, 28.0, 20.0, 17.0, 11.0, 21.0, 9.0, 7.0, 10.0, 3.0, 6.0, 5.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.421260833740234, -4.286639213562012, -4.152018070220947, -4.017396450042725, -3.882775068283081, -3.7481536865234375, -3.613532066345215, -3.4789106845855713, -3.3442893028259277, -3.209667921066284, -3.0750465393066406, -2.940424919128418, -2.8058035373687744, -2.671182155609131, -2.536560535430908, -2.4019391536712646, -2.267317771911621, -2.1326963901519775, -1.9980748891830444, -1.8634533882141113, -1.7288320064544678, -1.5942106246948242, -1.4595891237258911, -1.324967622756958, -1.1903462409973145, -1.055724859237671, -0.9211033582687378, -0.7864819169044495, -0.6518604755401611, -0.5172390341758728, -0.3826175928115845, -0.24799615144729614, -0.11337423324584961, 0.02124720811843872, 0.15586864948272705, 0.2904900908470154, 0.4251115322113037, 0.559732973575592, 0.6943544149398804, 0.8289758563041687, 0.963597297668457, 1.0982186794281006, 1.2328401803970337, 1.3674616813659668, 1.5020830631256104, 1.636704444885254, 1.771325945854187, 1.9059474468231201, 2.0405688285827637, 2.1751902103424072, 2.309811592102051, 2.4444332122802734, 2.579054594039917, 2.7136759757995605, 2.848297595977783, 2.9829189777374268, 3.1175403594970703, 3.252161741256714, 3.3867831230163574, 3.52140474319458, 3.6560261249542236, 3.790647506713867, 3.92526912689209, 4.059890270233154, 4.194511890411377]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 4.0, 6.0, 7.0, 8.0, 14.0, 21.0, 22.0, 15.0, 22.0, 23.0, 26.0, 20.0, 23.0, 36.0, 37.0, 38.0, 42.0, 37.0, 40.0, 27.0, 36.0, 34.0, 37.0, 36.0, 26.0, 40.0, 35.0, 35.0, 30.0, 28.0, 22.0, 22.0, 26.0, 20.0, 17.0, 5.0, 7.0, 14.0, 13.0, 5.0, 8.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.6036057472229004, -2.5236926078796387, -2.443779468536377, -2.3638663291931152, -2.2839531898498535, -2.204040050506592, -2.12412691116333, -2.0442137718200684, -1.9643006324768066, -1.884387493133545, -1.8044743537902832, -1.7245612144470215, -1.6446480751037598, -1.564734935760498, -1.4848217964172363, -1.4049086570739746, -1.3249953985214233, -1.2450822591781616, -1.1651691198349, -1.0852559804916382, -1.0053428411483765, -0.9254297018051147, -0.8455165028572083, -0.7656033635139465, -0.6856902241706848, -0.6057770848274231, -0.5258639454841614, -0.44595077633857727, -0.36603763699531555, -0.28612449765205383, -0.20621132850646973, -0.126298189163208, -0.04638504981994629, 0.03352809697389603, 0.11344124376773834, 0.19335439801216125, 0.273267537355423, 0.3531806766986847, 0.4330938458442688, 0.5130069851875305, 0.5929201245307922, 0.672833263874054, 0.7527464032173157, 0.8326596021652222, 0.9125727415084839, 0.9924858808517456, 1.0723990201950073, 1.152312159538269, 1.2322252988815308, 1.3121384382247925, 1.3920515775680542, 1.471964716911316, 1.5518778562545776, 1.6317909955978394, 1.7117042541503906, 1.7916173934936523, 1.871530532836914, 1.9514436721801758, 2.0313568115234375, 2.111269950866699, 2.191183090209961, 2.2710962295532227, 2.3510093688964844, 2.430922508239746, 2.510835647583008]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 12.0, 8.0, 28.0, 26.0, 32.0, 58.0, 99.0, 93.0, 168.0, 261.0, 368.0, 520.0, 783.0, 1111.0, 1782.0, 2639.0, 4183.0, 6756.0, 10744.0, 17625.0, 29981.0, 52567.0, 95982.0, 180449.0, 346564.0, 627920.0, 889814.0, 817818.0, 510290.0, 270558.0, 141820.0, 76576.0, 42805.0, 24500.0, 14710.0, 8873.0, 5612.0, 3596.0, 2236.0, 1481.0, 968.0, 616.0, 443.0, 268.0, 176.0, 126.0, 83.0, 54.0, 38.0, 23.0, 15.0, 8.0, 8.0, 2.0, 2.0, 3.0], "bins": [-4.6328125, -4.499725341796875, -4.36663818359375, -4.233551025390625, -4.1004638671875, -3.967376708984375, -3.83428955078125, -3.701202392578125, -3.568115234375, -3.435028076171875, -3.30194091796875, -3.168853759765625, -3.0357666015625, -2.902679443359375, -2.76959228515625, -2.636505126953125, -2.50341796875, -2.370330810546875, -2.23724365234375, -2.104156494140625, -1.9710693359375, -1.837982177734375, -1.70489501953125, -1.571807861328125, -1.438720703125, -1.305633544921875, -1.17254638671875, -1.039459228515625, -0.9063720703125, -0.773284912109375, -0.64019775390625, -0.507110595703125, -0.3740234375, -0.240936279296875, -0.10784912109375, 0.025238037109375, 0.1583251953125, 0.291412353515625, 0.42449951171875, 0.557586669921875, 0.690673828125, 0.823760986328125, 0.95684814453125, 1.089935302734375, 1.2230224609375, 1.356109619140625, 1.48919677734375, 1.622283935546875, 1.75537109375, 1.888458251953125, 2.02154541015625, 2.154632568359375, 2.2877197265625, 2.420806884765625, 2.55389404296875, 2.686981201171875, 2.820068359375, 2.953155517578125, 3.08624267578125, 3.219329833984375, 3.3524169921875, 3.485504150390625, 3.61859130859375, 3.751678466796875, 3.884765625]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 5.0, 2.0, 9.0, 11.0, 9.0, 10.0, 10.0, 22.0, 22.0, 19.0, 27.0, 25.0, 22.0, 30.0, 31.0, 41.0, 31.0, 46.0, 37.0, 40.0, 34.0, 40.0, 33.0, 37.0, 42.0, 43.0, 39.0, 26.0, 35.0, 34.0, 24.0, 23.0, 23.0, 21.0, 19.0, 16.0, 8.0, 12.0, 6.0, 4.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.345703125, -2.2724609375, -2.19921875, -2.1259765625, -2.052734375, -1.9794921875, -1.90625, -1.8330078125, -1.759765625, -1.6865234375, -1.61328125, -1.5400390625, -1.466796875, -1.3935546875, -1.3203125, -1.2470703125, -1.173828125, -1.1005859375, -1.02734375, -0.9541015625, -0.880859375, -0.8076171875, -0.734375, -0.6611328125, -0.587890625, -0.5146484375, -0.44140625, -0.3681640625, -0.294921875, -0.2216796875, -0.1484375, -0.0751953125, -0.001953125, 0.0712890625, 0.14453125, 0.2177734375, 0.291015625, 0.3642578125, 0.4375, 0.5107421875, 0.583984375, 0.6572265625, 0.73046875, 0.8037109375, 0.876953125, 0.9501953125, 1.0234375, 1.0966796875, 1.169921875, 1.2431640625, 1.31640625, 1.3896484375, 1.462890625, 1.5361328125, 1.609375, 1.6826171875, 1.755859375, 1.8291015625, 1.90234375, 1.9755859375, 2.048828125, 2.1220703125, 2.1953125, 2.2685546875, 2.341796875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 18.0, 33.0, 31.0, 52.0, 81.0, 112.0, 204.0, 286.0, 404.0, 675.0, 1115.0, 1652.0, 2733.0, 4343.0, 7060.0, 11690.0, 19764.0, 34120.0, 59776.0, 107753.0, 195242.0, 353582.0, 604979.0, 838242.0, 780767.0, 512215.0, 290859.0, 159397.0, 87459.0, 49180.0, 27997.0, 16448.0, 9874.0, 5990.0, 3713.0, 2310.0, 1463.0, 889.0, 631.0, 381.0, 264.0, 154.0, 91.0, 85.0, 55.0, 30.0, 21.0, 14.0, 13.0, 7.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.38690185546875, -4.2347412109375, -4.08258056640625, -3.930419921875, -3.77825927734375, -3.6260986328125, -3.47393798828125, -3.32177734375, -3.16961669921875, -3.0174560546875, -2.86529541015625, -2.713134765625, -2.56097412109375, -2.4088134765625, -2.25665283203125, -2.1044921875, -1.95233154296875, -1.8001708984375, -1.64801025390625, -1.495849609375, -1.34368896484375, -1.1915283203125, -1.03936767578125, -0.88720703125, -0.73504638671875, -0.5828857421875, -0.43072509765625, -0.278564453125, -0.12640380859375, 0.0257568359375, 0.17791748046875, 0.330078125, 0.48223876953125, 0.6343994140625, 0.78656005859375, 0.938720703125, 1.09088134765625, 1.2430419921875, 1.39520263671875, 1.54736328125, 1.69952392578125, 1.8516845703125, 2.00384521484375, 2.156005859375, 2.30816650390625, 2.4603271484375, 2.61248779296875, 2.7646484375, 2.91680908203125, 3.0689697265625, 3.22113037109375, 3.373291015625, 3.52545166015625, 3.6776123046875, 3.82977294921875, 3.98193359375, 4.13409423828125, 4.2862548828125, 4.43841552734375, 4.590576171875, 4.74273681640625, 4.8948974609375, 5.04705810546875, 5.19921875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 2.0, 10.0, 10.0, 12.0, 18.0, 26.0, 29.0, 31.0, 40.0, 71.0, 67.0, 89.0, 102.0, 132.0, 170.0, 198.0, 247.0, 226.0, 270.0, 289.0, 268.0, 246.0, 258.0, 220.0, 218.0, 165.0, 148.0, 123.0, 84.0, 78.0, 62.0, 44.0, 36.0, 24.0, 15.0, 13.0, 8.0, 8.0, 2.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6845703125, -1.633544921875, -1.58251953125, -1.531494140625, -1.48046875, -1.429443359375, -1.37841796875, -1.327392578125, -1.2763671875, -1.225341796875, -1.17431640625, -1.123291015625, -1.072265625, -1.021240234375, -0.97021484375, -0.919189453125, -0.8681640625, -0.817138671875, -0.76611328125, -0.715087890625, -0.6640625, -0.613037109375, -0.56201171875, -0.510986328125, -0.4599609375, -0.408935546875, -0.35791015625, -0.306884765625, -0.255859375, -0.204833984375, -0.15380859375, -0.102783203125, -0.0517578125, -0.000732421875, 0.05029296875, 0.101318359375, 0.15234375, 0.203369140625, 0.25439453125, 0.305419921875, 0.3564453125, 0.407470703125, 0.45849609375, 0.509521484375, 0.560546875, 0.611572265625, 0.66259765625, 0.713623046875, 0.7646484375, 0.815673828125, 0.86669921875, 0.917724609375, 0.96875, 1.019775390625, 1.07080078125, 1.121826171875, 1.1728515625, 1.223876953125, 1.27490234375, 1.325927734375, 1.376953125, 1.427978515625, 1.47900390625, 1.530029296875, 1.5810546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 11.0, 11.0, 9.0, 18.0, 18.0, 21.0, 27.0, 38.0, 35.0, 54.0, 45.0, 60.0, 57.0, 70.0, 72.0, 53.0, 62.0, 44.0, 46.0, 44.0, 32.0, 41.0, 21.0, 21.0, 17.0, 16.0, 9.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.877341270446777, -5.695503234863281, -5.513665199279785, -5.331827163696289, -5.149989604949951, -4.968151569366455, -4.786313533782959, -4.604475498199463, -4.422637939453125, -4.240799903869629, -4.058961868286133, -3.877124071121216, -3.695286273956299, -3.5134482383728027, -3.3316102027893066, -3.1497721672058105, -2.9679341316223145, -2.7860960960388184, -2.6042582988739014, -2.4224202632904053, -2.2405824661254883, -2.058744430541992, -1.876906394958496, -1.6950684785842896, -1.513230562210083, -1.3313926458358765, -1.14955472946167, -0.9677166938781738, -0.7858787775039673, -0.6040408611297607, -0.42220282554626465, -0.2403649091720581, -0.05852651596069336, 0.12331143021583557, 0.3051493763923645, 0.4869873523712158, 0.6688252687454224, 0.8506631851196289, 1.032501220703125, 1.2143391370773315, 1.396177053451538, 1.5780149698257446, 1.7598528861999512, 1.9416909217834473, 2.1235289573669434, 2.3053667545318604, 2.4872047901153564, 2.6690425872802734, 2.8508806228637695, 3.0327186584472656, 3.2145564556121826, 3.3963944911956787, 3.5782322883605957, 3.760070323944092, 3.941908359527588, 4.123746395111084, 4.305583953857422, 4.487421989440918, 4.669260025024414, 4.85109806060791, 5.032935619354248, 5.214773654937744, 5.39661169052124, 5.578449726104736, 5.760287761688232]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 6.0, 4.0, 1.0, 2.0, 6.0, 4.0, 6.0, 15.0, 12.0, 9.0, 17.0, 11.0, 18.0, 22.0, 24.0, 22.0, 38.0, 28.0, 35.0, 26.0, 33.0, 33.0, 36.0, 34.0, 52.0, 40.0, 34.0, 38.0, 33.0, 37.0, 36.0, 38.0, 31.0, 24.0, 22.0, 19.0, 21.0, 27.0, 14.0, 11.0, 13.0, 19.0, 3.0, 17.0, 7.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-2.9414868354797363, -2.855492115020752, -2.7694976329803467, -2.6835029125213623, -2.597508430480957, -2.5115137100219727, -2.4255189895629883, -2.339524507522583, -2.2535300254821777, -2.1675353050231934, -2.081540822982788, -1.9955461025238037, -1.9095516204833984, -1.823556900024414, -1.7375622987747192, -1.6515676975250244, -1.56557297706604, -1.4795783758163452, -1.3935837745666504, -1.307589054107666, -1.2215945720672607, -1.1355998516082764, -1.0496052503585815, -0.9636106491088867, -0.8776160478591919, -0.7916214466094971, -0.7056268453598022, -0.6196321845054626, -0.5336375832557678, -0.447642982006073, -0.3616483211517334, -0.2756537199020386, -0.18965911865234375, -0.10366450250148773, -0.017669886350631714, 0.0683247447013855, 0.15431934595108032, 0.24031394720077515, 0.32630860805511475, 0.41230320930480957, 0.4982978105545044, 0.5842924118041992, 0.670287013053894, 0.7562816739082336, 0.8422762751579285, 0.9282708764076233, 1.014265537261963, 1.1002601385116577, 1.1862547397613525, 1.2722493410110474, 1.3582439422607422, 1.4442386627197266, 1.5302331447601318, 1.6162278652191162, 1.702222466468811, 1.7882170677185059, 1.8742116689682007, 1.9602062702178955, 2.04620099067688, 2.132195472717285, 2.2181901931762695, 2.304184675216675, 2.390179395675659, 2.4761738777160645, 2.562168598175049]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 13.0, 15.0, 29.0, 45.0, 62.0, 97.0, 193.0, 365.0, 643.0, 1373.0, 2880.0, 6527.0, 15368.0, 38433.0, 103326.0, 266688.0, 345720.0, 164898.0, 60674.0, 23282.0, 9698.0, 4349.0, 1962.0, 894.0, 443.0, 212.0, 144.0, 79.0, 44.0, 33.0, 21.0, 9.0, 15.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8223419189453125, -0.792144775390625, -0.7619476318359375, -0.73175048828125, -0.7015533447265625, -0.671356201171875, -0.6411590576171875, -0.6109619140625, -0.5807647705078125, -0.550567626953125, -0.5203704833984375, -0.49017333984375, -0.4599761962890625, -0.429779052734375, -0.3995819091796875, -0.369384765625, -0.3391876220703125, -0.308990478515625, -0.2787933349609375, -0.24859619140625, -0.2183990478515625, -0.188201904296875, -0.1580047607421875, -0.1278076171875, -0.0976104736328125, -0.067413330078125, -0.0372161865234375, -0.00701904296875, 0.0231781005859375, 0.053375244140625, 0.0835723876953125, 0.11376953125, 0.1439666748046875, 0.174163818359375, 0.2043609619140625, 0.23455810546875, 0.2647552490234375, 0.294952392578125, 0.3251495361328125, 0.3553466796875, 0.3855438232421875, 0.415740966796875, 0.4459381103515625, 0.47613525390625, 0.5063323974609375, 0.536529541015625, 0.5667266845703125, 0.596923828125, 0.6271209716796875, 0.657318115234375, 0.6875152587890625, 0.71771240234375, 0.7479095458984375, 0.778106689453125, 0.8083038330078125, 0.8385009765625, 0.8686981201171875, 0.898895263671875, 0.9290924072265625, 0.95928955078125, 0.9894866943359375, 1.019683837890625, 1.0498809814453125, 1.080078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 7.0, 12.0, 11.0, 19.0, 17.0, 25.0, 33.0, 21.0, 33.0, 28.0, 36.0, 44.0, 31.0, 40.0, 43.0, 56.0, 51.0, 47.0, 55.0, 41.0, 41.0, 39.0, 43.0, 26.0, 24.0, 28.0, 17.0, 20.0, 17.0, 17.0, 17.0, 10.0, 12.0, 12.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59765625, -3.479827880859375, -3.36199951171875, -3.244171142578125, -3.1263427734375, -3.008514404296875, -2.89068603515625, -2.772857666015625, -2.655029296875, -2.537200927734375, -2.41937255859375, -2.301544189453125, -2.1837158203125, -2.065887451171875, -1.94805908203125, -1.830230712890625, -1.71240234375, -1.594573974609375, -1.47674560546875, -1.358917236328125, -1.2410888671875, -1.123260498046875, -1.00543212890625, -0.887603759765625, -0.769775390625, -0.651947021484375, -0.53411865234375, -0.416290283203125, -0.2984619140625, -0.180633544921875, -0.06280517578125, 0.055023193359375, 0.1728515625, 0.290679931640625, 0.40850830078125, 0.526336669921875, 0.6441650390625, 0.761993408203125, 0.87982177734375, 0.997650146484375, 1.115478515625, 1.233306884765625, 1.35113525390625, 1.468963623046875, 1.5867919921875, 1.704620361328125, 1.82244873046875, 1.940277099609375, 2.05810546875, 2.175933837890625, 2.29376220703125, 2.411590576171875, 2.5294189453125, 2.647247314453125, 2.76507568359375, 2.882904052734375, 3.000732421875, 3.118560791015625, 3.23638916015625, 3.354217529296875, 3.4720458984375, 3.589874267578125, 3.70770263671875, 3.825531005859375, 3.943359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 8.0, 14.0, 16.0, 29.0, 36.0, 70.0, 111.0, 188.0, 315.0, 606.0, 1145.0, 2283.0, 5561.0, 16564.0, 92937.0, 884183.0, 29265.0, 8795.0, 3258.0, 1482.0, 727.0, 374.0, 240.0, 118.0, 87.0, 53.0, 30.0, 26.0, 6.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.017669677734375, -1.93768310546875, -1.857696533203125, -1.7777099609375, -1.697723388671875, -1.61773681640625, -1.537750244140625, -1.457763671875, -1.377777099609375, -1.29779052734375, -1.217803955078125, -1.1378173828125, -1.057830810546875, -0.97784423828125, -0.897857666015625, -0.81787109375, -0.737884521484375, -0.65789794921875, -0.577911376953125, -0.4979248046875, -0.417938232421875, -0.33795166015625, -0.257965087890625, -0.177978515625, -0.097991943359375, -0.01800537109375, 0.061981201171875, 0.1419677734375, 0.221954345703125, 0.30194091796875, 0.381927490234375, 0.4619140625, 0.541900634765625, 0.62188720703125, 0.701873779296875, 0.7818603515625, 0.861846923828125, 0.94183349609375, 1.021820068359375, 1.101806640625, 1.181793212890625, 1.26177978515625, 1.341766357421875, 1.4217529296875, 1.501739501953125, 1.58172607421875, 1.661712646484375, 1.74169921875, 1.821685791015625, 1.90167236328125, 1.981658935546875, 2.0616455078125, 2.141632080078125, 2.22161865234375, 2.301605224609375, 2.381591796875, 2.461578369140625, 2.54156494140625, 2.621551513671875, 2.7015380859375, 2.781524658203125, 2.86151123046875, 2.941497802734375, 3.021484375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 10.0, 17.0, 16.0, 20.0, 27.0, 38.0, 23.0, 31.0, 41.0, 33.0, 43.0, 40.0, 39.0, 40.0, 37.0, 52.0, 46.0, 46.0, 42.0, 37.0, 26.0, 27.0, 41.0, 31.0, 19.0, 23.0, 18.0, 15.0, 13.0, 17.0, 10.0, 5.0, 8.0, 8.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.255859375, -2.185516357421875, -2.11517333984375, -2.044830322265625, -1.9744873046875, -1.904144287109375, -1.83380126953125, -1.763458251953125, -1.693115234375, -1.622772216796875, -1.55242919921875, -1.482086181640625, -1.4117431640625, -1.341400146484375, -1.27105712890625, -1.200714111328125, -1.13037109375, -1.060028076171875, -0.98968505859375, -0.919342041015625, -0.8489990234375, -0.778656005859375, -0.70831298828125, -0.637969970703125, -0.567626953125, -0.497283935546875, -0.42694091796875, -0.356597900390625, -0.2862548828125, -0.215911865234375, -0.14556884765625, -0.075225830078125, -0.0048828125, 0.065460205078125, 0.13580322265625, 0.206146240234375, 0.2764892578125, 0.346832275390625, 0.41717529296875, 0.487518310546875, 0.557861328125, 0.628204345703125, 0.69854736328125, 0.768890380859375, 0.8392333984375, 0.909576416015625, 0.97991943359375, 1.050262451171875, 1.12060546875, 1.190948486328125, 1.26129150390625, 1.331634521484375, 1.4019775390625, 1.472320556640625, 1.54266357421875, 1.613006591796875, 1.683349609375, 1.753692626953125, 1.82403564453125, 1.894378662109375, 1.9647216796875, 2.035064697265625, 2.10540771484375, 2.175750732421875, 2.24609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 0.0, 3.0, 10.0, 17.0, 24.0, 27.0, 33.0, 73.0, 97.0, 163.0, 221.0, 371.0, 675.0, 1736.0, 6957.0, 84252.0, 938120.0, 11626.0, 2206.0, 801.0, 389.0, 240.0, 167.0, 110.0, 62.0, 53.0, 34.0, 20.0, 24.0, 4.0, 5.0, 4.0, 5.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1881103515625, -1.148681640625, -1.1092529296875, -1.06982421875, -1.0303955078125, -0.990966796875, -0.9515380859375, -0.912109375, -0.8726806640625, -0.833251953125, -0.7938232421875, -0.75439453125, -0.7149658203125, -0.675537109375, -0.6361083984375, -0.5966796875, -0.5572509765625, -0.517822265625, -0.4783935546875, -0.43896484375, -0.3995361328125, -0.360107421875, -0.3206787109375, -0.28125, -0.2418212890625, -0.202392578125, -0.1629638671875, -0.12353515625, -0.0841064453125, -0.044677734375, -0.0052490234375, 0.0341796875, 0.0736083984375, 0.113037109375, 0.1524658203125, 0.19189453125, 0.2313232421875, 0.270751953125, 0.3101806640625, 0.349609375, 0.3890380859375, 0.428466796875, 0.4678955078125, 0.50732421875, 0.5467529296875, 0.586181640625, 0.6256103515625, 0.6650390625, 0.7044677734375, 0.743896484375, 0.7833251953125, 0.82275390625, 0.8621826171875, 0.901611328125, 0.9410400390625, 0.98046875, 1.0198974609375, 1.059326171875, 1.0987548828125, 1.13818359375, 1.1776123046875, 1.217041015625, 1.2564697265625, 1.2958984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 20.0, 41.0, 67.0, 86.0, 150.0, 166.0, 152.0, 99.0, 96.0, 53.0, 24.0, 13.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012135505676269531, -0.00011796876788139343, -0.00011458247900009155, -0.00011119619011878967, -0.00010780990123748779, -0.00010442361235618591, -0.00010103732347488403, -9.765103459358215e-05, -9.426474571228027e-05, -9.08784568309784e-05, -8.749216794967651e-05, -8.410587906837463e-05, -8.071959018707275e-05, -7.733330130577087e-05, -7.3947012424469e-05, -7.056072354316711e-05, -6.717443466186523e-05, -6.378814578056335e-05, -6.0401856899261475e-05, -5.7015568017959595e-05, -5.3629279136657715e-05, -5.0242990255355835e-05, -4.6856701374053955e-05, -4.3470412492752075e-05, -4.0084123611450195e-05, -3.6697834730148315e-05, -3.3311545848846436e-05, -2.9925256967544556e-05, -2.6538968086242676e-05, -2.3152679204940796e-05, -1.9766390323638916e-05, -1.6380101442337036e-05, -1.2993812561035156e-05, -9.607523679733276e-06, -6.2212347984313965e-06, -2.8349459171295166e-06, 5.513429641723633e-07, 3.937631845474243e-06, 7.323920726776123e-06, 1.0710209608078003e-05, 1.4096498489379883e-05, 1.7482787370681763e-05, 2.0869076251983643e-05, 2.4255365133285522e-05, 2.7641654014587402e-05, 3.102794289588928e-05, 3.441423177719116e-05, 3.780052065849304e-05, 4.118680953979492e-05, 4.45730984210968e-05, 4.795938730239868e-05, 5.134567618370056e-05, 5.473196506500244e-05, 5.811825394630432e-05, 6.15045428276062e-05, 6.489083170890808e-05, 6.827712059020996e-05, 7.166340947151184e-05, 7.504969835281372e-05, 7.84359872341156e-05, 8.182227611541748e-05, 8.520856499671936e-05, 8.859485387802124e-05, 9.198114275932312e-05, 9.5367431640625e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 5.0, 18.0, 22.0, 25.0, 35.0, 53.0, 52.0, 83.0, 122.0, 158.0, 287.0, 451.0, 743.0, 1266.0, 2051.0, 3426.0, 6426.0, 19152.0, 192160.0, 728236.0, 69760.0, 11734.0, 5010.0, 2768.0, 1706.0, 1027.0, 606.0, 371.0, 243.0, 175.0, 113.0, 76.0, 54.0, 44.0, 23.0, 20.0, 18.0, 5.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.71533203125, -0.6938629150390625, -0.672393798828125, -0.6509246826171875, -0.62945556640625, -0.6079864501953125, -0.586517333984375, -0.5650482177734375, -0.5435791015625, -0.5221099853515625, -0.500640869140625, -0.4791717529296875, -0.45770263671875, -0.4362335205078125, -0.414764404296875, -0.3932952880859375, -0.371826171875, -0.3503570556640625, -0.328887939453125, -0.3074188232421875, -0.28594970703125, -0.2644805908203125, -0.243011474609375, -0.2215423583984375, -0.2000732421875, -0.1786041259765625, -0.157135009765625, -0.1356658935546875, -0.11419677734375, -0.0927276611328125, -0.071258544921875, -0.0497894287109375, -0.0283203125, -0.0068511962890625, 0.014617919921875, 0.0360870361328125, 0.05755615234375, 0.0790252685546875, 0.100494384765625, 0.1219635009765625, 0.1434326171875, 0.1649017333984375, 0.186370849609375, 0.2078399658203125, 0.22930908203125, 0.2507781982421875, 0.272247314453125, 0.2937164306640625, 0.315185546875, 0.3366546630859375, 0.358123779296875, 0.3795928955078125, 0.40106201171875, 0.4225311279296875, 0.444000244140625, 0.4654693603515625, 0.4869384765625, 0.5084075927734375, 0.529876708984375, 0.5513458251953125, 0.57281494140625, 0.5942840576171875, 0.615753173828125, 0.6372222900390625, 0.65869140625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 17.0, 39.0, 104.0, 249.0, 325.0, 145.0, 55.0, 22.0, 14.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.17509841918945312, -0.16928863525390625, -0.16347885131835938, -0.1576690673828125, -0.15185928344726562, -0.14604949951171875, -0.14023971557617188, -0.134429931640625, -0.12862014770507812, -0.12281036376953125, -0.11700057983398438, -0.1111907958984375, -0.10538101196289062, -0.09957122802734375, -0.09376144409179688, -0.08795166015625, -0.08214187622070312, -0.07633209228515625, -0.07052230834960938, -0.0647125244140625, -0.058902740478515625, -0.05309295654296875, -0.047283172607421875, -0.041473388671875, -0.035663604736328125, -0.02985382080078125, -0.024044036865234375, -0.0182342529296875, -0.012424468994140625, -0.00661468505859375, -0.000804901123046875, 0.0050048828125, 0.010814666748046875, 0.01662445068359375, 0.022434234619140625, 0.0282440185546875, 0.034053802490234375, 0.03986358642578125, 0.045673370361328125, 0.051483154296875, 0.057292938232421875, 0.06310272216796875, 0.06891250610351562, 0.0747222900390625, 0.08053207397460938, 0.08634185791015625, 0.09215164184570312, 0.09796142578125, 0.10377120971679688, 0.10958099365234375, 0.11539077758789062, 0.1212005615234375, 0.12701034545898438, 0.13282012939453125, 0.13862991333007812, 0.144439697265625, 0.15024948120117188, 0.15605926513671875, 0.16186904907226562, 0.1676788330078125, 0.17348861694335938, 0.17929840087890625, 0.18510818481445312, 0.19091796875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 0.0, 4.0, 6.0, 10.0, 12.0, 14.0, 20.0, 16.0, 24.0, 32.0, 37.0, 43.0, 56.0, 49.0, 56.0, 71.0, 67.0, 68.0, 66.0, 45.0, 52.0, 35.0, 39.0, 43.0, 25.0, 23.0, 17.0, 16.0, 16.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0382232666015625, -5.853695869445801, -5.669168472290039, -5.484641075134277, -5.300113201141357, -5.115585803985596, -4.931058406829834, -4.746531009674072, -4.562003135681152, -4.377475738525391, -4.192948341369629, -4.008420944213867, -3.8238930702209473, -3.6393656730651855, -3.454838275909424, -3.270310878753662, -3.0857834815979004, -2.9012560844421387, -2.716728448867798, -2.532201051712036, -2.3476734161376953, -2.1631460189819336, -1.9786186218261719, -1.7940911054611206, -1.6095635890960693, -1.425036072731018, -1.2405085563659668, -1.055981159210205, -0.8714536428451538, -0.6869261264801025, -0.5023987293243408, -0.31787121295928955, -0.13334321975708008, 0.051184266805648804, 0.23571175336837769, 0.4202392101287842, 0.6047667264938354, 0.7892942428588867, 0.9738216400146484, 1.1583491563796997, 1.342876672744751, 1.5274041891098022, 1.7119317054748535, 1.8964591026306152, 2.080986499786377, 2.2655141353607178, 2.4500415325164795, 2.6345691680908203, 2.819096565246582, 3.0036239624023438, 3.1881515979766846, 3.3726789951324463, 3.557206630706787, 3.741734027862549, 3.9262614250183105, 4.110788822174072, 4.295316696166992, 4.479844093322754, 4.664371490478516, 4.848898887634277, 5.033426761627197, 5.217954158782959, 5.402481555938721, 5.587008953094482, 5.771536350250244]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 6.0, 4.0, 7.0, 16.0, 9.0, 11.0, 17.0, 12.0, 16.0, 18.0, 23.0, 24.0, 33.0, 37.0, 29.0, 26.0, 33.0, 28.0, 38.0, 38.0, 44.0, 47.0, 35.0, 35.0, 30.0, 39.0, 40.0, 37.0, 31.0, 26.0, 21.0, 22.0, 20.0, 22.0, 20.0, 11.0, 13.0, 11.0, 13.0, 13.0, 8.0, 3.0, 4.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-2.915468454360962, -2.8307132720947266, -2.745957851409912, -2.6612026691436768, -2.5764474868774414, -2.491692304611206, -2.4069368839263916, -2.3221817016601562, -2.237426519393921, -2.1526713371276855, -2.067915916442871, -1.9831607341766357, -1.8984055519104004, -1.8136502504348755, -1.7288949489593506, -1.6441397666931152, -1.5593844652175903, -1.4746291637420654, -1.38987398147583, -1.3051186800003052, -1.2203634977340698, -1.135608196258545, -1.0508530139923096, -0.9660977125167847, -0.8813424706459045, -0.7965872287750244, -0.7118319869041443, -0.6270767450332642, -0.5423214435577393, -0.4575662314891815, -0.372810959815979, -0.2880557179450989, -0.20330047607421875, -0.11854522675275803, -0.0337899774312973, 0.05096527934074402, 0.13572052121162415, 0.22047576308250427, 0.3052310347557068, 0.3899862766265869, 0.47474151849746704, 0.5594967603683472, 0.6442520022392273, 0.7290072441101074, 0.8137625455856323, 0.8985177278518677, 0.9832730293273926, 1.068028211593628, 1.1527835130691528, 1.2375388145446777, 1.322293996810913, 1.407049298286438, 1.4918044805526733, 1.5765597820281982, 1.6613149642944336, 1.7460702657699585, 1.8308255672454834, 1.9155808687210083, 2.000336170196533, 2.0850913524627686, 2.169846534729004, 2.2546017169952393, 2.3393571376800537, 2.424112319946289, 2.5088675022125244]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 17.0, 27.0, 35.0, 57.0, 88.0, 122.0, 185.0, 286.0, 431.0, 696.0, 1111.0, 1903.0, 3288.0, 5812.0, 10544.0, 18859.0, 33677.0, 57791.0, 93381.0, 135890.0, 167106.0, 166151.0, 132296.0, 89937.0, 55354.0, 32104.0, 18091.0, 10067.0, 5515.0, 3052.0, 1833.0, 1064.0, 644.0, 374.0, 256.0, 156.0, 120.0, 65.0, 46.0, 29.0, 28.0, 19.0, 10.0, 10.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.2265625, -4.09429931640625, -3.9620361328125, -3.82977294921875, -3.697509765625, -3.56524658203125, -3.4329833984375, -3.30072021484375, -3.16845703125, -3.03619384765625, -2.9039306640625, -2.77166748046875, -2.639404296875, -2.50714111328125, -2.3748779296875, -2.24261474609375, -2.1103515625, -1.97808837890625, -1.8458251953125, -1.71356201171875, -1.581298828125, -1.44903564453125, -1.3167724609375, -1.18450927734375, -1.05224609375, -0.91998291015625, -0.7877197265625, -0.65545654296875, -0.523193359375, -0.39093017578125, -0.2586669921875, -0.12640380859375, 0.005859375, 0.13812255859375, 0.2703857421875, 0.40264892578125, 0.534912109375, 0.66717529296875, 0.7994384765625, 0.93170166015625, 1.06396484375, 1.19622802734375, 1.3284912109375, 1.46075439453125, 1.593017578125, 1.72528076171875, 1.8575439453125, 1.98980712890625, 2.1220703125, 2.25433349609375, 2.3865966796875, 2.51885986328125, 2.651123046875, 2.78338623046875, 2.9156494140625, 3.04791259765625, 3.18017578125, 3.31243896484375, 3.4447021484375, 3.57696533203125, 3.709228515625, 3.84149169921875, 3.9737548828125, 4.10601806640625, 4.23828125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 4.0, 9.0, 10.0, 24.0, 13.0, 19.0, 21.0, 21.0, 20.0, 22.0, 40.0, 27.0, 39.0, 33.0, 40.0, 51.0, 33.0, 41.0, 41.0, 40.0, 37.0, 32.0, 37.0, 41.0, 34.0, 23.0, 33.0, 19.0, 27.0, 20.0, 18.0, 16.0, 18.0, 8.0, 9.0, 7.0, 14.0, 6.0, 5.0, 1.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.064453125, -2.968017578125, -2.87158203125, -2.775146484375, -2.6787109375, -2.582275390625, -2.48583984375, -2.389404296875, -2.29296875, -2.196533203125, -2.10009765625, -2.003662109375, -1.9072265625, -1.810791015625, -1.71435546875, -1.617919921875, -1.521484375, -1.425048828125, -1.32861328125, -1.232177734375, -1.1357421875, -1.039306640625, -0.94287109375, -0.846435546875, -0.75, -0.653564453125, -0.55712890625, -0.460693359375, -0.3642578125, -0.267822265625, -0.17138671875, -0.074951171875, 0.021484375, 0.117919921875, 0.21435546875, 0.310791015625, 0.4072265625, 0.503662109375, 0.60009765625, 0.696533203125, 0.79296875, 0.889404296875, 0.98583984375, 1.082275390625, 1.1787109375, 1.275146484375, 1.37158203125, 1.468017578125, 1.564453125, 1.660888671875, 1.75732421875, 1.853759765625, 1.9501953125, 2.046630859375, 2.14306640625, 2.239501953125, 2.3359375, 2.432373046875, 2.52880859375, 2.625244140625, 2.7216796875, 2.818115234375, 2.91455078125, 3.010986328125, 3.107421875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 7.0, 18.0, 36.0, 49.0, 73.0, 117.0, 165.0, 317.0, 503.0, 798.0, 1360.0, 2190.0, 3784.0, 6525.0, 10644.0, 18411.0, 29744.0, 48212.0, 73391.0, 103778.0, 133679.0, 147435.0, 138712.0, 111602.0, 80247.0, 52811.0, 33582.0, 20618.0, 11946.0, 7128.0, 4295.0, 2587.0, 1464.0, 880.0, 554.0, 314.0, 199.0, 137.0, 75.0, 53.0, 30.0, 26.0, 21.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.88671875, -3.771087646484375, -3.65545654296875, -3.539825439453125, -3.4241943359375, -3.308563232421875, -3.19293212890625, -3.077301025390625, -2.961669921875, -2.846038818359375, -2.73040771484375, -2.614776611328125, -2.4991455078125, -2.383514404296875, -2.26788330078125, -2.152252197265625, -2.03662109375, -1.920989990234375, -1.80535888671875, -1.689727783203125, -1.5740966796875, -1.458465576171875, -1.34283447265625, -1.227203369140625, -1.111572265625, -0.995941162109375, -0.88031005859375, -0.764678955078125, -0.6490478515625, -0.533416748046875, -0.41778564453125, -0.302154541015625, -0.1865234375, -0.070892333984375, 0.04473876953125, 0.160369873046875, 0.2760009765625, 0.391632080078125, 0.50726318359375, 0.622894287109375, 0.738525390625, 0.854156494140625, 0.96978759765625, 1.085418701171875, 1.2010498046875, 1.316680908203125, 1.43231201171875, 1.547943115234375, 1.66357421875, 1.779205322265625, 1.89483642578125, 2.010467529296875, 2.1260986328125, 2.241729736328125, 2.35736083984375, 2.472991943359375, 2.588623046875, 2.704254150390625, 2.81988525390625, 2.935516357421875, 3.0511474609375, 3.166778564453125, 3.28240966796875, 3.398040771484375, 3.513671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 6.0, 3.0, 7.0, 17.0, 13.0, 17.0, 18.0, 16.0, 24.0, 28.0, 27.0, 28.0, 48.0, 30.0, 46.0, 43.0, 39.0, 34.0, 44.0, 44.0, 47.0, 38.0, 40.0, 40.0, 36.0, 33.0, 23.0, 22.0, 26.0, 28.0, 23.0, 23.0, 19.0, 14.0, 15.0, 4.0, 8.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.099609375, -2.035552978515625, -1.97149658203125, -1.907440185546875, -1.8433837890625, -1.779327392578125, -1.71527099609375, -1.651214599609375, -1.587158203125, -1.523101806640625, -1.45904541015625, -1.394989013671875, -1.3309326171875, -1.266876220703125, -1.20281982421875, -1.138763427734375, -1.07470703125, -1.010650634765625, -0.94659423828125, -0.882537841796875, -0.8184814453125, -0.754425048828125, -0.69036865234375, -0.626312255859375, -0.562255859375, -0.498199462890625, -0.43414306640625, -0.370086669921875, -0.3060302734375, -0.241973876953125, -0.17791748046875, -0.113861083984375, -0.0498046875, 0.014251708984375, 0.07830810546875, 0.142364501953125, 0.2064208984375, 0.270477294921875, 0.33453369140625, 0.398590087890625, 0.462646484375, 0.526702880859375, 0.59075927734375, 0.654815673828125, 0.7188720703125, 0.782928466796875, 0.84698486328125, 0.911041259765625, 0.97509765625, 1.039154052734375, 1.10321044921875, 1.167266845703125, 1.2313232421875, 1.295379638671875, 1.35943603515625, 1.423492431640625, 1.487548828125, 1.551605224609375, 1.61566162109375, 1.679718017578125, 1.7437744140625, 1.807830810546875, 1.87188720703125, 1.935943603515625, 2.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 9.0, 12.0, 11.0, 27.0, 39.0, 47.0, 69.0, 116.0, 163.0, 244.0, 376.0, 698.0, 1120.0, 1787.0, 3114.0, 5363.0, 9602.0, 17432.0, 32410.0, 59348.0, 104130.0, 160288.0, 196487.0, 176084.0, 120811.0, 71256.0, 39184.0, 21067.0, 11568.0, 6369.0, 3703.0, 2170.0, 1301.0, 795.0, 493.0, 298.0, 208.0, 115.0, 79.0, 49.0, 39.0, 28.0, 12.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.384765625, -2.311737060546875, -2.23870849609375, -2.165679931640625, -2.0926513671875, -2.019622802734375, -1.94659423828125, -1.873565673828125, -1.800537109375, -1.727508544921875, -1.65447998046875, -1.581451416015625, -1.5084228515625, -1.435394287109375, -1.36236572265625, -1.289337158203125, -1.21630859375, -1.143280029296875, -1.07025146484375, -0.997222900390625, -0.9241943359375, -0.851165771484375, -0.77813720703125, -0.705108642578125, -0.632080078125, -0.559051513671875, -0.48602294921875, -0.412994384765625, -0.3399658203125, -0.266937255859375, -0.19390869140625, -0.120880126953125, -0.0478515625, 0.025177001953125, 0.09820556640625, 0.171234130859375, 0.2442626953125, 0.317291259765625, 0.39031982421875, 0.463348388671875, 0.536376953125, 0.609405517578125, 0.68243408203125, 0.755462646484375, 0.8284912109375, 0.901519775390625, 0.97454833984375, 1.047576904296875, 1.12060546875, 1.193634033203125, 1.26666259765625, 1.339691162109375, 1.4127197265625, 1.485748291015625, 1.55877685546875, 1.631805419921875, 1.704833984375, 1.777862548828125, 1.85089111328125, 1.923919677734375, 1.9969482421875, 2.069976806640625, 2.14300537109375, 2.216033935546875, 2.2890625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 11.0, 10.0, 22.0, 15.0, 53.0, 58.0, 82.0, 87.0, 106.0, 113.0, 104.0, 91.0, 78.0, 55.0, 38.0, 24.0, 13.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004456043243408203, -0.00043368712067604065, -0.000421769917011261, -0.0004098527133464813, -0.00039793550968170166, -0.000386018306016922, -0.00037410110235214233, -0.00036218389868736267, -0.000350266695022583, -0.00033834949135780334, -0.0003264322876930237, -0.000314515084028244, -0.00030259788036346436, -0.0002906806766986847, -0.00027876347303390503, -0.00026684626936912537, -0.0002549290657043457, -0.00024301186203956604, -0.00023109465837478638, -0.00021917745471000671, -0.00020726025104522705, -0.0001953430473804474, -0.00018342584371566772, -0.00017150864005088806, -0.0001595914363861084, -0.00014767423272132874, -0.00013575702905654907, -0.0001238398253917694, -0.00011192262172698975, -0.00010000541806221008, -8.808821439743042e-05, -7.617101073265076e-05, -6.42538070678711e-05, -5.233660340309143e-05, -4.041939973831177e-05, -2.8502196073532104e-05, -1.658499240875244e-05, -4.667788743972778e-06, 7.249414920806885e-06, 1.9166618585586548e-05, 3.108382225036621e-05, 4.3001025915145874e-05, 5.491822957992554e-05, 6.68354332447052e-05, 7.875263690948486e-05, 9.066984057426453e-05, 0.00010258704423904419, 0.00011450424790382385, 0.00012642145156860352, 0.00013833865523338318, 0.00015025585889816284, 0.0001621730625629425, 0.00017409026622772217, 0.00018600746989250183, 0.0001979246735572815, 0.00020984187722206116, 0.00022175908088684082, 0.00023367628455162048, 0.00024559348821640015, 0.0002575106918811798, 0.00026942789554595947, 0.00028134509921073914, 0.0002932623028755188, 0.00030517950654029846, 0.0003170967102050781]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 12.0, 16.0, 25.0, 17.0, 37.0, 52.0, 58.0, 98.0, 130.0, 170.0, 240.0, 350.0, 577.0, 883.0, 1376.0, 2336.0, 3973.0, 6767.0, 12000.0, 21484.0, 39239.0, 69864.0, 118888.0, 173203.0, 193835.0, 160429.0, 104667.0, 60084.0, 33658.0, 18785.0, 10251.0, 5812.0, 3471.0, 1993.0, 1304.0, 823.0, 552.0, 350.0, 220.0, 153.0, 98.0, 88.0, 52.0, 33.0, 28.0, 21.0, 19.0, 10.0, 11.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0], "bins": [-2.384765625, -2.31109619140625, -2.2374267578125, -2.16375732421875, -2.090087890625, -2.01641845703125, -1.9427490234375, -1.86907958984375, -1.79541015625, -1.72174072265625, -1.6480712890625, -1.57440185546875, -1.500732421875, -1.42706298828125, -1.3533935546875, -1.27972412109375, -1.2060546875, -1.13238525390625, -1.0587158203125, -0.98504638671875, -0.911376953125, -0.83770751953125, -0.7640380859375, -0.69036865234375, -0.61669921875, -0.54302978515625, -0.4693603515625, -0.39569091796875, -0.322021484375, -0.24835205078125, -0.1746826171875, -0.10101318359375, -0.02734375, 0.04632568359375, 0.1199951171875, 0.19366455078125, 0.267333984375, 0.34100341796875, 0.4146728515625, 0.48834228515625, 0.56201171875, 0.63568115234375, 0.7093505859375, 0.78302001953125, 0.856689453125, 0.93035888671875, 1.0040283203125, 1.07769775390625, 1.1513671875, 1.22503662109375, 1.2987060546875, 1.37237548828125, 1.446044921875, 1.51971435546875, 1.5933837890625, 1.66705322265625, 1.74072265625, 1.81439208984375, 1.8880615234375, 1.96173095703125, 2.035400390625, 2.10906982421875, 2.1827392578125, 2.25640869140625, 2.330078125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 9.0, 5.0, 11.0, 13.0, 16.0, 24.0, 25.0, 35.0, 32.0, 38.0, 38.0, 50.0, 48.0, 66.0, 57.0, 55.0, 60.0, 43.0, 52.0, 45.0, 47.0, 34.0, 30.0, 24.0, 14.0, 26.0, 15.0, 16.0, 13.0, 8.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.642578125, -0.6241302490234375, -0.605682373046875, -0.5872344970703125, -0.56878662109375, -0.5503387451171875, -0.531890869140625, -0.5134429931640625, -0.4949951171875, -0.4765472412109375, -0.458099365234375, -0.4396514892578125, -0.42120361328125, -0.4027557373046875, -0.384307861328125, -0.3658599853515625, -0.347412109375, -0.3289642333984375, -0.310516357421875, -0.2920684814453125, -0.27362060546875, -0.2551727294921875, -0.236724853515625, -0.2182769775390625, -0.1998291015625, -0.1813812255859375, -0.162933349609375, -0.1444854736328125, -0.12603759765625, -0.1075897216796875, -0.089141845703125, -0.0706939697265625, -0.05224609375, -0.0337982177734375, -0.015350341796875, 0.0030975341796875, 0.02154541015625, 0.0399932861328125, 0.058441162109375, 0.0768890380859375, 0.0953369140625, 0.1137847900390625, 0.132232666015625, 0.1506805419921875, 0.16912841796875, 0.1875762939453125, 0.206024169921875, 0.2244720458984375, 0.242919921875, 0.2613677978515625, 0.279815673828125, 0.2982635498046875, 0.31671142578125, 0.3351593017578125, 0.353607177734375, 0.3720550537109375, 0.3905029296875, 0.4089508056640625, 0.427398681640625, 0.4458465576171875, 0.46429443359375, 0.4827423095703125, 0.501190185546875, 0.5196380615234375, 0.5380859375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 6.0, 8.0, 11.0, 16.0, 21.0, 21.0, 30.0, 32.0, 35.0, 44.0, 48.0, 68.0, 58.0, 63.0, 81.0, 74.0, 58.0, 59.0, 49.0, 39.0, 27.0, 31.0, 33.0, 23.0, 11.0, 9.0, 12.0, 6.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.592738151550293, -6.400635719299316, -6.20853328704834, -6.016430854797363, -5.824328422546387, -5.63222599029541, -5.440123558044434, -5.248021125793457, -5.0559186935424805, -4.863816261291504, -4.671713829040527, -4.479611396789551, -4.287508964538574, -4.095406532287598, -3.9033043384552, -3.7112019062042236, -3.519099712371826, -3.3269972801208496, -3.134894847869873, -2.9427924156188965, -2.75068998336792, -2.5585875511169434, -2.366485357284546, -2.1743829250335693, -1.9822804927825928, -1.7901780605316162, -1.5980756282806396, -1.4059733152389526, -1.213870882987976, -1.0217684507369995, -0.8296661376953125, -0.6375637054443359, -0.4454612731933594, -0.2533588707447052, -0.061256468296051025, 0.13084590435028076, 0.3229483366012573, 0.5150507688522339, 0.7071530818939209, 0.8992555141448975, 1.091357946395874, 1.2834603786468506, 1.4755628108978271, 1.6676651239395142, 1.8597675561904907, 2.0518698692321777, 2.2439723014831543, 2.436074733734131, 2.6281771659851074, 2.820279598236084, 3.0123820304870605, 3.204484462738037, 3.3965868949890137, 3.5886893272399902, 3.7807915210723877, 3.9728939533233643, 4.164996147155762, 4.357098579406738, 4.549201011657715, 4.741303443908691, 4.933405876159668, 5.1255083084106445, 5.317610740661621, 5.509713172912598, 5.701815605163574]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 10.0, 12.0, 16.0, 22.0, 15.0, 18.0, 24.0, 27.0, 28.0, 35.0, 32.0, 32.0, 37.0, 50.0, 42.0, 39.0, 37.0, 57.0, 40.0, 42.0, 38.0, 47.0, 30.0, 34.0, 25.0, 28.0, 28.0, 18.0, 27.0, 17.0, 15.0, 11.0, 5.0, 11.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.537686347961426, -3.4350030422210693, -3.332319498062134, -3.2296361923217773, -3.126952886581421, -3.0242693424224854, -2.921586036682129, -2.8189024925231934, -2.716219186782837, -2.6135358810424805, -2.510852336883545, -2.4081690311431885, -2.305485725402832, -2.2028021812438965, -2.10011887550354, -1.997435450553894, -1.8947521448135376, -1.7920687198638916, -1.6893854141235352, -1.5867019891738892, -1.4840185642242432, -1.3813352584838867, -1.2786518335342407, -1.1759684085845947, -1.0732851028442383, -0.9706017374992371, -0.8679183125495911, -0.7652349472045898, -0.6625515222549438, -0.5598681569099426, -0.4571847915649414, -0.3545013666152954, -0.2518179416656494, -0.1491345465183258, -0.04645116627216339, 0.05623221397399902, 0.15891560912132263, 0.26159900426864624, 0.36428236961364746, 0.46696579456329346, 0.5696491599082947, 0.6723325252532959, 0.7750159502029419, 0.8776993155479431, 0.9803826808929443, 1.0830661058425903, 1.1857495307922363, 1.2884328365325928, 1.3911162614822388, 1.4937996864318848, 1.5964829921722412, 1.6991664171218872, 1.8018498420715332, 1.9045331478118896, 2.007216453552246, 2.1098999977111816, 2.212583303451538, 2.3152666091918945, 2.41795015335083, 2.5206334590911865, 2.623316764831543, 2.7260003089904785, 2.828683614730835, 2.9313669204711914, 3.034050464630127]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 9.0, 7.0, 10.0, 22.0, 20.0, 29.0, 35.0, 60.0, 77.0, 126.0, 169.0, 253.0, 401.0, 579.0, 967.0, 1484.0, 2329.0, 3797.0, 6305.0, 10285.0, 18535.0, 34119.0, 65099.0, 132402.0, 281641.0, 586474.0, 970300.0, 954120.0, 568134.0, 274482.0, 133205.0, 66654.0, 35300.0, 19418.0, 11036.0, 6572.0, 3785.0, 2356.0, 1392.0, 902.0, 518.0, 368.0, 191.0, 127.0, 77.0, 47.0, 40.0, 8.0, 4.0, 11.0, 5.0, 3.0, 1.0, 3.0], "bins": [-6.375, -6.20263671875, -6.0302734375, -5.85791015625, -5.685546875, -5.51318359375, -5.3408203125, -5.16845703125, -4.99609375, -4.82373046875, -4.6513671875, -4.47900390625, -4.306640625, -4.13427734375, -3.9619140625, -3.78955078125, -3.6171875, -3.44482421875, -3.2724609375, -3.10009765625, -2.927734375, -2.75537109375, -2.5830078125, -2.41064453125, -2.23828125, -2.06591796875, -1.8935546875, -1.72119140625, -1.548828125, -1.37646484375, -1.2041015625, -1.03173828125, -0.859375, -0.68701171875, -0.5146484375, -0.34228515625, -0.169921875, 0.00244140625, 0.1748046875, 0.34716796875, 0.51953125, 0.69189453125, 0.8642578125, 1.03662109375, 1.208984375, 1.38134765625, 1.5537109375, 1.72607421875, 1.8984375, 2.07080078125, 2.2431640625, 2.41552734375, 2.587890625, 2.76025390625, 2.9326171875, 3.10498046875, 3.27734375, 3.44970703125, 3.6220703125, 3.79443359375, 3.966796875, 4.13916015625, 4.3115234375, 4.48388671875, 4.65625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 10.0, 14.0, 7.0, 16.0, 13.0, 15.0, 22.0, 20.0, 21.0, 25.0, 27.0, 24.0, 32.0, 39.0, 34.0, 41.0, 52.0, 49.0, 41.0, 43.0, 29.0, 53.0, 45.0, 40.0, 35.0, 38.0, 22.0, 33.0, 22.0, 13.0, 25.0, 12.0, 13.0, 11.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.052734375, -2.965850830078125, -2.87896728515625, -2.792083740234375, -2.7052001953125, -2.618316650390625, -2.53143310546875, -2.444549560546875, -2.357666015625, -2.270782470703125, -2.18389892578125, -2.097015380859375, -2.0101318359375, -1.923248291015625, -1.83636474609375, -1.749481201171875, -1.66259765625, -1.575714111328125, -1.48883056640625, -1.401947021484375, -1.3150634765625, -1.228179931640625, -1.14129638671875, -1.054412841796875, -0.967529296875, -0.880645751953125, -0.79376220703125, -0.706878662109375, -0.6199951171875, -0.533111572265625, -0.44622802734375, -0.359344482421875, -0.2724609375, -0.185577392578125, -0.09869384765625, -0.011810302734375, 0.0750732421875, 0.161956787109375, 0.24884033203125, 0.335723876953125, 0.422607421875, 0.509490966796875, 0.59637451171875, 0.683258056640625, 0.7701416015625, 0.857025146484375, 0.94390869140625, 1.030792236328125, 1.11767578125, 1.204559326171875, 1.29144287109375, 1.378326416015625, 1.4652099609375, 1.552093505859375, 1.63897705078125, 1.725860595703125, 1.812744140625, 1.899627685546875, 1.98651123046875, 2.073394775390625, 2.1602783203125, 2.247161865234375, 2.33404541015625, 2.420928955078125, 2.5078125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 29.0, 34.0, 45.0, 74.0, 102.0, 171.0, 232.0, 376.0, 577.0, 905.0, 1361.0, 2128.0, 3283.0, 5203.0, 8395.0, 13655.0, 22872.0, 38670.0, 66692.0, 117931.0, 211257.0, 372398.0, 612727.0, 810640.0, 739668.0, 494160.0, 288017.0, 162159.0, 91197.0, 52108.0, 30061.0, 17832.0, 10897.0, 6661.0, 4154.0, 2649.0, 1666.0, 1098.0, 760.0, 476.0, 332.0, 202.0, 145.0, 99.0, 65.0, 50.0, 20.0, 20.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.390625, -5.220947265625, -5.05126953125, -4.881591796875, -4.7119140625, -4.542236328125, -4.37255859375, -4.202880859375, -4.033203125, -3.863525390625, -3.69384765625, -3.524169921875, -3.3544921875, -3.184814453125, -3.01513671875, -2.845458984375, -2.67578125, -2.506103515625, -2.33642578125, -2.166748046875, -1.9970703125, -1.827392578125, -1.65771484375, -1.488037109375, -1.318359375, -1.148681640625, -0.97900390625, -0.809326171875, -0.6396484375, -0.469970703125, -0.30029296875, -0.130615234375, 0.0390625, 0.208740234375, 0.37841796875, 0.548095703125, 0.7177734375, 0.887451171875, 1.05712890625, 1.226806640625, 1.396484375, 1.566162109375, 1.73583984375, 1.905517578125, 2.0751953125, 2.244873046875, 2.41455078125, 2.584228515625, 2.75390625, 2.923583984375, 3.09326171875, 3.262939453125, 3.4326171875, 3.602294921875, 3.77197265625, 3.941650390625, 4.111328125, 4.281005859375, 4.45068359375, 4.620361328125, 4.7900390625, 4.959716796875, 5.12939453125, 5.299072265625, 5.46875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 14.0, 13.0, 16.0, 13.0, 26.0, 35.0, 35.0, 30.0, 61.0, 75.0, 83.0, 98.0, 101.0, 149.0, 203.0, 193.0, 189.0, 214.0, 284.0, 264.0, 260.0, 254.0, 220.0, 190.0, 183.0, 157.0, 142.0, 109.0, 82.0, 71.0, 78.0, 50.0, 33.0, 33.0, 19.0, 16.0, 20.0, 12.0, 12.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.623046875, -1.569915771484375, -1.51678466796875, -1.463653564453125, -1.4105224609375, -1.357391357421875, -1.30426025390625, -1.251129150390625, -1.197998046875, -1.144866943359375, -1.09173583984375, -1.038604736328125, -0.9854736328125, -0.932342529296875, -0.87921142578125, -0.826080322265625, -0.77294921875, -0.719818115234375, -0.66668701171875, -0.613555908203125, -0.5604248046875, -0.507293701171875, -0.45416259765625, -0.401031494140625, -0.347900390625, -0.294769287109375, -0.24163818359375, -0.188507080078125, -0.1353759765625, -0.082244873046875, -0.02911376953125, 0.024017333984375, 0.0771484375, 0.130279541015625, 0.18341064453125, 0.236541748046875, 0.2896728515625, 0.342803955078125, 0.39593505859375, 0.449066162109375, 0.502197265625, 0.555328369140625, 0.60845947265625, 0.661590576171875, 0.7147216796875, 0.767852783203125, 0.82098388671875, 0.874114990234375, 0.92724609375, 0.980377197265625, 1.03350830078125, 1.086639404296875, 1.1397705078125, 1.192901611328125, 1.24603271484375, 1.299163818359375, 1.352294921875, 1.405426025390625, 1.45855712890625, 1.511688232421875, 1.5648193359375, 1.617950439453125, 1.67108154296875, 1.724212646484375, 1.77734375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 4.0, 4.0, 9.0, 13.0, 18.0, 15.0, 16.0, 24.0, 32.0, 34.0, 32.0, 50.0, 59.0, 52.0, 45.0, 43.0, 51.0, 50.0, 43.0, 53.0, 55.0, 52.0, 42.0, 26.0, 29.0, 28.0, 23.0, 14.0, 12.0, 11.0, 10.0, 13.0, 7.0, 3.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2430925369262695, -5.061591148376465, -4.88008975982666, -4.6985883712768555, -4.517086982727051, -4.335585594177246, -4.154084205627441, -3.9725828170776367, -3.791081428527832, -3.6095800399780273, -3.4280786514282227, -3.246577262878418, -3.0650758743286133, -2.8835744857788086, -2.702073097229004, -2.520571708679199, -2.3390703201293945, -2.15756893157959, -1.9760675430297852, -1.7945661544799805, -1.6130647659301758, -1.431563377380371, -1.2500619888305664, -1.0685606002807617, -0.887059211730957, -0.7055578231811523, -0.5240564346313477, -0.34255504608154297, -0.16105365753173828, 0.020447731018066406, 0.2019491195678711, 0.3834505081176758, 0.5649518966674805, 0.7464532852172852, 0.9279546737670898, 1.1094560623168945, 1.2909574508666992, 1.472458839416504, 1.6539602279663086, 1.8354616165161133, 2.016963005065918, 2.1984643936157227, 2.3799657821655273, 2.561467170715332, 2.7429685592651367, 2.9244699478149414, 3.105971336364746, 3.287472724914551, 3.4689741134643555, 3.65047550201416, 3.831976890563965, 4.0134782791137695, 4.194979667663574, 4.376481056213379, 4.557982444763184, 4.739483833312988, 4.920985221862793, 5.102486610412598, 5.283987998962402, 5.465489387512207, 5.646990776062012, 5.828492164611816, 6.009993553161621, 6.191494941711426, 6.3729963302612305]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 11.0, 17.0, 15.0, 8.0, 17.0, 34.0, 20.0, 18.0, 29.0, 38.0, 38.0, 33.0, 46.0, 31.0, 29.0, 45.0, 45.0, 46.0, 41.0, 37.0, 50.0, 33.0, 38.0, 35.0, 31.0, 21.0, 33.0, 16.0, 13.0, 14.0, 17.0, 19.0, 2.0, 9.0, 9.0, 12.0, 5.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.1414031982421875, -4.029458999633789, -3.9175145626068115, -3.805570363998413, -3.6936261653900146, -3.581681728363037, -3.4697375297546387, -3.3577933311462402, -3.2458488941192627, -3.1339046955108643, -3.0219602584838867, -2.9100160598754883, -2.79807186126709, -2.6861274242401123, -2.574183225631714, -2.4622387886047363, -2.350294589996338, -2.2383503913879395, -2.126405954360962, -2.0144617557525635, -1.9025174379348755, -1.7905731201171875, -1.678628921508789, -1.566684603691101, -1.4547405242919922, -1.3427962064743042, -1.2308520078659058, -1.1189076900482178, -1.0069633722305298, -0.8950191140174866, -0.7830748558044434, -0.6711305379867554, -0.5591862201690674, -0.4472419321537018, -0.3352976441383362, -0.22335338592529297, -0.11140909790992737, 0.0005351901054382324, 0.11247944831848145, 0.22442376613616943, 0.33636802434921265, 0.44831231236457825, 0.5602566003799438, 0.6722008585929871, 0.7841451168060303, 0.8960894346237183, 1.0080337524414062, 1.1199779510498047, 1.2319222688674927, 1.3438665866851807, 1.455810785293579, 1.567755103111267, 1.679699420928955, 1.7916436195373535, 1.9035879373550415, 2.0155322551727295, 2.127476453781128, 2.2394206523895264, 2.351365089416504, 2.4633092880249023, 2.575253486633301, 2.6871979236602783, 2.7991421222686768, 2.9110865592956543, 3.0230307579040527]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 12.0, 5.0, 14.0, 19.0, 27.0, 49.0, 59.0, 70.0, 137.0, 221.0, 334.0, 484.0, 769.0, 1317.0, 2010.0, 3393.0, 5778.0, 9869.0, 16975.0, 30169.0, 54598.0, 96809.0, 159514.0, 208051.0, 183464.0, 118416.0, 67481.0, 37606.0, 21276.0, 12061.0, 6941.0, 4078.0, 2457.0, 1405.0, 969.0, 622.0, 348.0, 262.0, 151.0, 113.0, 76.0, 40.0, 23.0, 27.0, 12.0, 9.0, 15.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.58251953125, -0.564697265625, -0.546875, -0.529052734375, -0.51123046875, -0.493408203125, -0.4755859375, -0.457763671875, -0.43994140625, -0.422119140625, -0.404296875, -0.386474609375, -0.36865234375, -0.350830078125, -0.3330078125, -0.315185546875, -0.29736328125, -0.279541015625, -0.26171875, -0.243896484375, -0.22607421875, -0.208251953125, -0.1904296875, -0.172607421875, -0.15478515625, -0.136962890625, -0.119140625, -0.101318359375, -0.08349609375, -0.065673828125, -0.0478515625, -0.030029296875, -0.01220703125, 0.005615234375, 0.0234375, 0.041259765625, 0.05908203125, 0.076904296875, 0.0947265625, 0.112548828125, 0.13037109375, 0.148193359375, 0.166015625, 0.183837890625, 0.20166015625, 0.219482421875, 0.2373046875, 0.255126953125, 0.27294921875, 0.290771484375, 0.30859375, 0.326416015625, 0.34423828125, 0.362060546875, 0.3798828125, 0.397705078125, 0.41552734375, 0.433349609375, 0.451171875, 0.468994140625, 0.48681640625, 0.504638671875, 0.5224609375, 0.540283203125, 0.55810546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 14.0, 17.0, 17.0, 31.0, 19.0, 27.0, 32.0, 33.0, 45.0, 48.0, 50.0, 46.0, 46.0, 49.0, 57.0, 58.0, 45.0, 50.0, 30.0, 43.0, 30.0, 26.0, 29.0, 22.0, 22.0, 22.0, 24.0, 12.0, 8.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.2186279296875, -4.066162109375, -3.9136962890625, -3.76123046875, -3.6087646484375, -3.456298828125, -3.3038330078125, -3.1513671875, -2.9989013671875, -2.846435546875, -2.6939697265625, -2.54150390625, -2.3890380859375, -2.236572265625, -2.0841064453125, -1.931640625, -1.7791748046875, -1.626708984375, -1.4742431640625, -1.32177734375, -1.1693115234375, -1.016845703125, -0.8643798828125, -0.7119140625, -0.5594482421875, -0.406982421875, -0.2545166015625, -0.10205078125, 0.0504150390625, 0.202880859375, 0.3553466796875, 0.5078125, 0.6602783203125, 0.812744140625, 0.9652099609375, 1.11767578125, 1.2701416015625, 1.422607421875, 1.5750732421875, 1.7275390625, 1.8800048828125, 2.032470703125, 2.1849365234375, 2.33740234375, 2.4898681640625, 2.642333984375, 2.7947998046875, 2.947265625, 3.0997314453125, 3.252197265625, 3.4046630859375, 3.55712890625, 3.7095947265625, 3.862060546875, 4.0145263671875, 4.1669921875, 4.3194580078125, 4.471923828125, 4.6243896484375, 4.77685546875, 4.9293212890625, 5.081787109375, 5.2342529296875, 5.38671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 15.0, 14.0, 30.0, 32.0, 40.0, 106.0, 127.0, 168.0, 258.0, 441.0, 698.0, 1220.0, 2296.0, 4421.0, 9500.0, 22672.0, 109613.0, 828059.0, 39704.0, 14855.0, 6762.0, 3215.0, 1724.0, 953.0, 576.0, 368.0, 252.0, 129.0, 101.0, 63.0, 46.0, 31.0, 20.0, 6.0, 14.0, 7.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7063446044921875, -1.648040771484375, -1.5897369384765625, -1.53143310546875, -1.4731292724609375, -1.414825439453125, -1.3565216064453125, -1.2982177734375, -1.2399139404296875, -1.181610107421875, -1.1233062744140625, -1.06500244140625, -1.0066986083984375, -0.948394775390625, -0.8900909423828125, -0.831787109375, -0.7734832763671875, -0.715179443359375, -0.6568756103515625, -0.59857177734375, -0.5402679443359375, -0.481964111328125, -0.4236602783203125, -0.3653564453125, -0.3070526123046875, -0.248748779296875, -0.1904449462890625, -0.13214111328125, -0.0738372802734375, -0.015533447265625, 0.0427703857421875, 0.10107421875, 0.1593780517578125, 0.217681884765625, 0.2759857177734375, 0.33428955078125, 0.3925933837890625, 0.450897216796875, 0.5092010498046875, 0.5675048828125, 0.6258087158203125, 0.684112548828125, 0.7424163818359375, 0.80072021484375, 0.8590240478515625, 0.917327880859375, 0.9756317138671875, 1.033935546875, 1.0922393798828125, 1.150543212890625, 1.2088470458984375, 1.26715087890625, 1.3254547119140625, 1.383758544921875, 1.4420623779296875, 1.5003662109375, 1.5586700439453125, 1.616973876953125, 1.6752777099609375, 1.73358154296875, 1.7918853759765625, 1.850189208984375, 1.9084930419921875, 1.966796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 7.0, 8.0, 15.0, 13.0, 19.0, 14.0, 19.0, 31.0, 19.0, 32.0, 40.0, 39.0, 51.0, 40.0, 36.0, 42.0, 51.0, 40.0, 46.0, 45.0, 45.0, 43.0, 39.0, 28.0, 22.0, 27.0, 34.0, 25.0, 20.0, 19.0, 13.0, 14.0, 12.0, 8.0, 7.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.3424072265625, -2.251220703125, -2.1600341796875, -2.06884765625, -1.9776611328125, -1.886474609375, -1.7952880859375, -1.7041015625, -1.6129150390625, -1.521728515625, -1.4305419921875, -1.33935546875, -1.2481689453125, -1.156982421875, -1.0657958984375, -0.974609375, -0.8834228515625, -0.792236328125, -0.7010498046875, -0.60986328125, -0.5186767578125, -0.427490234375, -0.3363037109375, -0.2451171875, -0.1539306640625, -0.062744140625, 0.0284423828125, 0.11962890625, 0.2108154296875, 0.302001953125, 0.3931884765625, 0.484375, 0.5755615234375, 0.666748046875, 0.7579345703125, 0.84912109375, 0.9403076171875, 1.031494140625, 1.1226806640625, 1.2138671875, 1.3050537109375, 1.396240234375, 1.4874267578125, 1.57861328125, 1.6697998046875, 1.760986328125, 1.8521728515625, 1.943359375, 2.0345458984375, 2.125732421875, 2.2169189453125, 2.30810546875, 2.3992919921875, 2.490478515625, 2.5816650390625, 2.6728515625, 2.7640380859375, 2.855224609375, 2.9464111328125, 3.03759765625, 3.1287841796875, 3.219970703125, 3.3111572265625, 3.40234375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 8.0, 2.0, 11.0, 8.0, 12.0, 16.0, 28.0, 41.0, 48.0, 50.0, 96.0, 131.0, 194.0, 333.0, 475.0, 793.0, 1296.0, 2049.0, 3709.0, 6809.0, 13414.0, 30020.0, 809480.0, 131997.0, 23126.0, 10830.0, 5520.0, 3199.0, 1736.0, 1107.0, 691.0, 457.0, 269.0, 210.0, 116.0, 68.0, 45.0, 50.0, 29.0, 25.0, 12.0, 15.0, 10.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.318115234375, -0.30626678466796875, -0.2944183349609375, -0.28256988525390625, -0.270721435546875, -0.25887298583984375, -0.2470245361328125, -0.23517608642578125, -0.22332763671875, -0.21147918701171875, -0.1996307373046875, -0.18778228759765625, -0.175933837890625, -0.16408538818359375, -0.1522369384765625, -0.14038848876953125, -0.1285400390625, -0.11669158935546875, -0.1048431396484375, -0.09299468994140625, -0.081146240234375, -0.06929779052734375, -0.0574493408203125, -0.04560089111328125, -0.03375244140625, -0.02190399169921875, -0.0100555419921875, 0.00179290771484375, 0.013641357421875, 0.02548980712890625, 0.0373382568359375, 0.04918670654296875, 0.06103515625, 0.07288360595703125, 0.0847320556640625, 0.09658050537109375, 0.108428955078125, 0.12027740478515625, 0.1321258544921875, 0.14397430419921875, 0.15582275390625, 0.16767120361328125, 0.1795196533203125, 0.19136810302734375, 0.203216552734375, 0.21506500244140625, 0.2269134521484375, 0.23876190185546875, 0.2506103515625, 0.26245880126953125, 0.2743072509765625, 0.28615570068359375, 0.298004150390625, 0.30985260009765625, 0.3217010498046875, 0.33354949951171875, 0.34539794921875, 0.35724639892578125, 0.3690948486328125, 0.38094329833984375, 0.392791748046875, 0.40464019775390625, 0.4164886474609375, 0.42833709716796875, 0.440185546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 12.0, 7.0, 13.0, 18.0, 16.0, 26.0, 21.0, 30.0, 19.0, 43.0, 30.0, 45.0, 41.0, 53.0, 60.0, 38.0, 54.0, 58.0, 58.0, 45.0, 45.0, 36.0, 21.0, 39.0, 24.0, 32.0, 17.0, 22.0, 13.0, 9.0, 10.0, 13.0, 4.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -3.103725612163544e-05, -3.0007213354110718e-05, -2.8977170586586e-05, -2.794712781906128e-05, -2.691708505153656e-05, -2.588704228401184e-05, -2.485699951648712e-05, -2.3826956748962402e-05, -2.2796913981437683e-05, -2.1766871213912964e-05, -2.0736828446388245e-05, -1.9706785678863525e-05, -1.8676742911338806e-05, -1.7646700143814087e-05, -1.6616657376289368e-05, -1.558661460876465e-05, -1.455657184123993e-05, -1.352652907371521e-05, -1.249648630619049e-05, -1.1466443538665771e-05, -1.0436400771141052e-05, -9.406358003616333e-06, -8.376315236091614e-06, -7.3462724685668945e-06, -6.316229701042175e-06, -5.286186933517456e-06, -4.256144165992737e-06, -3.2261013984680176e-06, -2.1960586309432983e-06, -1.166015863418579e-06, -1.3597309589385986e-07, 8.940696716308594e-07, 1.9241124391555786e-06, 2.954155206680298e-06, 3.984197974205017e-06, 5.014240741729736e-06, 6.0442835092544556e-06, 7.074326276779175e-06, 8.104369044303894e-06, 9.134411811828613e-06, 1.0164454579353333e-05, 1.1194497346878052e-05, 1.2224540114402771e-05, 1.325458288192749e-05, 1.428462564945221e-05, 1.531466841697693e-05, 1.6344711184501648e-05, 1.7374753952026367e-05, 1.8404796719551086e-05, 1.9434839487075806e-05, 2.0464882254600525e-05, 2.1494925022125244e-05, 2.2524967789649963e-05, 2.3555010557174683e-05, 2.4585053324699402e-05, 2.561509609222412e-05, 2.664513885974884e-05, 2.767518162727356e-05, 2.870522439479828e-05, 2.9735267162322998e-05, 3.076530992984772e-05, 3.1795352697372437e-05, 3.2825395464897156e-05, 3.3855438232421875e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 19.0, 22.0, 29.0, 27.0, 49.0, 53.0, 98.0, 117.0, 154.0, 238.0, 352.0, 536.0, 825.0, 1222.0, 2055.0, 3467.0, 6248.0, 11312.0, 21582.0, 43809.0, 88449.0, 170722.0, 255350.0, 209157.0, 114180.0, 56987.0, 28100.0, 14410.0, 7706.0, 4267.0, 2555.0, 1561.0, 928.0, 605.0, 404.0, 252.0, 189.0, 122.0, 77.0, 67.0, 45.0, 43.0, 27.0, 26.0, 25.0, 16.0, 13.0, 12.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 4.0], "bins": [-0.1854248046875, -0.17957305908203125, -0.1737213134765625, -0.16786956787109375, -0.162017822265625, -0.15616607666015625, -0.1503143310546875, -0.14446258544921875, -0.13861083984375, -0.13275909423828125, -0.1269073486328125, -0.12105560302734375, -0.115203857421875, -0.10935211181640625, -0.1035003662109375, -0.09764862060546875, -0.091796875, -0.08594512939453125, -0.0800933837890625, -0.07424163818359375, -0.068389892578125, -0.06253814697265625, -0.0566864013671875, -0.05083465576171875, -0.04498291015625, -0.03913116455078125, -0.0332794189453125, -0.02742767333984375, -0.021575927734375, -0.01572418212890625, -0.0098724365234375, -0.00402069091796875, 0.0018310546875, 0.00768280029296875, 0.0135345458984375, 0.01938629150390625, 0.025238037109375, 0.03108978271484375, 0.0369415283203125, 0.04279327392578125, 0.04864501953125, 0.05449676513671875, 0.0603485107421875, 0.06620025634765625, 0.072052001953125, 0.07790374755859375, 0.0837554931640625, 0.08960723876953125, 0.095458984375, 0.10131072998046875, 0.1071624755859375, 0.11301422119140625, 0.118865966796875, 0.12471771240234375, 0.1305694580078125, 0.13642120361328125, 0.14227294921875, 0.14812469482421875, 0.1539764404296875, 0.15982818603515625, 0.165679931640625, 0.17153167724609375, 0.1773834228515625, 0.18323516845703125, 0.1890869140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 3.0, 5.0, 13.0, 14.0, 17.0, 12.0, 22.0, 26.0, 24.0, 33.0, 25.0, 48.0, 44.0, 55.0, 56.0, 60.0, 73.0, 53.0, 60.0, 54.0, 28.0, 49.0, 36.0, 26.0, 27.0, 17.0, 18.0, 14.0, 15.0, 10.0, 4.0, 8.0, 4.0, 4.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03509521484375, -0.033934593200683594, -0.03277397155761719, -0.03161334991455078, -0.030452728271484375, -0.02929210662841797, -0.028131484985351562, -0.026970863342285156, -0.02581024169921875, -0.024649620056152344, -0.023488998413085938, -0.02232837677001953, -0.021167755126953125, -0.02000713348388672, -0.018846511840820312, -0.017685890197753906, -0.0165252685546875, -0.015364646911621094, -0.014204025268554688, -0.013043403625488281, -0.011882781982421875, -0.010722160339355469, -0.009561538696289062, -0.008400917053222656, -0.00724029541015625, -0.006079673767089844, -0.0049190521240234375, -0.0037584304809570312, -0.002597808837890625, -0.0014371871948242188, -0.0002765655517578125, 0.0008840560913085938, 0.002044677734375, 0.0032052993774414062, 0.0043659210205078125, 0.005526542663574219, 0.006687164306640625, 0.007847785949707031, 0.009008407592773438, 0.010169029235839844, 0.01132965087890625, 0.012490272521972656, 0.013650894165039062, 0.014811515808105469, 0.015972137451171875, 0.01713275909423828, 0.018293380737304688, 0.019454002380371094, 0.0206146240234375, 0.021775245666503906, 0.022935867309570312, 0.02409648895263672, 0.025257110595703125, 0.02641773223876953, 0.027578353881835938, 0.028738975524902344, 0.02989959716796875, 0.031060218811035156, 0.03222084045410156, 0.03338146209716797, 0.034542083740234375, 0.03570270538330078, 0.03686332702636719, 0.038023948669433594, 0.0391845703125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 3.0, 11.0, 14.0, 16.0, 14.0, 17.0, 27.0, 28.0, 43.0, 31.0, 51.0, 60.0, 55.0, 45.0, 44.0, 56.0, 44.0, 46.0, 60.0, 49.0, 45.0, 43.0, 32.0, 23.0, 28.0, 16.0, 14.0, 13.0, 12.0, 13.0, 8.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.221388816833496, -5.038038730621338, -4.85468864440918, -4.6713385581970215, -4.487988471984863, -4.304637908935547, -4.121288299560547, -3.9379377365112305, -3.7545876502990723, -3.571237564086914, -3.387887477874756, -3.2045373916625977, -3.0211870670318604, -2.837836980819702, -2.654486894607544, -2.4711365699768066, -2.2877867221832275, -2.1044366359710693, -1.9210864305496216, -1.7377363443374634, -1.5543861389160156, -1.3710360527038574, -1.1876859664916992, -1.0043357610702515, -0.8209856748580933, -0.6376355290412903, -0.4542854130268097, -0.2709352970123291, -0.08758515119552612, 0.09576499462127686, 0.27911508083343506, 0.4624652862548828, 0.645815372467041, 0.829165518283844, 1.012515664100647, 1.1958657503128052, 1.379215955734253, 1.5625660419464111, 1.7459161281585693, 1.929266333580017, 2.112616539001465, 2.295966625213623, 2.4793167114257812, 2.6626667976379395, 2.8460171222686768, 3.029367208480835, 3.212717294692993, 3.3960676193237305, 3.5794174671173096, 3.7627675533294678, 3.946117639541626, 4.129467964172363, 4.3128180503845215, 4.49616813659668, 4.679518222808838, 4.862868309020996, 5.046218395233154, 5.2295684814453125, 5.412918567657471, 5.596268653869629, 5.779618740081787, 5.962968826293945, 6.146319389343262, 6.32966947555542, 6.513019561767578]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 11.0, 17.0, 11.0, 14.0, 15.0, 31.0, 22.0, 18.0, 29.0, 39.0, 38.0, 36.0, 43.0, 29.0, 32.0, 45.0, 45.0, 44.0, 41.0, 36.0, 54.0, 34.0, 34.0, 33.0, 34.0, 21.0, 30.0, 19.0, 12.0, 15.0, 17.0, 18.0, 3.0, 10.0, 7.0, 11.0, 9.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.09265661239624, -3.9814138412475586, -3.870170831680298, -3.758928060531616, -3.6476850509643555, -3.536442279815674, -3.425199508666992, -3.3139567375183105, -3.20271372795105, -3.091470956802368, -2.9802279472351074, -2.868985176086426, -2.757742404937744, -2.6464993953704834, -2.5352566242218018, -2.424013614654541, -2.3127708435058594, -2.2015280723571777, -2.090285062789917, -1.9790422916412354, -1.8677994012832642, -1.756556510925293, -1.6453137397766113, -1.5340708494186401, -1.422827959060669, -1.3115850687026978, -1.2003421783447266, -1.089099407196045, -0.9778565168380737, -0.8666136264801025, -0.7553707957267761, -0.6441279649734497, -0.5328850746154785, -0.4216422140598297, -0.3103993535041809, -0.1991564929485321, -0.0879136323928833, 0.02332925796508789, 0.1345720887184143, 0.24581491947174072, 0.3570578098297119, 0.4683006703853607, 0.5795435309410095, 0.6907863616943359, 0.8020292520523071, 0.9132721424102783, 1.02451491355896, 1.1357578039169312, 1.2470006942749023, 1.3582435846328735, 1.4694864749908447, 1.5807292461395264, 1.6919721364974976, 1.8032150268554688, 1.9144577980041504, 2.025700569152832, 2.1369435787200928, 2.2481863498687744, 2.359429359436035, 2.470672130584717, 2.5819149017333984, 2.693157911300659, 2.804400682449341, 2.9156436920166016, 3.026886463165283]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 6.0, 14.0, 15.0, 26.0, 43.0, 64.0, 86.0, 149.0, 210.0, 388.0, 666.0, 1034.0, 1773.0, 3069.0, 5580.0, 10332.0, 19473.0, 36804.0, 66839.0, 112644.0, 165928.0, 190714.0, 167139.0, 115680.0, 68165.0, 37485.0, 20077.0, 10823.0, 5652.0, 3185.0, 1798.0, 1030.0, 626.0, 379.0, 244.0, 139.0, 78.0, 56.0, 60.0, 30.0, 17.0, 8.0, 9.0, 6.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.0797119140625, -4.901611328125, -4.7235107421875, -4.54541015625, -4.3673095703125, -4.189208984375, -4.0111083984375, -3.8330078125, -3.6549072265625, -3.476806640625, -3.2987060546875, -3.12060546875, -2.9425048828125, -2.764404296875, -2.5863037109375, -2.408203125, -2.2301025390625, -2.052001953125, -1.8739013671875, -1.69580078125, -1.5177001953125, -1.339599609375, -1.1614990234375, -0.9833984375, -0.8052978515625, -0.627197265625, -0.4490966796875, -0.27099609375, -0.0928955078125, 0.085205078125, 0.2633056640625, 0.44140625, 0.6195068359375, 0.797607421875, 0.9757080078125, 1.15380859375, 1.3319091796875, 1.510009765625, 1.6881103515625, 1.8662109375, 2.0443115234375, 2.222412109375, 2.4005126953125, 2.57861328125, 2.7567138671875, 2.934814453125, 3.1129150390625, 3.291015625, 3.4691162109375, 3.647216796875, 3.8253173828125, 4.00341796875, 4.1815185546875, 4.359619140625, 4.5377197265625, 4.7158203125, 4.8939208984375, 5.072021484375, 5.2501220703125, 5.42822265625, 5.6063232421875, 5.784423828125, 5.9625244140625, 6.140625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 4.0, 7.0, 14.0, 10.0, 21.0, 29.0, 20.0, 21.0, 21.0, 30.0, 38.0, 43.0, 41.0, 40.0, 55.0, 46.0, 51.0, 61.0, 41.0, 59.0, 50.0, 42.0, 47.0, 33.0, 32.0, 24.0, 23.0, 15.0, 15.0, 14.0, 6.0, 12.0, 8.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.30718994140625, -4.1612548828125, -4.01531982421875, -3.869384765625, -3.72344970703125, -3.5775146484375, -3.43157958984375, -3.28564453125, -3.13970947265625, -2.9937744140625, -2.84783935546875, -2.701904296875, -2.55596923828125, -2.4100341796875, -2.26409912109375, -2.1181640625, -1.97222900390625, -1.8262939453125, -1.68035888671875, -1.534423828125, -1.38848876953125, -1.2425537109375, -1.09661865234375, -0.95068359375, -0.80474853515625, -0.6588134765625, -0.51287841796875, -0.366943359375, -0.22100830078125, -0.0750732421875, 0.07086181640625, 0.216796875, 0.36273193359375, 0.5086669921875, 0.65460205078125, 0.800537109375, 0.94647216796875, 1.0924072265625, 1.23834228515625, 1.38427734375, 1.53021240234375, 1.6761474609375, 1.82208251953125, 1.968017578125, 2.11395263671875, 2.2598876953125, 2.40582275390625, 2.5517578125, 2.69769287109375, 2.8436279296875, 2.98956298828125, 3.135498046875, 3.28143310546875, 3.4273681640625, 3.57330322265625, 3.71923828125, 3.86517333984375, 4.0111083984375, 4.15704345703125, 4.302978515625, 4.44891357421875, 4.5948486328125, 4.74078369140625, 4.88671875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 13.0, 12.0, 12.0, 17.0, 36.0, 33.0, 57.0, 79.0, 103.0, 196.0, 287.0, 405.0, 625.0, 1023.0, 1771.0, 3011.0, 5222.0, 9895.0, 17824.0, 34005.0, 62454.0, 107475.0, 161693.0, 193809.0, 173018.0, 119502.0, 70579.0, 38764.0, 20876.0, 11102.0, 6040.0, 3415.0, 1926.0, 1179.0, 701.0, 470.0, 318.0, 195.0, 133.0, 86.0, 56.0, 39.0, 38.0, 22.0, 13.0, 9.0, 4.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.67779541015625, -5.4923095703125, -5.30682373046875, -5.121337890625, -4.93585205078125, -4.7503662109375, -4.56488037109375, -4.37939453125, -4.19390869140625, -4.0084228515625, -3.82293701171875, -3.637451171875, -3.45196533203125, -3.2664794921875, -3.08099365234375, -2.8955078125, -2.71002197265625, -2.5245361328125, -2.33905029296875, -2.153564453125, -1.96807861328125, -1.7825927734375, -1.59710693359375, -1.41162109375, -1.22613525390625, -1.0406494140625, -0.85516357421875, -0.669677734375, -0.48419189453125, -0.2987060546875, -0.11322021484375, 0.072265625, 0.25775146484375, 0.4432373046875, 0.62872314453125, 0.814208984375, 0.99969482421875, 1.1851806640625, 1.37066650390625, 1.55615234375, 1.74163818359375, 1.9271240234375, 2.11260986328125, 2.298095703125, 2.48358154296875, 2.6690673828125, 2.85455322265625, 3.0400390625, 3.22552490234375, 3.4110107421875, 3.59649658203125, 3.781982421875, 3.96746826171875, 4.1529541015625, 4.33843994140625, 4.52392578125, 4.70941162109375, 4.8948974609375, 5.08038330078125, 5.265869140625, 5.45135498046875, 5.6368408203125, 5.82232666015625, 6.0078125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 4.0, 10.0, 4.0, 12.0, 13.0, 9.0, 19.0, 10.0, 15.0, 18.0, 31.0, 23.0, 33.0, 36.0, 43.0, 42.0, 47.0, 33.0, 43.0, 45.0, 34.0, 37.0, 41.0, 37.0, 44.0, 33.0, 30.0, 23.0, 35.0, 27.0, 23.0, 24.0, 16.0, 20.0, 20.0, 10.0, 15.0, 9.0, 3.0, 9.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.111328125, -2.038421630859375, -1.96551513671875, -1.892608642578125, -1.8197021484375, -1.746795654296875, -1.67388916015625, -1.600982666015625, -1.528076171875, -1.455169677734375, -1.38226318359375, -1.309356689453125, -1.2364501953125, -1.163543701171875, -1.09063720703125, -1.017730712890625, -0.94482421875, -0.871917724609375, -0.79901123046875, -0.726104736328125, -0.6531982421875, -0.580291748046875, -0.50738525390625, -0.434478759765625, -0.361572265625, -0.288665771484375, -0.21575927734375, -0.142852783203125, -0.0699462890625, 0.002960205078125, 0.07586669921875, 0.148773193359375, 0.2216796875, 0.294586181640625, 0.36749267578125, 0.440399169921875, 0.5133056640625, 0.586212158203125, 0.65911865234375, 0.732025146484375, 0.804931640625, 0.877838134765625, 0.95074462890625, 1.023651123046875, 1.0965576171875, 1.169464111328125, 1.24237060546875, 1.315277099609375, 1.38818359375, 1.461090087890625, 1.53399658203125, 1.606903076171875, 1.6798095703125, 1.752716064453125, 1.82562255859375, 1.898529052734375, 1.971435546875, 2.044342041015625, 2.11724853515625, 2.190155029296875, 2.2630615234375, 2.335968017578125, 2.40887451171875, 2.481781005859375, 2.5546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 6.0, 4.0, 4.0, 9.0, 15.0, 19.0, 30.0, 41.0, 49.0, 97.0, 105.0, 151.0, 219.0, 380.0, 521.0, 824.0, 1320.0, 1920.0, 3121.0, 4948.0, 7873.0, 12922.0, 21075.0, 33874.0, 54983.0, 84998.0, 120953.0, 149523.0, 154529.0, 130626.0, 95465.0, 63379.0, 39858.0, 24656.0, 14939.0, 9342.0, 5648.0, 3578.0, 2248.0, 1489.0, 951.0, 647.0, 403.0, 258.0, 175.0, 116.0, 92.0, 61.0, 29.0, 37.0, 16.0, 11.0, 10.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-2.416015625, -2.338470458984375, -2.26092529296875, -2.183380126953125, -2.1058349609375, -2.028289794921875, -1.95074462890625, -1.873199462890625, -1.795654296875, -1.718109130859375, -1.64056396484375, -1.563018798828125, -1.4854736328125, -1.407928466796875, -1.33038330078125, -1.252838134765625, -1.17529296875, -1.097747802734375, -1.02020263671875, -0.942657470703125, -0.8651123046875, -0.787567138671875, -0.71002197265625, -0.632476806640625, -0.554931640625, -0.477386474609375, -0.39984130859375, -0.322296142578125, -0.2447509765625, -0.167205810546875, -0.08966064453125, -0.012115478515625, 0.0654296875, 0.142974853515625, 0.22052001953125, 0.298065185546875, 0.3756103515625, 0.453155517578125, 0.53070068359375, 0.608245849609375, 0.685791015625, 0.763336181640625, 0.84088134765625, 0.918426513671875, 0.9959716796875, 1.073516845703125, 1.15106201171875, 1.228607177734375, 1.30615234375, 1.383697509765625, 1.46124267578125, 1.538787841796875, 1.6163330078125, 1.693878173828125, 1.77142333984375, 1.848968505859375, 1.926513671875, 2.004058837890625, 2.08160400390625, 2.159149169921875, 2.2366943359375, 2.314239501953125, 2.39178466796875, 2.469329833984375, 2.546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 3.0, 7.0, 27.0, 8.0, 19.0, 19.0, 26.0, 33.0, 38.0, 53.0, 46.0, 32.0, 55.0, 73.0, 52.0, 71.0, 59.0, 59.0, 60.0, 44.0, 42.0, 24.0, 27.0, 28.0, 19.0, 12.0, 9.0, 11.0, 3.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003180503845214844, -0.0003085136413574219, -0.0002989768981933594, -0.0002894401550292969, -0.0002799034118652344, -0.0002703666687011719, -0.0002608299255371094, -0.0002512931823730469, -0.00024175643920898438, -0.00023221969604492188, -0.00022268295288085938, -0.00021314620971679688, -0.00020360946655273438, -0.00019407272338867188, -0.00018453598022460938, -0.00017499923706054688, -0.00016546249389648438, -0.00015592575073242188, -0.00014638900756835938, -0.00013685226440429688, -0.00012731552124023438, -0.00011777877807617188, -0.00010824203491210938, -9.870529174804688e-05, -8.916854858398438e-05, -7.963180541992188e-05, -7.009506225585938e-05, -6.0558319091796875e-05, -5.1021575927734375e-05, -4.1484832763671875e-05, -3.1948089599609375e-05, -2.2411346435546875e-05, -1.2874603271484375e-05, -3.337860107421875e-06, 6.198883056640625e-06, 1.5735626220703125e-05, 2.5272369384765625e-05, 3.4809112548828125e-05, 4.4345855712890625e-05, 5.3882598876953125e-05, 6.341934204101562e-05, 7.295608520507812e-05, 8.249282836914062e-05, 9.202957153320312e-05, 0.00010156631469726562, 0.00011110305786132812, 0.00012063980102539062, 0.00013017654418945312, 0.00013971328735351562, 0.00014925003051757812, 0.00015878677368164062, 0.00016832351684570312, 0.00017786026000976562, 0.00018739700317382812, 0.00019693374633789062, 0.00020647048950195312, 0.00021600723266601562, 0.00022554397583007812, 0.00023508071899414062, 0.0002446174621582031, 0.0002541542053222656, 0.0002636909484863281, 0.0002732276916503906, 0.0002827644348144531, 0.0002923011779785156]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 9.0, 13.0, 20.0, 29.0, 43.0, 50.0, 76.0, 117.0, 158.0, 252.0, 329.0, 542.0, 732.0, 1074.0, 1620.0, 2381.0, 3554.0, 5402.0, 8293.0, 12755.0, 20154.0, 31505.0, 48395.0, 72817.0, 102931.0, 130820.0, 143108.0, 133325.0, 106192.0, 76229.0, 50986.0, 33601.0, 21440.0, 13552.0, 8722.0, 5735.0, 3718.0, 2596.0, 1653.0, 1149.0, 764.0, 535.0, 368.0, 250.0, 177.0, 119.0, 85.0, 58.0, 33.0, 35.0, 24.0, 8.0, 11.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.0606689453125, -1.988525390625, -1.9163818359375, -1.84423828125, -1.7720947265625, -1.699951171875, -1.6278076171875, -1.5556640625, -1.4835205078125, -1.411376953125, -1.3392333984375, -1.26708984375, -1.1949462890625, -1.122802734375, -1.0506591796875, -0.978515625, -0.9063720703125, -0.834228515625, -0.7620849609375, -0.68994140625, -0.6177978515625, -0.545654296875, -0.4735107421875, -0.4013671875, -0.3292236328125, -0.257080078125, -0.1849365234375, -0.11279296875, -0.0406494140625, 0.031494140625, 0.1036376953125, 0.17578125, 0.2479248046875, 0.320068359375, 0.3922119140625, 0.46435546875, 0.5364990234375, 0.608642578125, 0.6807861328125, 0.7529296875, 0.8250732421875, 0.897216796875, 0.9693603515625, 1.04150390625, 1.1136474609375, 1.185791015625, 1.2579345703125, 1.330078125, 1.4022216796875, 1.474365234375, 1.5465087890625, 1.61865234375, 1.6907958984375, 1.762939453125, 1.8350830078125, 1.9072265625, 1.9793701171875, 2.051513671875, 2.1236572265625, 2.19580078125, 2.2679443359375, 2.340087890625, 2.4122314453125, 2.484375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 7.0, 5.0, 9.0, 7.0, 8.0, 6.0, 20.0, 25.0, 31.0, 15.0, 28.0, 25.0, 35.0, 47.0, 43.0, 40.0, 46.0, 52.0, 55.0, 52.0, 47.0, 58.0, 51.0, 37.0, 36.0, 31.0, 32.0, 26.0, 19.0, 15.0, 16.0, 16.0, 10.0, 7.0, 5.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.71044921875, -0.686431884765625, -0.66241455078125, -0.638397216796875, -0.6143798828125, -0.590362548828125, -0.56634521484375, -0.542327880859375, -0.518310546875, -0.494293212890625, -0.47027587890625, -0.446258544921875, -0.4222412109375, -0.398223876953125, -0.37420654296875, -0.350189208984375, -0.326171875, -0.302154541015625, -0.27813720703125, -0.254119873046875, -0.2301025390625, -0.206085205078125, -0.18206787109375, -0.158050537109375, -0.134033203125, -0.110015869140625, -0.08599853515625, -0.061981201171875, -0.0379638671875, -0.013946533203125, 0.01007080078125, 0.034088134765625, 0.05810546875, 0.082122802734375, 0.10614013671875, 0.130157470703125, 0.1541748046875, 0.178192138671875, 0.20220947265625, 0.226226806640625, 0.250244140625, 0.274261474609375, 0.29827880859375, 0.322296142578125, 0.3463134765625, 0.370330810546875, 0.39434814453125, 0.418365478515625, 0.4423828125, 0.466400146484375, 0.49041748046875, 0.514434814453125, 0.5384521484375, 0.562469482421875, 0.58648681640625, 0.610504150390625, 0.634521484375, 0.658538818359375, 0.68255615234375, 0.706573486328125, 0.7305908203125, 0.754608154296875, 0.77862548828125, 0.802642822265625, 0.82666015625]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 6.0, 7.0, 4.0, 2.0, 10.0, 10.0, 15.0, 20.0, 19.0, 21.0, 19.0, 27.0, 44.0, 30.0, 38.0, 36.0, 50.0, 59.0, 59.0, 51.0, 50.0, 51.0, 53.0, 51.0, 29.0, 39.0, 38.0, 29.0, 28.0, 20.0, 22.0, 14.0, 11.0, 6.0, 10.0, 10.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.928782939910889, -4.745309829711914, -4.5618367195129395, -4.378363609313965, -4.19489049911499, -4.011417388916016, -3.827944040298462, -3.6444709300994873, -3.4609978199005127, -3.277524709701538, -3.0940515995025635, -2.9105782508850098, -2.727105140686035, -2.5436320304870605, -2.360158920288086, -2.1766858100891113, -1.9932126998901367, -1.809739589691162, -1.6262664794921875, -1.4427932500839233, -1.2593201398849487, -1.0758470296859741, -0.89237380027771, -0.7089006900787354, -0.5254275798797607, -0.34195443987846375, -0.15848129987716675, 0.024991869926452637, 0.20846498012542725, 0.39193809032440186, 0.575411319732666, 0.7588844299316406, 0.9423580169677734, 1.125831127166748, 1.3093042373657227, 1.4927774667739868, 1.6762505769729614, 1.859723687171936, 2.0431969165802, 2.226670026779175, 2.4101431369781494, 2.593616247177124, 2.7770893573760986, 2.9605627059936523, 3.144035816192627, 3.3275089263916016, 3.510982036590576, 3.694455146789551, 3.8779282569885254, 4.0614013671875, 4.244874477386475, 4.428347587585449, 4.611820697784424, 4.795293807983398, 4.978767395019531, 5.162240028381348, 5.3457136154174805, 5.529186725616455, 5.71265983581543, 5.896132946014404, 6.079606056213379, 6.2630791664123535, 6.446552276611328, 6.630025863647461, 6.813498497009277]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 14.0, 16.0, 13.0, 15.0, 15.0, 19.0, 22.0, 22.0, 20.0, 34.0, 28.0, 40.0, 36.0, 26.0, 35.0, 54.0, 39.0, 50.0, 44.0, 42.0, 44.0, 35.0, 29.0, 24.0, 31.0, 32.0, 22.0, 17.0, 18.0, 24.0, 16.0, 12.0, 16.0, 12.0, 16.0, 6.0, 5.0, 3.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-3.8244690895080566, -3.712723970413208, -3.6009790897369385, -3.48923397064209, -3.3774890899658203, -3.2657439708709717, -3.153998851776123, -3.0422539710998535, -2.930508852005005, -2.8187637329101562, -2.7070188522338867, -2.595273733139038, -2.4835286140441895, -2.37178373336792, -2.2600386142730713, -2.1482934951782227, -2.036548614501953, -1.924803614616394, -1.813058614730835, -1.7013134956359863, -1.5895684957504272, -1.4778234958648682, -1.3660783767700195, -1.2543333768844604, -1.1425883769989014, -1.0308433771133423, -0.9190983176231384, -0.8073532581329346, -0.6956082582473755, -0.5838632583618164, -0.47211819887161255, -0.3603731393814087, -0.2486283779144287, -0.13688334822654724, -0.02513831853866577, 0.0866067111492157, 0.19835174083709717, 0.31009674072265625, 0.4218418002128601, 0.533586859703064, 0.645331859588623, 0.7570768594741821, 0.868821918964386, 0.9805669784545898, 1.092311978340149, 1.204056978225708, 1.3158020973205566, 1.4275470972061157, 1.5392920970916748, 1.6510370969772339, 1.762782096862793, 1.8745272159576416, 1.9862722158432007, 2.0980172157287598, 2.2097623348236084, 2.321507453918457, 2.4332523345947266, 2.544997453689575, 2.6567423343658447, 2.7684874534606934, 2.880232334136963, 2.9919774532318115, 3.10372257232666, 3.2154674530029297, 3.3272125720977783]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 22.0, 22.0, 39.0, 53.0, 64.0, 109.0, 174.0, 267.0, 385.0, 587.0, 891.0, 1554.0, 2707.0, 4293.0, 7585.0, 13128.0, 24379.0, 45902.0, 90837.0, 189045.0, 405765.0, 788998.0, 1039414.0, 785845.0, 406213.0, 191629.0, 92727.0, 46413.0, 24488.0, 13014.0, 7417.0, 4140.0, 2458.0, 1417.0, 881.0, 542.0, 325.0, 200.0, 122.0, 85.0, 46.0, 27.0, 19.0, 14.0, 8.0, 5.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.90234375, -6.6962890625, -6.490234375, -6.2841796875, -6.078125, -5.8720703125, -5.666015625, -5.4599609375, -5.25390625, -5.0478515625, -4.841796875, -4.6357421875, -4.4296875, -4.2236328125, -4.017578125, -3.8115234375, -3.60546875, -3.3994140625, -3.193359375, -2.9873046875, -2.78125, -2.5751953125, -2.369140625, -2.1630859375, -1.95703125, -1.7509765625, -1.544921875, -1.3388671875, -1.1328125, -0.9267578125, -0.720703125, -0.5146484375, -0.30859375, -0.1025390625, 0.103515625, 0.3095703125, 0.515625, 0.7216796875, 0.927734375, 1.1337890625, 1.33984375, 1.5458984375, 1.751953125, 1.9580078125, 2.1640625, 2.3701171875, 2.576171875, 2.7822265625, 2.98828125, 3.1943359375, 3.400390625, 3.6064453125, 3.8125, 4.0185546875, 4.224609375, 4.4306640625, 4.63671875, 4.8427734375, 5.048828125, 5.2548828125, 5.4609375, 5.6669921875, 5.873046875, 6.0791015625, 6.28515625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 9.0, 18.0, 21.0, 21.0, 21.0, 14.0, 33.0, 41.0, 39.0, 29.0, 44.0, 51.0, 48.0, 45.0, 50.0, 60.0, 52.0, 48.0, 29.0, 46.0, 39.0, 31.0, 30.0, 20.0, 23.0, 15.0, 17.0, 20.0, 11.0, 9.0, 3.0, 8.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.701171875, -3.58648681640625, -3.4718017578125, -3.35711669921875, -3.242431640625, -3.12774658203125, -3.0130615234375, -2.89837646484375, -2.78369140625, -2.66900634765625, -2.5543212890625, -2.43963623046875, -2.324951171875, -2.21026611328125, -2.0955810546875, -1.98089599609375, -1.8662109375, -1.75152587890625, -1.6368408203125, -1.52215576171875, -1.407470703125, -1.29278564453125, -1.1781005859375, -1.06341552734375, -0.94873046875, -0.83404541015625, -0.7193603515625, -0.60467529296875, -0.489990234375, -0.37530517578125, -0.2606201171875, -0.14593505859375, -0.03125, 0.08343505859375, 0.1981201171875, 0.31280517578125, 0.427490234375, 0.54217529296875, 0.6568603515625, 0.77154541015625, 0.88623046875, 1.00091552734375, 1.1156005859375, 1.23028564453125, 1.344970703125, 1.45965576171875, 1.5743408203125, 1.68902587890625, 1.8037109375, 1.91839599609375, 2.0330810546875, 2.14776611328125, 2.262451171875, 2.37713623046875, 2.4918212890625, 2.60650634765625, 2.72119140625, 2.83587646484375, 2.9505615234375, 3.06524658203125, 3.179931640625, 3.29461669921875, 3.4093017578125, 3.52398681640625, 3.638671875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 25.0, 35.0, 48.0, 71.0, 115.0, 195.0, 239.0, 417.0, 589.0, 984.0, 1403.0, 2121.0, 3284.0, 5206.0, 8142.0, 13094.0, 21577.0, 35271.0, 59213.0, 99988.0, 168750.0, 285494.0, 459535.0, 654453.0, 734496.0, 608889.0, 410282.0, 251651.0, 147935.0, 86820.0, 52016.0, 30878.0, 18989.0, 11692.0, 7347.0, 4578.0, 2913.0, 1904.0, 1240.0, 843.0, 519.0, 366.0, 215.0, 147.0, 97.0, 71.0, 46.0, 20.0, 19.0, 20.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.765625, -5.58184814453125, -5.3980712890625, -5.21429443359375, -5.030517578125, -4.84674072265625, -4.6629638671875, -4.47918701171875, -4.29541015625, -4.11163330078125, -3.9278564453125, -3.74407958984375, -3.560302734375, -3.37652587890625, -3.1927490234375, -3.00897216796875, -2.8251953125, -2.64141845703125, -2.4576416015625, -2.27386474609375, -2.090087890625, -1.90631103515625, -1.7225341796875, -1.53875732421875, -1.35498046875, -1.17120361328125, -0.9874267578125, -0.80364990234375, -0.619873046875, -0.43609619140625, -0.2523193359375, -0.06854248046875, 0.115234375, 0.29901123046875, 0.4827880859375, 0.66656494140625, 0.850341796875, 1.03411865234375, 1.2178955078125, 1.40167236328125, 1.58544921875, 1.76922607421875, 1.9530029296875, 2.13677978515625, 2.320556640625, 2.50433349609375, 2.6881103515625, 2.87188720703125, 3.0556640625, 3.23944091796875, 3.4232177734375, 3.60699462890625, 3.790771484375, 3.97454833984375, 4.1583251953125, 4.34210205078125, 4.52587890625, 4.70965576171875, 4.8934326171875, 5.07720947265625, 5.260986328125, 5.44476318359375, 5.6285400390625, 5.81231689453125, 5.99609375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 6.0, 9.0, 13.0, 12.0, 22.0, 30.0, 45.0, 40.0, 50.0, 70.0, 94.0, 135.0, 137.0, 162.0, 171.0, 233.0, 233.0, 258.0, 284.0, 266.0, 240.0, 232.0, 237.0, 215.0, 197.0, 143.0, 119.0, 89.0, 81.0, 56.0, 44.0, 30.0, 25.0, 19.0, 14.0, 15.0, 8.0, 5.0, 6.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.02386474609375, -1.9559326171875, -1.88800048828125, -1.820068359375, -1.75213623046875, -1.6842041015625, -1.61627197265625, -1.54833984375, -1.48040771484375, -1.4124755859375, -1.34454345703125, -1.276611328125, -1.20867919921875, -1.1407470703125, -1.07281494140625, -1.0048828125, -0.93695068359375, -0.8690185546875, -0.80108642578125, -0.733154296875, -0.66522216796875, -0.5972900390625, -0.52935791015625, -0.46142578125, -0.39349365234375, -0.3255615234375, -0.25762939453125, -0.189697265625, -0.12176513671875, -0.0538330078125, 0.01409912109375, 0.08203125, 0.14996337890625, 0.2178955078125, 0.28582763671875, 0.353759765625, 0.42169189453125, 0.4896240234375, 0.55755615234375, 0.62548828125, 0.69342041015625, 0.7613525390625, 0.82928466796875, 0.897216796875, 0.96514892578125, 1.0330810546875, 1.10101318359375, 1.1689453125, 1.23687744140625, 1.3048095703125, 1.37274169921875, 1.440673828125, 1.50860595703125, 1.5765380859375, 1.64447021484375, 1.71240234375, 1.78033447265625, 1.8482666015625, 1.91619873046875, 1.984130859375, 2.05206298828125, 2.1199951171875, 2.18792724609375, 2.255859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 9.0, 11.0, 10.0, 19.0, 16.0, 34.0, 29.0, 49.0, 42.0, 54.0, 57.0, 73.0, 62.0, 62.0, 52.0, 67.0, 65.0, 53.0, 38.0, 35.0, 36.0, 26.0, 33.0, 14.0, 10.0, 14.0, 6.0, 6.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.956415176391602, -7.686728477478027, -7.417041778564453, -7.147355079650879, -6.877668380737305, -6.6079816818237305, -6.338294982910156, -6.068608283996582, -5.798921585083008, -5.529234886169434, -5.259548187255859, -4.989861488342285, -4.720174789428711, -4.450488090515137, -4.1808013916015625, -3.9111149311065674, -3.6414284706115723, -3.371741771697998, -3.102055072784424, -2.8323683738708496, -2.5626816749572754, -2.292994976043701, -2.023308515548706, -1.7536218166351318, -1.4839351177215576, -1.2142484188079834, -0.944561779499054, -0.6748751401901245, -0.4051884412765503, -0.13550174236297607, 0.1341848373413086, 0.4038715362548828, 0.673558235168457, 0.9432449340820312, 1.2129316329956055, 1.4826182126998901, 1.7523049116134644, 2.021991729736328, 2.2916781902313232, 2.5613648891448975, 2.8310515880584717, 3.100738286972046, 3.37042498588562, 3.6401114463806152, 3.9097981452941895, 4.179484844207764, 4.449171543121338, 4.718858242034912, 4.988544940948486, 5.2582316398620605, 5.527918338775635, 5.797605037689209, 6.067291736602783, 6.336978435516357, 6.606664657592773, 6.876351356506348, 7.146038055419922, 7.415724754333496, 7.68541145324707, 7.9550981521606445, 8.224784851074219, 8.494471549987793, 8.764158248901367, 9.033844947814941, 9.303531646728516]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 7.0, 9.0, 7.0, 12.0, 11.0, 17.0, 12.0, 22.0, 22.0, 34.0, 20.0, 25.0, 39.0, 41.0, 30.0, 32.0, 33.0, 47.0, 47.0, 38.0, 46.0, 41.0, 50.0, 36.0, 40.0, 38.0, 36.0, 29.0, 20.0, 25.0, 17.0, 21.0, 18.0, 18.0, 14.0, 7.0, 8.0, 7.0, 5.0, 2.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.775452136993408, -4.6400041580200195, -4.504555702209473, -4.369107723236084, -4.233659744262695, -4.098211288452148, -3.9627633094787598, -3.827315092086792, -3.691866874694824, -3.5564186573028564, -3.4209704399108887, -3.2855224609375, -3.1500742435455322, -3.0146260261535645, -2.879178047180176, -2.743729829788208, -2.6082816123962402, -2.4728333950042725, -2.3373851776123047, -2.201937198638916, -2.0664889812469482, -1.9310407638549805, -1.7955926656723022, -1.660144567489624, -1.5246963500976562, -1.3892481327056885, -1.2538000345230103, -1.118351936340332, -0.9829037189483643, -0.8474555611610413, -0.7120074033737183, -0.5765592455863953, -0.44111084938049316, -0.30566269159317017, -0.17021453380584717, -0.03476637601852417, 0.10068178176879883, 0.23612993955612183, 0.3715780973434448, 0.5070262551307678, 0.6424744129180908, 0.7779225707054138, 0.9133707284927368, 1.048818826675415, 1.1842670440673828, 1.3197152614593506, 1.4551633596420288, 1.590611457824707, 1.7260596752166748, 1.8615078926086426, 1.9969559907913208, 2.132404088973999, 2.267852306365967, 2.4033005237579346, 2.5387487411499023, 2.674196720123291, 2.809644937515259, 2.9450931549072266, 3.0805411338806152, 3.215989351272583, 3.351437568664551, 3.4868857860565186, 3.6223340034484863, 3.757781982421875, 3.8932301998138428]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 10.0, 10.0, 27.0, 44.0, 59.0, 81.0, 155.0, 196.0, 344.0, 539.0, 967.0, 1597.0, 2658.0, 4677.0, 8303.0, 14445.0, 25468.0, 45088.0, 76950.0, 126681.0, 178772.0, 189858.0, 147354.0, 94600.0, 55407.0, 31703.0, 17956.0, 10395.0, 5807.0, 3459.0, 1920.0, 1151.0, 690.0, 462.0, 254.0, 165.0, 112.0, 73.0, 48.0, 24.0, 19.0, 14.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5245132446289062, -0.5065460205078125, -0.48857879638671875, -0.470611572265625, -0.45264434814453125, -0.4346771240234375, -0.41670989990234375, -0.39874267578125, -0.38077545166015625, -0.3628082275390625, -0.34484100341796875, -0.326873779296875, -0.30890655517578125, -0.2909393310546875, -0.27297210693359375, -0.2550048828125, -0.23703765869140625, -0.2190704345703125, -0.20110321044921875, -0.183135986328125, -0.16516876220703125, -0.1472015380859375, -0.12923431396484375, -0.11126708984375, -0.09329986572265625, -0.0753326416015625, -0.05736541748046875, -0.039398193359375, -0.02143096923828125, -0.0034637451171875, 0.01450347900390625, 0.032470703125, 0.05043792724609375, 0.0684051513671875, 0.08637237548828125, 0.104339599609375, 0.12230682373046875, 0.1402740478515625, 0.15824127197265625, 0.17620849609375, 0.19417572021484375, 0.2121429443359375, 0.23011016845703125, 0.248077392578125, 0.26604461669921875, 0.2840118408203125, 0.30197906494140625, 0.3199462890625, 0.33791351318359375, 0.3558807373046875, 0.37384796142578125, 0.391815185546875, 0.40978240966796875, 0.4277496337890625, 0.44571685791015625, 0.46368408203125, 0.48165130615234375, 0.4996185302734375, 0.5175857543945312, 0.535552978515625, 0.5535202026367188, 0.5714874267578125, 0.5894546508789062, 0.607421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 6.0, 7.0, 6.0, 16.0, 11.0, 18.0, 15.0, 28.0, 30.0, 20.0, 33.0, 33.0, 34.0, 37.0, 30.0, 42.0, 42.0, 35.0, 33.0, 45.0, 31.0, 53.0, 44.0, 44.0, 34.0, 35.0, 30.0, 36.0, 23.0, 27.0, 21.0, 14.0, 15.0, 16.0, 12.0, 9.0, 5.0, 8.0, 4.0, 3.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.6171875, -5.46527099609375, -5.3133544921875, -5.16143798828125, -5.009521484375, -4.85760498046875, -4.7056884765625, -4.55377197265625, -4.40185546875, -4.24993896484375, -4.0980224609375, -3.94610595703125, -3.794189453125, -3.64227294921875, -3.4903564453125, -3.33843994140625, -3.1865234375, -3.03460693359375, -2.8826904296875, -2.73077392578125, -2.578857421875, -2.42694091796875, -2.2750244140625, -2.12310791015625, -1.97119140625, -1.81927490234375, -1.6673583984375, -1.51544189453125, -1.363525390625, -1.21160888671875, -1.0596923828125, -0.90777587890625, -0.755859375, -0.60394287109375, -0.4520263671875, -0.30010986328125, -0.148193359375, 0.00372314453125, 0.1556396484375, 0.30755615234375, 0.45947265625, 0.61138916015625, 0.7633056640625, 0.91522216796875, 1.067138671875, 1.21905517578125, 1.3709716796875, 1.52288818359375, 1.6748046875, 1.82672119140625, 1.9786376953125, 2.13055419921875, 2.282470703125, 2.43438720703125, 2.5863037109375, 2.73822021484375, 2.89013671875, 3.04205322265625, 3.1939697265625, 3.34588623046875, 3.497802734375, 3.64971923828125, 3.8016357421875, 3.95355224609375, 4.10546875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 13.0, 11.0, 23.0, 20.0, 19.0, 29.0, 39.0, 45.0, 65.0, 111.0, 106.0, 167.0, 234.0, 363.0, 487.0, 742.0, 1143.0, 1845.0, 3083.0, 5634.0, 10447.0, 20734.0, 67814.0, 811320.0, 76479.0, 22257.0, 10723.0, 5734.0, 3237.0, 1920.0, 1193.0, 742.0, 515.0, 344.0, 230.0, 170.0, 138.0, 99.0, 67.0, 54.0, 43.0, 24.0, 20.0, 14.0, 14.0, 8.0, 5.0, 6.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.50390625, -1.457672119140625, -1.41143798828125, -1.365203857421875, -1.3189697265625, -1.272735595703125, -1.22650146484375, -1.180267333984375, -1.134033203125, -1.087799072265625, -1.04156494140625, -0.995330810546875, -0.9490966796875, -0.902862548828125, -0.85662841796875, -0.810394287109375, -0.76416015625, -0.717926025390625, -0.67169189453125, -0.625457763671875, -0.5792236328125, -0.532989501953125, -0.48675537109375, -0.440521240234375, -0.394287109375, -0.348052978515625, -0.30181884765625, -0.255584716796875, -0.2093505859375, -0.163116455078125, -0.11688232421875, -0.070648193359375, -0.0244140625, 0.021820068359375, 0.06805419921875, 0.114288330078125, 0.1605224609375, 0.206756591796875, 0.25299072265625, 0.299224853515625, 0.345458984375, 0.391693115234375, 0.43792724609375, 0.484161376953125, 0.5303955078125, 0.576629638671875, 0.62286376953125, 0.669097900390625, 0.71533203125, 0.761566162109375, 0.80780029296875, 0.854034423828125, 0.9002685546875, 0.946502685546875, 0.99273681640625, 1.038970947265625, 1.085205078125, 1.131439208984375, 1.17767333984375, 1.223907470703125, 1.2701416015625, 1.316375732421875, 1.36260986328125, 1.408843994140625, 1.455078125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 12.0, 8.0, 6.0, 8.0, 6.0, 23.0, 17.0, 16.0, 11.0, 24.0, 29.0, 21.0, 25.0, 28.0, 41.0, 44.0, 34.0, 40.0, 43.0, 38.0, 42.0, 38.0, 38.0, 41.0, 37.0, 28.0, 29.0, 30.0, 29.0, 29.0, 28.0, 24.0, 14.0, 10.0, 20.0, 18.0, 9.0, 8.0, 7.0, 7.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.80108642578125, -2.7115478515625, -2.62200927734375, -2.532470703125, -2.44293212890625, -2.3533935546875, -2.26385498046875, -2.17431640625, -2.08477783203125, -1.9952392578125, -1.90570068359375, -1.816162109375, -1.72662353515625, -1.6370849609375, -1.54754638671875, -1.4580078125, -1.36846923828125, -1.2789306640625, -1.18939208984375, -1.099853515625, -1.01031494140625, -0.9207763671875, -0.83123779296875, -0.74169921875, -0.65216064453125, -0.5626220703125, -0.47308349609375, -0.383544921875, -0.29400634765625, -0.2044677734375, -0.11492919921875, -0.025390625, 0.06414794921875, 0.1536865234375, 0.24322509765625, 0.332763671875, 0.42230224609375, 0.5118408203125, 0.60137939453125, 0.69091796875, 0.78045654296875, 0.8699951171875, 0.95953369140625, 1.049072265625, 1.13861083984375, 1.2281494140625, 1.31768798828125, 1.4072265625, 1.49676513671875, 1.5863037109375, 1.67584228515625, 1.765380859375, 1.85491943359375, 1.9444580078125, 2.03399658203125, 2.12353515625, 2.21307373046875, 2.3026123046875, 2.39215087890625, 2.481689453125, 2.57122802734375, 2.6607666015625, 2.75030517578125, 2.83984375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 8.0, 25.0, 30.0, 18.0, 39.0, 48.0, 57.0, 90.0, 120.0, 167.0, 249.0, 345.0, 505.0, 760.0, 1144.0, 1856.0, 2891.0, 4755.0, 8043.0, 14312.0, 28500.0, 591290.0, 333721.0, 26339.0, 13422.0, 7583.0, 4457.0, 2674.0, 1701.0, 1080.0, 686.0, 443.0, 342.0, 228.0, 168.0, 125.0, 90.0, 49.0, 42.0, 31.0, 19.0, 22.0, 15.0, 12.0, 7.0, 12.0, 4.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 4.0], "bins": [-0.3427734375, -0.3320465087890625, -0.321319580078125, -0.3105926513671875, -0.29986572265625, -0.2891387939453125, -0.278411865234375, -0.2676849365234375, -0.2569580078125, -0.2462310791015625, -0.235504150390625, -0.2247772216796875, -0.21405029296875, -0.2033233642578125, -0.192596435546875, -0.1818695068359375, -0.171142578125, -0.1604156494140625, -0.149688720703125, -0.1389617919921875, -0.12823486328125, -0.1175079345703125, -0.106781005859375, -0.0960540771484375, -0.0853271484375, -0.0746002197265625, -0.063873291015625, -0.0531463623046875, -0.04241943359375, -0.0316925048828125, -0.020965576171875, -0.0102386474609375, 0.00048828125, 0.0112152099609375, 0.021942138671875, 0.0326690673828125, 0.04339599609375, 0.0541229248046875, 0.064849853515625, 0.0755767822265625, 0.0863037109375, 0.0970306396484375, 0.107757568359375, 0.1184844970703125, 0.12921142578125, 0.1399383544921875, 0.150665283203125, 0.1613922119140625, 0.172119140625, 0.1828460693359375, 0.193572998046875, 0.2042999267578125, 0.21502685546875, 0.2257537841796875, 0.236480712890625, 0.2472076416015625, 0.2579345703125, 0.2686614990234375, 0.279388427734375, 0.2901153564453125, 0.30084228515625, 0.3115692138671875, 0.322296142578125, 0.3330230712890625, 0.34375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 10.0, 6.0, 7.0, 8.0, 11.0, 14.0, 20.0, 13.0, 23.0, 31.0, 26.0, 39.0, 34.0, 35.0, 47.0, 46.0, 50.0, 53.0, 43.0, 49.0, 42.0, 32.0, 45.0, 42.0, 36.0, 31.0, 38.0, 24.0, 29.0, 16.0, 21.0, 14.0, 14.0, 14.0, 8.0, 10.0, 4.0, 3.0, 8.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.8908252716064453e-05, -2.8051435947418213e-05, -2.7194619178771973e-05, -2.6337802410125732e-05, -2.5480985641479492e-05, -2.4624168872833252e-05, -2.3767352104187012e-05, -2.291053533554077e-05, -2.205371856689453e-05, -2.119690179824829e-05, -2.034008502960205e-05, -1.948326826095581e-05, -1.862645149230957e-05, -1.776963472366333e-05, -1.691281795501709e-05, -1.605600118637085e-05, -1.519918441772461e-05, -1.4342367649078369e-05, -1.3485550880432129e-05, -1.2628734111785889e-05, -1.1771917343139648e-05, -1.0915100574493408e-05, -1.0058283805847168e-05, -9.201467037200928e-06, -8.344650268554688e-06, -7.487833499908447e-06, -6.631016731262207e-06, -5.774199962615967e-06, -4.9173831939697266e-06, -4.060566425323486e-06, -3.203749656677246e-06, -2.346932888031006e-06, -1.4901161193847656e-06, -6.332993507385254e-07, 2.2351741790771484e-07, 1.080334186553955e-06, 1.9371509552001953e-06, 2.7939677238464355e-06, 3.6507844924926758e-06, 4.507601261138916e-06, 5.364418029785156e-06, 6.2212347984313965e-06, 7.078051567077637e-06, 7.934868335723877e-06, 8.791685104370117e-06, 9.648501873016357e-06, 1.0505318641662598e-05, 1.1362135410308838e-05, 1.2218952178955078e-05, 1.3075768947601318e-05, 1.3932585716247559e-05, 1.4789402484893799e-05, 1.564621925354004e-05, 1.650303602218628e-05, 1.735985279083252e-05, 1.821666955947876e-05, 1.9073486328125e-05, 1.993030309677124e-05, 2.078711986541748e-05, 2.164393663406372e-05, 2.250075340270996e-05, 2.33575701713562e-05, 2.421438694000244e-05, 2.507120370864868e-05, 2.5928020477294922e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 8.0, 17.0, 32.0, 35.0, 55.0, 71.0, 167.0, 222.0, 386.0, 528.0, 980.0, 1726.0, 2985.0, 5483.0, 10822.0, 22318.0, 49275.0, 113264.0, 239353.0, 294454.0, 167022.0, 73997.0, 32770.0, 15397.0, 7687.0, 3982.0, 2250.0, 1301.0, 732.0, 446.0, 279.0, 170.0, 119.0, 62.0, 45.0, 29.0, 27.0, 14.0, 10.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2765922546386719, -0.26827239990234375, -0.2599525451660156, -0.2516326904296875, -0.24331283569335938, -0.23499298095703125, -0.22667312622070312, -0.218353271484375, -0.21003341674804688, -0.20171356201171875, -0.19339370727539062, -0.1850738525390625, -0.17675399780273438, -0.16843414306640625, -0.16011428833007812, -0.15179443359375, -0.14347457885742188, -0.13515472412109375, -0.12683486938476562, -0.1185150146484375, -0.11019515991210938, -0.10187530517578125, -0.09355545043945312, -0.085235595703125, -0.07691574096679688, -0.06859588623046875, -0.060276031494140625, -0.0519561767578125, -0.043636322021484375, -0.03531646728515625, -0.026996612548828125, -0.0186767578125, -0.010356903076171875, -0.00203704833984375, 0.006282806396484375, 0.0146026611328125, 0.022922515869140625, 0.03124237060546875, 0.039562225341796875, 0.047882080078125, 0.056201934814453125, 0.06452178955078125, 0.07284164428710938, 0.0811614990234375, 0.08948135375976562, 0.09780120849609375, 0.10612106323242188, 0.11444091796875, 0.12276077270507812, 0.13108062744140625, 0.13940048217773438, 0.1477203369140625, 0.15604019165039062, 0.16436004638671875, 0.17267990112304688, 0.180999755859375, 0.18931961059570312, 0.19763946533203125, 0.20595932006835938, 0.2142791748046875, 0.22259902954101562, 0.23091888427734375, 0.23923873901367188, 0.24755859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 9.0, 15.0, 9.0, 10.0, 9.0, 18.0, 15.0, 21.0, 24.0, 34.0, 47.0, 34.0, 70.0, 54.0, 48.0, 64.0, 56.0, 56.0, 51.0, 47.0, 41.0, 35.0, 36.0, 33.0, 25.0, 29.0, 17.0, 10.0, 19.0, 12.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.03598356246948242, -0.034613609313964844, -0.033243656158447266, -0.03187370300292969, -0.03050374984741211, -0.02913379669189453, -0.027763843536376953, -0.026393890380859375, -0.025023937225341797, -0.02365398406982422, -0.02228403091430664, -0.020914077758789062, -0.019544124603271484, -0.018174171447753906, -0.016804218292236328, -0.01543426513671875, -0.014064311981201172, -0.012694358825683594, -0.011324405670166016, -0.009954452514648438, -0.00858449935913086, -0.007214546203613281, -0.005844593048095703, -0.004474639892578125, -0.003104686737060547, -0.0017347335815429688, -0.0003647804260253906, 0.0010051727294921875, 0.0023751258850097656, 0.0037450790405273438, 0.005115032196044922, 0.0064849853515625, 0.007854938507080078, 0.009224891662597656, 0.010594844818115234, 0.011964797973632812, 0.01333475112915039, 0.014704704284667969, 0.016074657440185547, 0.017444610595703125, 0.018814563751220703, 0.02018451690673828, 0.02155447006225586, 0.022924423217773438, 0.024294376373291016, 0.025664329528808594, 0.027034282684326172, 0.02840423583984375, 0.029774188995361328, 0.031144142150878906, 0.032514095306396484, 0.03388404846191406, 0.03525400161743164, 0.03662395477294922, 0.0379939079284668, 0.039363861083984375, 0.04073381423950195, 0.04210376739501953, 0.04347372055053711, 0.04484367370605469, 0.046213626861572266, 0.047583580017089844, 0.04895353317260742, 0.050323486328125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 9.0, 15.0, 13.0, 23.0, 31.0, 33.0, 48.0, 45.0, 55.0, 65.0, 66.0, 63.0, 58.0, 62.0, 67.0, 57.0, 57.0, 34.0, 36.0, 36.0, 25.0, 31.0, 10.0, 13.0, 10.0, 8.0, 3.0, 1.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.933457374572754, -7.662163257598877, -7.390869140625, -7.119575023651123, -6.848280906677246, -6.576986789703369, -6.305692672729492, -6.034398555755615, -5.763104438781738, -5.491810321807861, -5.220516204833984, -4.949222087860107, -4.6779279708862305, -4.4066338539123535, -4.135339736938477, -3.8640456199645996, -3.5927515029907227, -3.3214573860168457, -3.0501632690429688, -2.778869152069092, -2.507575035095215, -2.236280918121338, -1.964986801147461, -1.693692684173584, -1.422398567199707, -1.15110445022583, -0.8798103332519531, -0.6085162162780762, -0.3372220993041992, -0.06592798233032227, 0.2053661346435547, 0.47666025161743164, 0.7479534149169922, 1.0192475318908691, 1.290541648864746, 1.561835765838623, 1.8331298828125, 2.104423999786377, 2.375718116760254, 2.647012233734131, 2.918306350708008, 3.1896004676818848, 3.4608945846557617, 3.7321887016296387, 4.003482818603516, 4.274776935577393, 4.5460710525512695, 4.8173651695251465, 5.088659286499023, 5.3599534034729, 5.631247520446777, 5.902541637420654, 6.173835754394531, 6.445129871368408, 6.716423988342285, 6.987718105316162, 7.259012222290039, 7.530306339263916, 7.801600456237793, 8.072895050048828, 8.344188690185547, 8.615482330322266, 8.8867769241333, 9.158071517944336, 9.429365158081055]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 8.0, 4.0, 5.0, 11.0, 7.0, 9.0, 13.0, 18.0, 11.0, 20.0, 23.0, 32.0, 23.0, 23.0, 40.0, 35.0, 34.0, 35.0, 32.0, 40.0, 51.0, 42.0, 39.0, 43.0, 51.0, 38.0, 36.0, 42.0, 34.0, 30.0, 21.0, 26.0, 17.0, 22.0, 16.0, 17.0, 16.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.752599716186523, -4.61810827255249, -4.483617305755615, -4.349125862121582, -4.214634895324707, -4.080143451690674, -3.9456522464752197, -3.8111610412597656, -3.6766698360443115, -3.5421786308288574, -3.4076874256134033, -3.273196220397949, -3.138704776763916, -3.004213809967041, -2.869722366333008, -2.7352311611175537, -2.6007399559020996, -2.4662487506866455, -2.3317575454711914, -2.1972663402557373, -2.062775135040283, -1.9282838106155396, -1.793792486190796, -1.6593012809753418, -1.5248100757598877, -1.3903188705444336, -1.2558276653289795, -1.1213363409042358, -0.9868451356887817, -0.8523539304733276, -0.7178626656532288, -0.5833714008331299, -0.4488801956176758, -0.3143889605998993, -0.1798977255821228, -0.045406490564346313, 0.08908474445343018, 0.22357594966888428, 0.35806721448898315, 0.49255847930908203, 0.6270496845245361, 0.7615408897399902, 0.8960321545600891, 1.030523419380188, 1.165014624595642, 1.2995058298110962, 1.4339971542358398, 1.568488359451294, 1.702979564666748, 1.8374707698822021, 1.9719619750976562, 2.1064531803131104, 2.2409443855285645, 2.3754358291625977, 2.5099270343780518, 2.644418239593506, 2.77890944480896, 2.913400650024414, 3.047891855239868, 3.1823830604553223, 3.3168745040893555, 3.4513654708862305, 3.5858569145202637, 3.7203481197357178, 3.854839324951172]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 14.0, 26.0, 38.0, 63.0, 84.0, 115.0, 179.0, 286.0, 426.0, 629.0, 969.0, 1481.0, 2389.0, 3808.0, 5710.0, 9054.0, 13802.0, 21247.0, 32086.0, 46996.0, 66732.0, 88452.0, 109439.0, 121545.0, 121791.0, 109076.0, 87754.0, 65971.0, 46994.0, 31963.0, 20821.0, 13694.0, 8710.0, 5664.0, 3668.0, 2378.0, 1554.0, 979.0, 618.0, 430.0, 284.0, 185.0, 134.0, 77.0, 75.0, 44.0, 27.0, 27.0, 14.0, 12.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0], "bins": [-3.681640625, -3.566558837890625, -3.45147705078125, -3.336395263671875, -3.2213134765625, -3.106231689453125, -2.99114990234375, -2.876068115234375, -2.760986328125, -2.645904541015625, -2.53082275390625, -2.415740966796875, -2.3006591796875, -2.185577392578125, -2.07049560546875, -1.955413818359375, -1.84033203125, -1.725250244140625, -1.61016845703125, -1.495086669921875, -1.3800048828125, -1.264923095703125, -1.14984130859375, -1.034759521484375, -0.919677734375, -0.804595947265625, -0.68951416015625, -0.574432373046875, -0.4593505859375, -0.344268798828125, -0.22918701171875, -0.114105224609375, 0.0009765625, 0.116058349609375, 0.23114013671875, 0.346221923828125, 0.4613037109375, 0.576385498046875, 0.69146728515625, 0.806549072265625, 0.921630859375, 1.036712646484375, 1.15179443359375, 1.266876220703125, 1.3819580078125, 1.497039794921875, 1.61212158203125, 1.727203369140625, 1.84228515625, 1.957366943359375, 2.07244873046875, 2.187530517578125, 2.3026123046875, 2.417694091796875, 2.53277587890625, 2.647857666015625, 2.762939453125, 2.878021240234375, 2.99310302734375, 3.108184814453125, 3.2232666015625, 3.338348388671875, 3.45343017578125, 3.568511962890625, 3.68359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 2.0, 5.0, 9.0, 5.0, 8.0, 11.0, 15.0, 8.0, 14.0, 17.0, 22.0, 23.0, 26.0, 31.0, 44.0, 28.0, 30.0, 34.0, 38.0, 35.0, 38.0, 37.0, 47.0, 33.0, 39.0, 42.0, 47.0, 30.0, 41.0, 22.0, 26.0, 24.0, 29.0, 20.0, 26.0, 14.0, 22.0, 8.0, 11.0, 7.0, 5.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.09375, -4.95062255859375, -4.8074951171875, -4.66436767578125, -4.521240234375, -4.37811279296875, -4.2349853515625, -4.09185791015625, -3.94873046875, -3.80560302734375, -3.6624755859375, -3.51934814453125, -3.376220703125, -3.23309326171875, -3.0899658203125, -2.94683837890625, -2.8037109375, -2.66058349609375, -2.5174560546875, -2.37432861328125, -2.231201171875, -2.08807373046875, -1.9449462890625, -1.80181884765625, -1.65869140625, -1.51556396484375, -1.3724365234375, -1.22930908203125, -1.086181640625, -0.94305419921875, -0.7999267578125, -0.65679931640625, -0.513671875, -0.37054443359375, -0.2274169921875, -0.08428955078125, 0.058837890625, 0.20196533203125, 0.3450927734375, 0.48822021484375, 0.63134765625, 0.77447509765625, 0.9176025390625, 1.06072998046875, 1.203857421875, 1.34698486328125, 1.4901123046875, 1.63323974609375, 1.7763671875, 1.91949462890625, 2.0626220703125, 2.20574951171875, 2.348876953125, 2.49200439453125, 2.6351318359375, 2.77825927734375, 2.92138671875, 3.06451416015625, 3.2076416015625, 3.35076904296875, 3.493896484375, 3.63702392578125, 3.7801513671875, 3.92327880859375, 4.06640625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 11.0, 15.0, 20.0, 36.0, 67.0, 124.0, 179.0, 350.0, 596.0, 999.0, 1728.0, 3128.0, 5665.0, 9936.0, 17134.0, 30031.0, 50480.0, 79640.0, 116002.0, 148349.0, 158535.0, 141548.0, 106480.0, 71765.0, 44335.0, 26395.0, 14968.0, 8587.0, 4972.0, 2777.0, 1556.0, 867.0, 535.0, 305.0, 174.0, 93.0, 60.0, 43.0, 24.0, 12.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.03515625, -4.879638671875, -4.72412109375, -4.568603515625, -4.4130859375, -4.257568359375, -4.10205078125, -3.946533203125, -3.791015625, -3.635498046875, -3.47998046875, -3.324462890625, -3.1689453125, -3.013427734375, -2.85791015625, -2.702392578125, -2.546875, -2.391357421875, -2.23583984375, -2.080322265625, -1.9248046875, -1.769287109375, -1.61376953125, -1.458251953125, -1.302734375, -1.147216796875, -0.99169921875, -0.836181640625, -0.6806640625, -0.525146484375, -0.36962890625, -0.214111328125, -0.05859375, 0.096923828125, 0.25244140625, 0.407958984375, 0.5634765625, 0.718994140625, 0.87451171875, 1.030029296875, 1.185546875, 1.341064453125, 1.49658203125, 1.652099609375, 1.8076171875, 1.963134765625, 2.11865234375, 2.274169921875, 2.4296875, 2.585205078125, 2.74072265625, 2.896240234375, 3.0517578125, 3.207275390625, 3.36279296875, 3.518310546875, 3.673828125, 3.829345703125, 3.98486328125, 4.140380859375, 4.2958984375, 4.451416015625, 4.60693359375, 4.762451171875, 4.91796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 5.0, 11.0, 8.0, 9.0, 2.0, 8.0, 14.0, 18.0, 27.0, 28.0, 36.0, 35.0, 40.0, 45.0, 59.0, 47.0, 46.0, 54.0, 64.0, 44.0, 30.0, 42.0, 53.0, 48.0, 31.0, 41.0, 21.0, 31.0, 18.0, 18.0, 22.0, 17.0, 6.0, 9.0, 4.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.6832275390625, -2.569580078125, -2.4559326171875, -2.34228515625, -2.2286376953125, -2.114990234375, -2.0013427734375, -1.8876953125, -1.7740478515625, -1.660400390625, -1.5467529296875, -1.43310546875, -1.3194580078125, -1.205810546875, -1.0921630859375, -0.978515625, -0.8648681640625, -0.751220703125, -0.6375732421875, -0.52392578125, -0.4102783203125, -0.296630859375, -0.1829833984375, -0.0693359375, 0.0443115234375, 0.157958984375, 0.2716064453125, 0.38525390625, 0.4989013671875, 0.612548828125, 0.7261962890625, 0.83984375, 0.9534912109375, 1.067138671875, 1.1807861328125, 1.29443359375, 1.4080810546875, 1.521728515625, 1.6353759765625, 1.7490234375, 1.8626708984375, 1.976318359375, 2.0899658203125, 2.20361328125, 2.3172607421875, 2.430908203125, 2.5445556640625, 2.658203125, 2.7718505859375, 2.885498046875, 2.9991455078125, 3.11279296875, 3.2264404296875, 3.340087890625, 3.4537353515625, 3.5673828125, 3.6810302734375, 3.794677734375, 3.9083251953125, 4.02197265625, 4.1356201171875, 4.249267578125, 4.3629150390625, 4.4765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 10.0, 15.0, 17.0, 35.0, 47.0, 54.0, 72.0, 104.0, 169.0, 235.0, 282.0, 443.0, 624.0, 975.0, 1345.0, 2125.0, 3531.0, 6128.0, 11388.0, 22332.0, 47523.0, 102503.0, 199651.0, 258804.0, 194664.0, 100715.0, 45902.0, 21957.0, 10984.0, 6009.0, 3317.0, 2218.0, 1337.0, 885.0, 623.0, 432.0, 313.0, 246.0, 156.0, 104.0, 84.0, 54.0, 38.0, 29.0, 24.0, 17.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.1953125, -4.05767822265625, -3.9200439453125, -3.78240966796875, -3.644775390625, -3.50714111328125, -3.3695068359375, -3.23187255859375, -3.09423828125, -2.95660400390625, -2.8189697265625, -2.68133544921875, -2.543701171875, -2.40606689453125, -2.2684326171875, -2.13079833984375, -1.9931640625, -1.85552978515625, -1.7178955078125, -1.58026123046875, -1.442626953125, -1.30499267578125, -1.1673583984375, -1.02972412109375, -0.89208984375, -0.75445556640625, -0.6168212890625, -0.47918701171875, -0.341552734375, -0.20391845703125, -0.0662841796875, 0.07135009765625, 0.208984375, 0.34661865234375, 0.4842529296875, 0.62188720703125, 0.759521484375, 0.89715576171875, 1.0347900390625, 1.17242431640625, 1.31005859375, 1.44769287109375, 1.5853271484375, 1.72296142578125, 1.860595703125, 1.99822998046875, 2.1358642578125, 2.27349853515625, 2.4111328125, 2.54876708984375, 2.6864013671875, 2.82403564453125, 2.961669921875, 3.09930419921875, 3.2369384765625, 3.37457275390625, 3.51220703125, 3.64984130859375, 3.7874755859375, 3.92510986328125, 4.062744140625, 4.20037841796875, 4.3380126953125, 4.47564697265625, 4.61328125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 8.0, 12.0, 15.0, 28.0, 19.0, 53.0, 29.0, 66.0, 61.0, 70.0, 75.0, 65.0, 68.0, 57.0, 67.0, 72.0, 47.0, 37.0, 31.0, 16.0, 18.0, 14.0, 9.0, 11.0, 6.0, 6.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00034999847412109375, -0.000339265912771225, -0.0003285333514213562, -0.0003178007900714874, -0.00030706822872161865, -0.0002963356673717499, -0.0002856031060218811, -0.00027487054467201233, -0.00026413798332214355, -0.0002534054219722748, -0.000242672860622406, -0.00023194029927253723, -0.00022120773792266846, -0.00021047517657279968, -0.0001997426152229309, -0.00018901005387306213, -0.00017827749252319336, -0.00016754493117332458, -0.0001568123698234558, -0.00014607980847358704, -0.00013534724712371826, -0.0001246146857738495, -0.00011388212442398071, -0.00010314956307411194, -9.241700172424316e-05, -8.168444037437439e-05, -7.095187902450562e-05, -6.021931767463684e-05, -4.9486756324768066e-05, -3.875419497489929e-05, -2.8021633625030518e-05, -1.7289072275161743e-05, -6.556510925292969e-06, 4.176050424575806e-06, 1.490861177444458e-05, 2.5641173124313354e-05, 3.637373447418213e-05, 4.71062958240509e-05, 5.783885717391968e-05, 6.857141852378845e-05, 7.930397987365723e-05, 9.0036541223526e-05, 0.00010076910257339478, 0.00011150166392326355, 0.00012223422527313232, 0.0001329667866230011, 0.00014369934797286987, 0.00015443190932273865, 0.00016516447067260742, 0.0001758970320224762, 0.00018662959337234497, 0.00019736215472221375, 0.00020809471607208252, 0.0002188272774219513, 0.00022955983877182007, 0.00024029240012168884, 0.0002510249614715576, 0.0002617575228214264, 0.00027249008417129517, 0.00028322264552116394, 0.0002939552068710327, 0.0003046877682209015, 0.00031542032957077026, 0.00032615289092063904, 0.0003368854522705078]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 9.0, 11.0, 22.0, 32.0, 37.0, 41.0, 57.0, 72.0, 131.0, 140.0, 204.0, 261.0, 364.0, 527.0, 823.0, 1193.0, 2008.0, 3404.0, 6605.0, 14010.0, 33634.0, 86192.0, 202408.0, 304137.0, 221869.0, 98510.0, 38463.0, 15892.0, 7354.0, 3825.0, 2154.0, 1248.0, 825.0, 571.0, 379.0, 296.0, 240.0, 141.0, 105.0, 79.0, 63.0, 51.0, 41.0, 34.0, 28.0, 16.0, 11.0, 6.0, 9.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.4765625, -5.3031005859375, -5.129638671875, -4.9561767578125, -4.78271484375, -4.6092529296875, -4.435791015625, -4.2623291015625, -4.0888671875, -3.9154052734375, -3.741943359375, -3.5684814453125, -3.39501953125, -3.2215576171875, -3.048095703125, -2.8746337890625, -2.701171875, -2.5277099609375, -2.354248046875, -2.1807861328125, -2.00732421875, -1.8338623046875, -1.660400390625, -1.4869384765625, -1.3134765625, -1.1400146484375, -0.966552734375, -0.7930908203125, -0.61962890625, -0.4461669921875, -0.272705078125, -0.0992431640625, 0.07421875, 0.2476806640625, 0.421142578125, 0.5946044921875, 0.76806640625, 0.9415283203125, 1.114990234375, 1.2884521484375, 1.4619140625, 1.6353759765625, 1.808837890625, 1.9822998046875, 2.15576171875, 2.3292236328125, 2.502685546875, 2.6761474609375, 2.849609375, 3.0230712890625, 3.196533203125, 3.3699951171875, 3.54345703125, 3.7169189453125, 3.890380859375, 4.0638427734375, 4.2373046875, 4.4107666015625, 4.584228515625, 4.7576904296875, 4.93115234375, 5.1046142578125, 5.278076171875, 5.4515380859375, 5.625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 11.0, 8.0, 11.0, 24.0, 26.0, 31.0, 40.0, 45.0, 63.0, 62.0, 71.0, 69.0, 55.0, 83.0, 62.0, 62.0, 58.0, 34.0, 35.0, 28.0, 26.0, 21.0, 11.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.1064453125, -1.0707550048828125, -1.035064697265625, -0.9993743896484375, -0.96368408203125, -0.9279937744140625, -0.892303466796875, -0.8566131591796875, -0.8209228515625, -0.7852325439453125, -0.749542236328125, -0.7138519287109375, -0.67816162109375, -0.6424713134765625, -0.606781005859375, -0.5710906982421875, -0.535400390625, -0.4997100830078125, -0.464019775390625, -0.4283294677734375, -0.39263916015625, -0.3569488525390625, -0.321258544921875, -0.2855682373046875, -0.2498779296875, -0.2141876220703125, -0.178497314453125, -0.1428070068359375, -0.10711669921875, -0.0714263916015625, -0.035736083984375, -4.57763671875e-05, 0.03564453125, 0.0713348388671875, 0.107025146484375, 0.1427154541015625, 0.17840576171875, 0.2140960693359375, 0.249786376953125, 0.2854766845703125, 0.3211669921875, 0.3568572998046875, 0.392547607421875, 0.4282379150390625, 0.46392822265625, 0.4996185302734375, 0.535308837890625, 0.5709991455078125, 0.606689453125, 0.6423797607421875, 0.678070068359375, 0.7137603759765625, 0.74945068359375, 0.7851409912109375, 0.820831298828125, 0.8565216064453125, 0.8922119140625, 0.9279022216796875, 0.963592529296875, 0.9992828369140625, 1.03497314453125, 1.0706634521484375, 1.106353759765625, 1.1420440673828125, 1.177734375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 14.0, 28.0, 23.0, 26.0, 33.0, 44.0, 46.0, 66.0, 67.0, 78.0, 79.0, 56.0, 62.0, 65.0, 60.0, 46.0, 44.0, 42.0, 25.0, 21.0, 25.0, 10.0, 10.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.256855010986328, -7.958423614501953, -7.659992694854736, -7.361561298370361, -7.0631303787231445, -6.7646989822387695, -6.4662675857543945, -6.1678361892700195, -5.869405269622803, -5.570973873138428, -5.272542953491211, -4.974111557006836, -4.675680160522461, -4.377249240875244, -4.078817844390869, -3.7803866863250732, -3.4819555282592773, -3.1835243701934814, -2.8850932121276855, -2.5866618156433105, -2.2882306575775146, -1.9897994995117188, -1.6913682222366333, -1.3929369449615479, -1.094505786895752, -0.7960745692253113, -0.4976433515548706, -0.19921213388442993, 0.09921908378601074, 0.39765024185180664, 0.6960815191268921, 0.9945127964019775, 1.2929449081420898, 1.5913760662078857, 1.8898073434829712, 2.1882386207580566, 2.4866697788238525, 2.7851009368896484, 3.0835323333740234, 3.3819634914398193, 3.6803946495056152, 3.978825807571411, 4.277256965637207, 4.575688362121582, 4.874119758605957, 5.172550678253174, 5.470982074737549, 5.769412994384766, 6.067844390869141, 6.366275787353516, 6.664706707000732, 6.963138103485107, 7.261569023132324, 7.560000419616699, 7.858431816101074, 8.15686321258545, 8.455293655395508, 8.753725051879883, 9.052156448364258, 9.350586891174316, 9.649018287658691, 9.947449684143066, 10.245881080627441, 10.544312477111816, 10.842743873596191]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 7.0, 8.0, 12.0, 6.0, 13.0, 18.0, 16.0, 24.0, 22.0, 18.0, 43.0, 19.0, 38.0, 32.0, 25.0, 41.0, 37.0, 40.0, 44.0, 39.0, 30.0, 43.0, 33.0, 33.0, 33.0, 35.0, 26.0, 36.0, 23.0, 19.0, 24.0, 18.0, 22.0, 25.0, 8.0, 15.0, 7.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9709115028381348, -3.8391921520233154, -3.707473039627075, -3.575753688812256, -3.4440345764160156, -3.3123152256011963, -3.180595874786377, -3.0488767623901367, -2.9171574115753174, -2.785438060760498, -2.653718948364258, -2.5219995975494385, -2.390280246734619, -2.258561134338379, -2.1268417835235596, -1.9951225519180298, -1.8634033203125, -1.7316840887069702, -1.5999648571014404, -1.468245506286621, -1.3365262746810913, -1.2048070430755615, -1.0730876922607422, -0.9413684606552124, -0.8096492290496826, -0.6779299974441528, -0.5462107062339783, -0.4144914448261261, -0.2827721834182739, -0.15105295181274414, -0.01933366060256958, 0.11238563060760498, 0.24410486221313477, 0.37582412362098694, 0.5075433850288391, 0.6392626762390137, 0.7709819078445435, 0.9027011394500732, 1.0344204902648926, 1.1661397218704224, 1.2978589534759521, 1.429578185081482, 1.5612974166870117, 1.693016767501831, 1.8247359991073608, 1.9564552307128906, 2.08817458152771, 2.2198939323425293, 2.3516130447387695, 2.483332395553589, 2.615051507949829, 2.7467708587646484, 2.8784899711608887, 3.010209321975708, 3.1419286727905273, 3.2736477851867676, 3.405367136001587, 3.5370864868164062, 3.6688055992126465, 3.800524950027466, 3.932244300842285, 4.063963413238525, 4.195682525634766, 4.327402114868164, 4.459121227264404]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 5.0, 9.0, 7.0, 10.0, 12.0, 20.0, 23.0, 46.0, 61.0, 68.0, 139.0, 159.0, 281.0, 454.0, 678.0, 1048.0, 1851.0, 2975.0, 4947.0, 8522.0, 14791.0, 25915.0, 47929.0, 89841.0, 175287.0, 347675.0, 642379.0, 907245.0, 828155.0, 520793.0, 273099.0, 139445.0, 72378.0, 38121.0, 21033.0, 11995.0, 6807.0, 4018.0, 2342.0, 1363.0, 857.0, 562.0, 321.0, 214.0, 137.0, 93.0, 62.0, 50.0, 27.0, 13.0, 9.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.06640625, -6.84423828125, -6.6220703125, -6.39990234375, -6.177734375, -5.95556640625, -5.7333984375, -5.51123046875, -5.2890625, -5.06689453125, -4.8447265625, -4.62255859375, -4.400390625, -4.17822265625, -3.9560546875, -3.73388671875, -3.51171875, -3.28955078125, -3.0673828125, -2.84521484375, -2.623046875, -2.40087890625, -2.1787109375, -1.95654296875, -1.734375, -1.51220703125, -1.2900390625, -1.06787109375, -0.845703125, -0.62353515625, -0.4013671875, -0.17919921875, 0.04296875, 0.26513671875, 0.4873046875, 0.70947265625, 0.931640625, 1.15380859375, 1.3759765625, 1.59814453125, 1.8203125, 2.04248046875, 2.2646484375, 2.48681640625, 2.708984375, 2.93115234375, 3.1533203125, 3.37548828125, 3.59765625, 3.81982421875, 4.0419921875, 4.26416015625, 4.486328125, 4.70849609375, 4.9306640625, 5.15283203125, 5.375, 5.59716796875, 5.8193359375, 6.04150390625, 6.263671875, 6.48583984375, 6.7080078125, 6.93017578125, 7.15234375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 7.0, 8.0, 12.0, 12.0, 10.0, 24.0, 32.0, 24.0, 31.0, 34.0, 38.0, 45.0, 41.0, 49.0, 59.0, 58.0, 47.0, 35.0, 36.0, 49.0, 36.0, 43.0, 42.0, 43.0, 35.0, 25.0, 31.0, 19.0, 13.0, 7.0, 9.0, 7.0, 9.0, 9.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.822662353515625, -3.67071533203125, -3.518768310546875, -3.3668212890625, -3.214874267578125, -3.06292724609375, -2.910980224609375, -2.759033203125, -2.607086181640625, -2.45513916015625, -2.303192138671875, -2.1512451171875, -1.999298095703125, -1.84735107421875, -1.695404052734375, -1.54345703125, -1.391510009765625, -1.23956298828125, -1.087615966796875, -0.9356689453125, -0.783721923828125, -0.63177490234375, -0.479827880859375, -0.327880859375, -0.175933837890625, -0.02398681640625, 0.127960205078125, 0.2799072265625, 0.431854248046875, 0.58380126953125, 0.735748291015625, 0.8876953125, 1.039642333984375, 1.19158935546875, 1.343536376953125, 1.4954833984375, 1.647430419921875, 1.79937744140625, 1.951324462890625, 2.103271484375, 2.255218505859375, 2.40716552734375, 2.559112548828125, 2.7110595703125, 2.863006591796875, 3.01495361328125, 3.166900634765625, 3.31884765625, 3.470794677734375, 3.62274169921875, 3.774688720703125, 3.9266357421875, 4.078582763671875, 4.23052978515625, 4.382476806640625, 4.534423828125, 4.686370849609375, 4.83831787109375, 4.990264892578125, 5.1422119140625, 5.294158935546875, 5.44610595703125, 5.598052978515625, 5.75]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 12.0, 18.0, 35.0, 49.0, 110.0, 164.0, 253.0, 412.0, 727.0, 1243.0, 2199.0, 3628.0, 6580.0, 11854.0, 22001.0, 40766.0, 78443.0, 152811.0, 294116.0, 539645.0, 824988.0, 872000.0, 615402.0, 346684.0, 180697.0, 93642.0, 48797.0, 25480.0, 13776.0, 7642.0, 4294.0, 2400.0, 1336.0, 845.0, 474.0, 279.0, 186.0, 108.0, 59.0, 45.0, 22.0, 15.0, 19.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.359375, -8.0723876953125, -7.785400390625, -7.4984130859375, -7.21142578125, -6.9244384765625, -6.637451171875, -6.3504638671875, -6.0634765625, -5.7764892578125, -5.489501953125, -5.2025146484375, -4.91552734375, -4.6285400390625, -4.341552734375, -4.0545654296875, -3.767578125, -3.4805908203125, -3.193603515625, -2.9066162109375, -2.61962890625, -2.3326416015625, -2.045654296875, -1.7586669921875, -1.4716796875, -1.1846923828125, -0.897705078125, -0.6107177734375, -0.32373046875, -0.0367431640625, 0.250244140625, 0.5372314453125, 0.82421875, 1.1112060546875, 1.398193359375, 1.6851806640625, 1.97216796875, 2.2591552734375, 2.546142578125, 2.8331298828125, 3.1201171875, 3.4071044921875, 3.694091796875, 3.9810791015625, 4.26806640625, 4.5550537109375, 4.842041015625, 5.1290283203125, 5.416015625, 5.7030029296875, 5.989990234375, 6.2769775390625, 6.56396484375, 6.8509521484375, 7.137939453125, 7.4249267578125, 7.7119140625, 7.9989013671875, 8.285888671875, 8.5728759765625, 8.85986328125, 9.1468505859375, 9.433837890625, 9.7208251953125, 10.0078125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 16.0, 15.0, 15.0, 29.0, 37.0, 37.0, 48.0, 61.0, 77.0, 111.0, 113.0, 143.0, 150.0, 204.0, 238.0, 254.0, 271.0, 257.0, 253.0, 202.0, 246.0, 233.0, 173.0, 152.0, 154.0, 110.0, 102.0, 70.0, 53.0, 43.0, 43.0, 37.0, 30.0, 23.0, 20.0, 9.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.716796875, -2.6339111328125, -2.551025390625, -2.4681396484375, -2.38525390625, -2.3023681640625, -2.219482421875, -2.1365966796875, -2.0537109375, -1.9708251953125, -1.887939453125, -1.8050537109375, -1.72216796875, -1.6392822265625, -1.556396484375, -1.4735107421875, -1.390625, -1.3077392578125, -1.224853515625, -1.1419677734375, -1.05908203125, -0.9761962890625, -0.893310546875, -0.8104248046875, -0.7275390625, -0.6446533203125, -0.561767578125, -0.4788818359375, -0.39599609375, -0.3131103515625, -0.230224609375, -0.1473388671875, -0.064453125, 0.0184326171875, 0.101318359375, 0.1842041015625, 0.26708984375, 0.3499755859375, 0.432861328125, 0.5157470703125, 0.5986328125, 0.6815185546875, 0.764404296875, 0.8472900390625, 0.93017578125, 1.0130615234375, 1.095947265625, 1.1788330078125, 1.26171875, 1.3446044921875, 1.427490234375, 1.5103759765625, 1.59326171875, 1.6761474609375, 1.759033203125, 1.8419189453125, 1.9248046875, 2.0076904296875, 2.090576171875, 2.1734619140625, 2.25634765625, 2.3392333984375, 2.422119140625, 2.5050048828125, 2.587890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 20.0, 23.0, 18.0, 22.0, 32.0, 26.0, 41.0, 41.0, 49.0, 48.0, 57.0, 53.0, 58.0, 72.0, 63.0, 61.0, 39.0, 40.0, 47.0, 37.0, 30.0, 24.0, 22.0, 11.0, 15.0, 3.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.052596092224121, -9.751803398132324, -9.451009750366211, -9.150217056274414, -8.849424362182617, -8.54863166809082, -8.247838020324707, -7.94704532623291, -7.646252155303955, -7.345458984375, -7.044666290283203, -6.743873119354248, -6.443079948425293, -6.142287254333496, -5.841494083404541, -5.540700912475586, -5.239908218383789, -4.939115047454834, -4.638322353363037, -4.337529182434082, -4.036736488342285, -3.73594331741333, -3.435150146484375, -3.134357213973999, -2.833564281463623, -2.532771348953247, -2.231978416442871, -1.931185245513916, -1.63039231300354, -1.329599380493164, -1.0288063287734985, -0.728013277053833, -0.42722129821777344, -0.12642830610275269, 0.17436468601226807, 0.4751576781272888, 0.7759506702423096, 1.0767436027526855, 1.377536654472351, 1.6783297061920166, 1.9791226387023926, 2.2799155712127686, 2.5807085037231445, 2.8815016746520996, 3.1822946071624756, 3.4830875396728516, 3.7838807106018066, 4.084673881530762, 4.385466575622559, 4.686259746551514, 4.9870524406433105, 5.287845611572266, 5.5886383056640625, 5.889431476593018, 6.190224647521973, 6.4910173416137695, 6.791810512542725, 7.09260368347168, 7.393396377563477, 7.694189548492432, 7.994982719421387, 8.295775413513184, 8.59656810760498, 8.897361755371094, 9.19815444946289]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 13.0, 12.0, 16.0, 11.0, 15.0, 10.0, 17.0, 36.0, 24.0, 32.0, 28.0, 21.0, 31.0, 30.0, 42.0, 38.0, 27.0, 43.0, 44.0, 28.0, 53.0, 37.0, 35.0, 40.0, 34.0, 36.0, 26.0, 30.0, 27.0, 26.0, 20.0, 17.0, 24.0, 12.0, 12.0, 8.0, 5.0, 11.0, 6.0, 6.0, 2.0, 7.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.544286251068115, -5.38059663772583, -5.216907024383545, -5.05321741104126, -4.889527797698975, -4.7258381843566895, -4.562148571014404, -4.398458957672119, -4.234769344329834, -4.071079730987549, -3.9073901176452637, -3.7437005043029785, -3.5800108909606934, -3.416321277618408, -3.252631664276123, -3.088942050933838, -2.9252524375915527, -2.7615628242492676, -2.5978732109069824, -2.4341835975646973, -2.270493984222412, -2.106804370880127, -1.9431147575378418, -1.7794251441955566, -1.6157355308532715, -1.4520459175109863, -1.2883563041687012, -1.124666690826416, -0.9609770774841309, -0.7972874641418457, -0.6335978507995605, -0.4699082374572754, -0.30621910095214844, -0.14252948760986328, 0.021160125732421875, 0.18484973907470703, 0.3485393524169922, 0.5122289657592773, 0.6759185791015625, 0.8396081924438477, 1.0032978057861328, 1.166987419128418, 1.3306770324707031, 1.4943666458129883, 1.6580562591552734, 1.8217458724975586, 1.9854354858398438, 2.149125099182129, 2.312814712524414, 2.476504325866699, 2.6401939392089844, 2.8038835525512695, 2.9675731658935547, 3.13126277923584, 3.294952392578125, 3.45864200592041, 3.6223316192626953, 3.7860212326049805, 3.9497108459472656, 4.113400459289551, 4.277090072631836, 4.440779685974121, 4.604469299316406, 4.768158912658691, 4.931848526000977]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 7.0, 11.0, 8.0, 23.0, 17.0, 35.0, 73.0, 93.0, 115.0, 194.0, 324.0, 501.0, 741.0, 1217.0, 2139.0, 3366.0, 5548.0, 9446.0, 16172.0, 27408.0, 47725.0, 81612.0, 132071.0, 183242.0, 187068.0, 139279.0, 87014.0, 51309.0, 29384.0, 17032.0, 10141.0, 5950.0, 3526.0, 2116.0, 1317.0, 812.0, 518.0, 330.0, 228.0, 139.0, 92.0, 66.0, 44.0, 25.0, 23.0, 14.0, 15.0, 12.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6492996215820312, -0.6277008056640625, -0.6061019897460938, -0.584503173828125, -0.5629043579101562, -0.5413055419921875, -0.5197067260742188, -0.49810791015625, -0.47650909423828125, -0.4549102783203125, -0.43331146240234375, -0.411712646484375, -0.39011383056640625, -0.3685150146484375, -0.34691619873046875, -0.3253173828125, -0.30371856689453125, -0.2821197509765625, -0.26052093505859375, -0.238922119140625, -0.21732330322265625, -0.1957244873046875, -0.17412567138671875, -0.15252685546875, -0.13092803955078125, -0.1093292236328125, -0.08773040771484375, -0.066131591796875, -0.04453277587890625, -0.0229339599609375, -0.00133514404296875, 0.020263671875, 0.04186248779296875, 0.0634613037109375, 0.08506011962890625, 0.106658935546875, 0.12825775146484375, 0.1498565673828125, 0.17145538330078125, 0.19305419921875, 0.21465301513671875, 0.2362518310546875, 0.25785064697265625, 0.279449462890625, 0.30104827880859375, 0.3226470947265625, 0.34424591064453125, 0.3658447265625, 0.38744354248046875, 0.4090423583984375, 0.43064117431640625, 0.452239990234375, 0.47383880615234375, 0.4954376220703125, 0.5170364379882812, 0.53863525390625, 0.5602340698242188, 0.5818328857421875, 0.6034317016601562, 0.625030517578125, 0.6466293334960938, 0.6682281494140625, 0.6898269653320312, 0.71142578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 2.0, 3.0, 9.0, 9.0, 11.0, 12.0, 10.0, 7.0, 14.0, 17.0, 30.0, 23.0, 29.0, 29.0, 32.0, 28.0, 35.0, 35.0, 46.0, 42.0, 40.0, 58.0, 44.0, 39.0, 53.0, 29.0, 36.0, 38.0, 34.0, 41.0, 21.0, 26.0, 21.0, 18.0, 20.0, 17.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75775146484375, -5.5623779296875, -5.36700439453125, -5.171630859375, -4.97625732421875, -4.7808837890625, -4.58551025390625, -4.39013671875, -4.19476318359375, -3.9993896484375, -3.80401611328125, -3.608642578125, -3.41326904296875, -3.2178955078125, -3.02252197265625, -2.8271484375, -2.63177490234375, -2.4364013671875, -2.24102783203125, -2.045654296875, -1.85028076171875, -1.6549072265625, -1.45953369140625, -1.26416015625, -1.06878662109375, -0.8734130859375, -0.67803955078125, -0.482666015625, -0.28729248046875, -0.0919189453125, 0.10345458984375, 0.298828125, 0.49420166015625, 0.6895751953125, 0.88494873046875, 1.080322265625, 1.27569580078125, 1.4710693359375, 1.66644287109375, 1.86181640625, 2.05718994140625, 2.2525634765625, 2.44793701171875, 2.643310546875, 2.83868408203125, 3.0340576171875, 3.22943115234375, 3.4248046875, 3.62017822265625, 3.8155517578125, 4.01092529296875, 4.206298828125, 4.40167236328125, 4.5970458984375, 4.79241943359375, 4.98779296875, 5.18316650390625, 5.3785400390625, 5.57391357421875, 5.769287109375, 5.96466064453125, 6.1600341796875, 6.35540771484375, 6.55078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 5.0, 13.0, 13.0, 12.0, 18.0, 29.0, 38.0, 46.0, 56.0, 84.0, 120.0, 146.0, 212.0, 306.0, 506.0, 682.0, 1115.0, 1899.0, 3222.0, 6055.0, 12095.0, 26672.0, 184586.0, 736996.0, 39928.0, 15604.0, 7679.0, 4032.0, 2341.0, 1397.0, 809.0, 515.0, 356.0, 257.0, 196.0, 140.0, 96.0, 60.0, 54.0, 42.0, 21.0, 26.0, 23.0, 7.0, 6.0, 8.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.912109375, -1.8487548828125, -1.785400390625, -1.7220458984375, -1.65869140625, -1.5953369140625, -1.531982421875, -1.4686279296875, -1.4052734375, -1.3419189453125, -1.278564453125, -1.2152099609375, -1.15185546875, -1.0885009765625, -1.025146484375, -0.9617919921875, -0.8984375, -0.8350830078125, -0.771728515625, -0.7083740234375, -0.64501953125, -0.5816650390625, -0.518310546875, -0.4549560546875, -0.3916015625, -0.3282470703125, -0.264892578125, -0.2015380859375, -0.13818359375, -0.0748291015625, -0.011474609375, 0.0518798828125, 0.115234375, 0.1785888671875, 0.241943359375, 0.3052978515625, 0.36865234375, 0.4320068359375, 0.495361328125, 0.5587158203125, 0.6220703125, 0.6854248046875, 0.748779296875, 0.8121337890625, 0.87548828125, 0.9388427734375, 1.002197265625, 1.0655517578125, 1.12890625, 1.1922607421875, 1.255615234375, 1.3189697265625, 1.38232421875, 1.4456787109375, 1.509033203125, 1.5723876953125, 1.6357421875, 1.6990966796875, 1.762451171875, 1.8258056640625, 1.88916015625, 1.9525146484375, 2.015869140625, 2.0792236328125, 2.142578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 7.0, 8.0, 8.0, 13.0, 11.0, 11.0, 19.0, 22.0, 22.0, 20.0, 22.0, 34.0, 33.0, 32.0, 40.0, 31.0, 33.0, 41.0, 40.0, 38.0, 43.0, 38.0, 46.0, 38.0, 32.0, 33.0, 29.0, 31.0, 36.0, 27.0, 30.0, 21.0, 15.0, 14.0, 12.0, 9.0, 10.0, 13.0, 3.0, 4.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.703125, -3.583343505859375, -3.46356201171875, -3.343780517578125, -3.2239990234375, -3.104217529296875, -2.98443603515625, -2.864654541015625, -2.744873046875, -2.625091552734375, -2.50531005859375, -2.385528564453125, -2.2657470703125, -2.145965576171875, -2.02618408203125, -1.906402587890625, -1.78662109375, -1.666839599609375, -1.54705810546875, -1.427276611328125, -1.3074951171875, -1.187713623046875, -1.06793212890625, -0.948150634765625, -0.828369140625, -0.708587646484375, -0.58880615234375, -0.469024658203125, -0.3492431640625, -0.229461669921875, -0.10968017578125, 0.010101318359375, 0.1298828125, 0.249664306640625, 0.36944580078125, 0.489227294921875, 0.6090087890625, 0.728790283203125, 0.84857177734375, 0.968353271484375, 1.088134765625, 1.207916259765625, 1.32769775390625, 1.447479248046875, 1.5672607421875, 1.687042236328125, 1.80682373046875, 1.926605224609375, 2.04638671875, 2.166168212890625, 2.28594970703125, 2.405731201171875, 2.5255126953125, 2.645294189453125, 2.76507568359375, 2.884857177734375, 3.004638671875, 3.124420166015625, 3.24420166015625, 3.363983154296875, 3.4837646484375, 3.603546142578125, 3.72332763671875, 3.843109130859375, 3.962890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 11.0, 12.0, 28.0, 25.0, 56.0, 65.0, 94.0, 115.0, 184.0, 285.0, 421.0, 642.0, 979.0, 1461.0, 2147.0, 3379.0, 5138.0, 8188.0, 13455.0, 23715.0, 108709.0, 799764.0, 34049.0, 17211.0, 10228.0, 6368.0, 3996.0, 2624.0, 1754.0, 1149.0, 754.0, 491.0, 336.0, 220.0, 154.0, 111.0, 72.0, 49.0, 32.0, 30.0, 14.0, 11.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.349609375, -0.33908843994140625, -0.3285675048828125, -0.31804656982421875, -0.307525634765625, -0.29700469970703125, -0.2864837646484375, -0.27596282958984375, -0.26544189453125, -0.25492095947265625, -0.2444000244140625, -0.23387908935546875, -0.223358154296875, -0.21283721923828125, -0.2023162841796875, -0.19179534912109375, -0.1812744140625, -0.17075347900390625, -0.1602325439453125, -0.14971160888671875, -0.139190673828125, -0.12866973876953125, -0.1181488037109375, -0.10762786865234375, -0.09710693359375, -0.08658599853515625, -0.0760650634765625, -0.06554412841796875, -0.055023193359375, -0.04450225830078125, -0.0339813232421875, -0.02346038818359375, -0.012939453125, -0.00241851806640625, 0.0081024169921875, 0.01862335205078125, 0.029144287109375, 0.03966522216796875, 0.0501861572265625, 0.06070709228515625, 0.07122802734375, 0.08174896240234375, 0.0922698974609375, 0.10279083251953125, 0.113311767578125, 0.12383270263671875, 0.1343536376953125, 0.14487457275390625, 0.1553955078125, 0.16591644287109375, 0.1764373779296875, 0.18695831298828125, 0.197479248046875, 0.20800018310546875, 0.2185211181640625, 0.22904205322265625, 0.23956298828125, 0.25008392333984375, 0.2606048583984375, 0.27112579345703125, 0.281646728515625, 0.29216766357421875, 0.3026885986328125, 0.31320953369140625, 0.32373046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 10.0, 19.0, 19.0, 23.0, 26.0, 28.0, 33.0, 29.0, 24.0, 34.0, 30.0, 43.0, 37.0, 38.0, 29.0, 38.0, 44.0, 55.0, 57.0, 24.0, 38.0, 40.0, 34.0, 38.0, 26.0, 19.0, 21.0, 27.0, 9.0, 21.0, 12.0, 8.0, 11.0, 7.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3769214749336243e-05, -2.2921711206436157e-05, -2.2074207663536072e-05, -2.1226704120635986e-05, -2.03792005777359e-05, -1.9531697034835815e-05, -1.868419349193573e-05, -1.7836689949035645e-05, -1.698918640613556e-05, -1.6141682863235474e-05, -1.5294179320335388e-05, -1.4446675777435303e-05, -1.3599172234535217e-05, -1.2751668691635132e-05, -1.1904165148735046e-05, -1.1056661605834961e-05, -1.0209158062934875e-05, -9.36165452003479e-06, -8.514150977134705e-06, -7.666647434234619e-06, -6.819143891334534e-06, -5.971640348434448e-06, -5.124136805534363e-06, -4.276633262634277e-06, -3.429129719734192e-06, -2.5816261768341064e-06, -1.734122633934021e-06, -8.866190910339355e-07, -3.91155481338501e-08, 8.083879947662354e-07, 1.6558915376663208e-06, 2.5033950805664062e-06, 3.3508986234664917e-06, 4.198402166366577e-06, 5.045905709266663e-06, 5.893409252166748e-06, 6.7409127950668335e-06, 7.588416337966919e-06, 8.435919880867004e-06, 9.28342342376709e-06, 1.0130926966667175e-05, 1.097843050956726e-05, 1.1825934052467346e-05, 1.2673437595367432e-05, 1.3520941138267517e-05, 1.4368444681167603e-05, 1.5215948224067688e-05, 1.6063451766967773e-05, 1.691095530986786e-05, 1.7758458852767944e-05, 1.860596239566803e-05, 1.9453465938568115e-05, 2.03009694814682e-05, 2.1148473024368286e-05, 2.199597656726837e-05, 2.2843480110168457e-05, 2.3690983653068542e-05, 2.4538487195968628e-05, 2.5385990738868713e-05, 2.62334942817688e-05, 2.7080997824668884e-05, 2.792850136756897e-05, 2.8776004910469055e-05, 2.962350845336914e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 17.0, 23.0, 28.0, 37.0, 54.0, 89.0, 119.0, 198.0, 294.0, 484.0, 829.0, 1229.0, 1873.0, 2948.0, 4883.0, 7726.0, 12928.0, 21809.0, 36345.0, 61327.0, 100451.0, 150181.0, 184201.0, 165239.0, 115510.0, 71664.0, 42942.0, 25444.0, 15322.0, 9088.0, 5701.0, 3518.0, 2197.0, 1380.0, 905.0, 567.0, 350.0, 222.0, 143.0, 98.0, 66.0, 43.0, 29.0, 17.0, 13.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.18826675415039062, -0.18231964111328125, -0.17637252807617188, -0.1704254150390625, -0.16447830200195312, -0.15853118896484375, -0.15258407592773438, -0.146636962890625, -0.14068984985351562, -0.13474273681640625, -0.12879562377929688, -0.1228485107421875, -0.11690139770507812, -0.11095428466796875, -0.10500717163085938, -0.09906005859375, -0.09311294555664062, -0.08716583251953125, -0.08121871948242188, -0.0752716064453125, -0.06932449340820312, -0.06337738037109375, -0.057430267333984375, -0.051483154296875, -0.045536041259765625, -0.03958892822265625, -0.033641815185546875, -0.0276947021484375, -0.021747589111328125, -0.01580047607421875, -0.009853363037109375, -0.00390625, 0.002040863037109375, 0.00798797607421875, 0.013935089111328125, 0.0198822021484375, 0.025829315185546875, 0.03177642822265625, 0.037723541259765625, 0.043670654296875, 0.049617767333984375, 0.05556488037109375, 0.061511993408203125, 0.0674591064453125, 0.07340621948242188, 0.07935333251953125, 0.08530044555664062, 0.09124755859375, 0.09719467163085938, 0.10314178466796875, 0.10908889770507812, 0.1150360107421875, 0.12098312377929688, 0.12693023681640625, 0.13287734985351562, 0.138824462890625, 0.14477157592773438, 0.15071868896484375, 0.15666580200195312, 0.1626129150390625, 0.16856002807617188, 0.17450714111328125, 0.18045425415039062, 0.1864013671875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 15.0, 14.0, 16.0, 26.0, 34.0, 29.0, 43.0, 39.0, 47.0, 53.0, 44.0, 71.0, 56.0, 69.0, 50.0, 48.0, 54.0, 54.0, 39.0, 25.0, 30.0, 23.0, 19.0, 16.0, 13.0, 8.0, 9.0, 8.0, 9.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.055511474609375, -0.05358457565307617, -0.051657676696777344, -0.049730777740478516, -0.04780387878417969, -0.04587697982788086, -0.04395008087158203, -0.0420231819152832, -0.040096282958984375, -0.03816938400268555, -0.03624248504638672, -0.03431558609008789, -0.03238868713378906, -0.030461788177490234, -0.028534889221191406, -0.026607990264892578, -0.02468109130859375, -0.022754192352294922, -0.020827293395996094, -0.018900394439697266, -0.016973495483398438, -0.01504659652709961, -0.013119697570800781, -0.011192798614501953, -0.009265899658203125, -0.007339000701904297, -0.005412101745605469, -0.0034852027893066406, -0.0015583038330078125, 0.0003685951232910156, 0.0022954940795898438, 0.004222393035888672, 0.0061492919921875, 0.008076190948486328, 0.010003089904785156, 0.011929988861083984, 0.013856887817382812, 0.01578378677368164, 0.01771068572998047, 0.019637584686279297, 0.021564483642578125, 0.023491382598876953, 0.02541828155517578, 0.02734518051147461, 0.029272079467773438, 0.031198978424072266, 0.033125877380371094, 0.03505277633666992, 0.03697967529296875, 0.03890657424926758, 0.040833473205566406, 0.042760372161865234, 0.04468727111816406, 0.04661417007446289, 0.04854106903076172, 0.05046796798706055, 0.052394866943359375, 0.0543217658996582, 0.05624866485595703, 0.05817556381225586, 0.06010246276855469, 0.062029361724853516, 0.06395626068115234, 0.06588315963745117, 0.06781005859375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 6.0, 13.0, 22.0, 18.0, 22.0, 21.0, 37.0, 32.0, 41.0, 47.0, 47.0, 47.0, 58.0, 57.0, 65.0, 70.0, 48.0, 60.0, 41.0, 44.0, 37.0, 34.0, 31.0, 21.0, 18.0, 12.0, 10.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.832262992858887, -9.5341215133667, -9.235980033874512, -8.937837600708008, -8.63969612121582, -8.341554641723633, -8.043413162231445, -7.745271682739258, -7.447129726409912, -7.148988246917725, -6.850846290588379, -6.552704811096191, -6.254563331604004, -5.956421375274658, -5.658279895782471, -5.360137939453125, -5.0619964599609375, -4.76385498046875, -4.465713024139404, -4.167571544647217, -3.86942982673645, -3.5712881088256836, -3.273146629333496, -2.9750049114227295, -2.676863193511963, -2.3787214756011963, -2.0805797576904297, -1.7824382781982422, -1.4842965602874756, -1.186154842376709, -0.8880132436752319, -0.5898716449737549, -0.2917299270629883, 0.006411731243133545, 0.30455338954925537, 0.6026950478553772, 0.900836706161499, 1.1989784240722656, 1.4971200227737427, 1.7952616214752197, 2.0934033393859863, 2.391545057296753, 2.6896867752075195, 2.987828254699707, 3.2859699726104736, 3.5841116905212402, 3.8822531700134277, 4.180395126342773, 4.478536605834961, 4.776678085327148, 5.074820041656494, 5.372961521148682, 5.671103477478027, 5.969244956970215, 6.267386436462402, 6.56552791595459, 6.8636698722839355, 7.161811351776123, 7.459953308105469, 7.758094787597656, 8.056236267089844, 8.354377746582031, 8.652520179748535, 8.950661659240723, 9.24880313873291]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 7.0, 7.0, 15.0, 12.0, 16.0, 9.0, 14.0, 12.0, 17.0, 35.0, 29.0, 30.0, 25.0, 23.0, 31.0, 36.0, 36.0, 37.0, 29.0, 51.0, 36.0, 31.0, 47.0, 45.0, 32.0, 38.0, 34.0, 32.0, 30.0, 30.0, 28.0, 25.0, 19.0, 14.0, 24.0, 12.0, 14.0, 7.0, 5.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.478827476501465, -5.315625190734863, -5.1524224281311035, -4.989220142364502, -4.8260178565979, -4.662815570831299, -4.499612808227539, -4.3364105224609375, -4.173208236694336, -4.010005950927734, -3.8468034267425537, -3.683600902557373, -3.5203986167907715, -3.357196092605591, -3.19399356842041, -3.0307912826538086, -2.867588758468628, -2.7043862342834473, -2.5411839485168457, -2.377981424331665, -2.2147791385650635, -2.051576614379883, -1.8883742094039917, -1.7251718044281006, -1.5619693994522095, -1.3987669944763184, -1.2355645895004272, -1.0723621845245361, -0.9091597199440002, -0.7459573149681091, -0.5827548503875732, -0.41955244541168213, -0.256350040435791, -0.09314762055873871, 0.0700547993183136, 0.2332572340965271, 0.3964596390724182, 0.5596620440483093, 0.7228645086288452, 0.8860669136047363, 1.0492693185806274, 1.2124717235565186, 1.3756741285324097, 1.5388765335083008, 1.7020790576934814, 1.865281343460083, 2.0284838676452637, 2.1916861534118652, 2.354888677597046, 2.5180912017822266, 2.681293487548828, 2.844496011734009, 3.0076982975006104, 3.170900821685791, 3.3341031074523926, 3.4973056316375732, 3.660508155822754, 3.8237106800079346, 3.986912965774536, 4.150115489959717, 4.313317775726318, 4.47652006149292, 4.63972282409668, 4.802925109863281, 4.966127395629883]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 22.0, 21.0, 47.0, 60.0, 94.0, 147.0, 229.0, 325.0, 463.0, 735.0, 1195.0, 1746.0, 2808.0, 4309.0, 6651.0, 9953.0, 14834.0, 22394.0, 32843.0, 46396.0, 63640.0, 82631.0, 99908.0, 110825.0, 112827.0, 104792.0, 89115.0, 70896.0, 53277.0, 37934.0, 25945.0, 17783.0, 11644.0, 7599.0, 5015.0, 3284.0, 2128.0, 1416.0, 900.0, 566.0, 363.0, 285.0, 163.0, 115.0, 72.0, 54.0, 34.0, 20.0, 18.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.8984375, -3.77734375, -3.65625, -3.53515625, -3.4140625, -3.29296875, -3.171875, -3.05078125, -2.9296875, -2.80859375, -2.6875, -2.56640625, -2.4453125, -2.32421875, -2.203125, -2.08203125, -1.9609375, -1.83984375, -1.71875, -1.59765625, -1.4765625, -1.35546875, -1.234375, -1.11328125, -0.9921875, -0.87109375, -0.75, -0.62890625, -0.5078125, -0.38671875, -0.265625, -0.14453125, -0.0234375, 0.09765625, 0.21875, 0.33984375, 0.4609375, 0.58203125, 0.703125, 0.82421875, 0.9453125, 1.06640625, 1.1875, 1.30859375, 1.4296875, 1.55078125, 1.671875, 1.79296875, 1.9140625, 2.03515625, 2.15625, 2.27734375, 2.3984375, 2.51953125, 2.640625, 2.76171875, 2.8828125, 3.00390625, 3.125, 3.24609375, 3.3671875, 3.48828125, 3.609375, 3.73046875, 3.8515625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 14.0, 11.0, 24.0, 17.0, 18.0, 26.0, 37.0, 26.0, 32.0, 18.0, 32.0, 38.0, 46.0, 31.0, 40.0, 48.0, 28.0, 39.0, 47.0, 32.0, 39.0, 41.0, 25.0, 44.0, 30.0, 31.0, 23.0, 22.0, 24.0, 22.0, 7.0, 10.0, 9.0, 7.0, 5.0, 9.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0], "bins": [-6.69140625, -6.51092529296875, -6.3304443359375, -6.14996337890625, -5.969482421875, -5.78900146484375, -5.6085205078125, -5.42803955078125, -5.24755859375, -5.06707763671875, -4.8865966796875, -4.70611572265625, -4.525634765625, -4.34515380859375, -4.1646728515625, -3.98419189453125, -3.8037109375, -3.62322998046875, -3.4427490234375, -3.26226806640625, -3.081787109375, -2.90130615234375, -2.7208251953125, -2.54034423828125, -2.35986328125, -2.17938232421875, -1.9989013671875, -1.81842041015625, -1.637939453125, -1.45745849609375, -1.2769775390625, -1.09649658203125, -0.916015625, -0.73553466796875, -0.5550537109375, -0.37457275390625, -0.194091796875, -0.01361083984375, 0.1668701171875, 0.34735107421875, 0.52783203125, 0.70831298828125, 0.8887939453125, 1.06927490234375, 1.249755859375, 1.43023681640625, 1.6107177734375, 1.79119873046875, 1.9716796875, 2.15216064453125, 2.3326416015625, 2.51312255859375, 2.693603515625, 2.87408447265625, 3.0545654296875, 3.23504638671875, 3.41552734375, 3.59600830078125, 3.7764892578125, 3.95697021484375, 4.137451171875, 4.31793212890625, 4.4984130859375, 4.67889404296875, 4.859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 24.0, 21.0, 34.0, 52.0, 85.0, 112.0, 179.0, 275.0, 445.0, 679.0, 1075.0, 1722.0, 2652.0, 4383.0, 6939.0, 10829.0, 16856.0, 26276.0, 39140.0, 56839.0, 78006.0, 100234.0, 117554.0, 123762.0, 116502.0, 99299.0, 77704.0, 56173.0, 38992.0, 25871.0, 16858.0, 10662.0, 6653.0, 4335.0, 2684.0, 1675.0, 1064.0, 709.0, 397.0, 281.0, 165.0, 107.0, 67.0, 57.0, 39.0, 27.0, 13.0, 10.0, 11.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.40234375, -4.2579345703125, -4.113525390625, -3.9691162109375, -3.82470703125, -3.6802978515625, -3.535888671875, -3.3914794921875, -3.2470703125, -3.1026611328125, -2.958251953125, -2.8138427734375, -2.66943359375, -2.5250244140625, -2.380615234375, -2.2362060546875, -2.091796875, -1.9473876953125, -1.802978515625, -1.6585693359375, -1.51416015625, -1.3697509765625, -1.225341796875, -1.0809326171875, -0.9365234375, -0.7921142578125, -0.647705078125, -0.5032958984375, -0.35888671875, -0.2144775390625, -0.070068359375, 0.0743408203125, 0.21875, 0.3631591796875, 0.507568359375, 0.6519775390625, 0.79638671875, 0.9407958984375, 1.085205078125, 1.2296142578125, 1.3740234375, 1.5184326171875, 1.662841796875, 1.8072509765625, 1.95166015625, 2.0960693359375, 2.240478515625, 2.3848876953125, 2.529296875, 2.6737060546875, 2.818115234375, 2.9625244140625, 3.10693359375, 3.2513427734375, 3.395751953125, 3.5401611328125, 3.6845703125, 3.8289794921875, 3.973388671875, 4.1177978515625, 4.26220703125, 4.4066162109375, 4.551025390625, 4.6954345703125, 4.83984375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 8.0, 6.0, 14.0, 10.0, 11.0, 14.0, 22.0, 30.0, 29.0, 41.0, 30.0, 37.0, 38.0, 33.0, 42.0, 62.0, 44.0, 39.0, 48.0, 60.0, 28.0, 58.0, 34.0, 34.0, 35.0, 29.0, 34.0, 21.0, 31.0, 23.0, 15.0, 9.0, 6.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.12774658203125, -3.9976806640625, -3.86761474609375, -3.737548828125, -3.60748291015625, -3.4774169921875, -3.34735107421875, -3.21728515625, -3.08721923828125, -2.9571533203125, -2.82708740234375, -2.697021484375, -2.56695556640625, -2.4368896484375, -2.30682373046875, -2.1767578125, -2.04669189453125, -1.9166259765625, -1.78656005859375, -1.656494140625, -1.52642822265625, -1.3963623046875, -1.26629638671875, -1.13623046875, -1.00616455078125, -0.8760986328125, -0.74603271484375, -0.615966796875, -0.48590087890625, -0.3558349609375, -0.22576904296875, -0.095703125, 0.03436279296875, 0.1644287109375, 0.29449462890625, 0.424560546875, 0.55462646484375, 0.6846923828125, 0.81475830078125, 0.94482421875, 1.07489013671875, 1.2049560546875, 1.33502197265625, 1.465087890625, 1.59515380859375, 1.7252197265625, 1.85528564453125, 1.9853515625, 2.11541748046875, 2.2454833984375, 2.37554931640625, 2.505615234375, 2.63568115234375, 2.7657470703125, 2.89581298828125, 3.02587890625, 3.15594482421875, 3.2860107421875, 3.41607666015625, 3.546142578125, 3.67620849609375, 3.8062744140625, 3.93634033203125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 3.0, 15.0, 10.0, 19.0, 25.0, 47.0, 63.0, 91.0, 125.0, 194.0, 296.0, 433.0, 720.0, 1195.0, 1816.0, 2996.0, 4833.0, 8690.0, 14858.0, 26382.0, 46171.0, 79822.0, 125716.0, 170667.0, 180963.0, 147400.0, 97897.0, 58227.0, 33236.0, 18851.0, 10844.0, 6154.0, 3639.0, 2275.0, 1386.0, 882.0, 568.0, 342.0, 247.0, 144.0, 93.0, 73.0, 41.0, 29.0, 30.0, 19.0, 3.0, 4.0, 5.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0859375, -3.95501708984375, -3.8240966796875, -3.69317626953125, -3.562255859375, -3.43133544921875, -3.3004150390625, -3.16949462890625, -3.03857421875, -2.90765380859375, -2.7767333984375, -2.64581298828125, -2.514892578125, -2.38397216796875, -2.2530517578125, -2.12213134765625, -1.9912109375, -1.86029052734375, -1.7293701171875, -1.59844970703125, -1.467529296875, -1.33660888671875, -1.2056884765625, -1.07476806640625, -0.94384765625, -0.81292724609375, -0.6820068359375, -0.55108642578125, -0.420166015625, -0.28924560546875, -0.1583251953125, -0.02740478515625, 0.103515625, 0.23443603515625, 0.3653564453125, 0.49627685546875, 0.627197265625, 0.75811767578125, 0.8890380859375, 1.01995849609375, 1.15087890625, 1.28179931640625, 1.4127197265625, 1.54364013671875, 1.674560546875, 1.80548095703125, 1.9364013671875, 2.06732177734375, 2.1982421875, 2.32916259765625, 2.4600830078125, 2.59100341796875, 2.721923828125, 2.85284423828125, 2.9837646484375, 3.11468505859375, 3.24560546875, 3.37652587890625, 3.5074462890625, 3.63836669921875, 3.769287109375, 3.90020751953125, 4.0311279296875, 4.16204833984375, 4.29296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 3.0, 9.0, 13.0, 17.0, 14.0, 19.0, 36.0, 30.0, 47.0, 50.0, 61.0, 71.0, 86.0, 66.0, 60.0, 63.0, 68.0, 44.0, 38.0, 44.0, 21.0, 26.0, 17.0, 16.0, 12.0, 16.0, 8.0, 2.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005102157592773438, -0.0004954151809215546, -0.0004806146025657654, -0.0004658140242099762, -0.000451013445854187, -0.00043621286749839783, -0.00042141228914260864, -0.00040661171078681946, -0.0003918111324310303, -0.0003770105540752411, -0.0003622099757194519, -0.0003474093973636627, -0.00033260881900787354, -0.00031780824065208435, -0.00030300766229629517, -0.000288207083940506, -0.0002734065055847168, -0.0002586059272289276, -0.00024380534887313843, -0.00022900477051734924, -0.00021420419216156006, -0.00019940361380577087, -0.0001846030354499817, -0.0001698024570941925, -0.00015500187873840332, -0.00014020130038261414, -0.00012540072202682495, -0.00011060014367103577, -9.579956531524658e-05, -8.09989869594574e-05, -6.619840860366821e-05, -5.139783024787903e-05, -3.6597251892089844e-05, -2.179667353630066e-05, -6.996095180511475e-06, 7.80448317527771e-06, 2.2605061531066895e-05, 3.740563988685608e-05, 5.2206218242645264e-05, 6.700679659843445e-05, 8.180737495422363e-05, 9.660795331001282e-05, 0.000111408531665802, 0.0001262091100215912, 0.00014100968837738037, 0.00015581026673316956, 0.00017061084508895874, 0.00018541142344474792, 0.0002002120018005371, 0.0002150125801563263, 0.00022981315851211548, 0.00024461373686790466, 0.00025941431522369385, 0.00027421489357948303, 0.0002890154719352722, 0.0003038160502910614, 0.0003186166286468506, 0.00033341720700263977, 0.00034821778535842896, 0.00036301836371421814, 0.0003778189420700073, 0.0003926195204257965, 0.0004074200987815857, 0.0004222206771373749, 0.00043702125549316406]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 10.0, 14.0, 27.0, 50.0, 67.0, 81.0, 117.0, 170.0, 266.0, 431.0, 694.0, 1045.0, 1694.0, 2659.0, 4658.0, 7731.0, 13490.0, 24031.0, 42880.0, 76789.0, 124727.0, 174583.0, 188610.0, 151719.0, 98752.0, 57985.0, 32072.0, 17849.0, 10006.0, 5961.0, 3511.0, 2121.0, 1316.0, 819.0, 523.0, 368.0, 234.0, 142.0, 125.0, 74.0, 51.0, 28.0, 25.0, 16.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.8359375, -4.69049072265625, -4.5450439453125, -4.39959716796875, -4.254150390625, -4.10870361328125, -3.9632568359375, -3.81781005859375, -3.67236328125, -3.52691650390625, -3.3814697265625, -3.23602294921875, -3.090576171875, -2.94512939453125, -2.7996826171875, -2.65423583984375, -2.5087890625, -2.36334228515625, -2.2178955078125, -2.07244873046875, -1.927001953125, -1.78155517578125, -1.6361083984375, -1.49066162109375, -1.34521484375, -1.19976806640625, -1.0543212890625, -0.90887451171875, -0.763427734375, -0.61798095703125, -0.4725341796875, -0.32708740234375, -0.181640625, -0.03619384765625, 0.1092529296875, 0.25469970703125, 0.400146484375, 0.54559326171875, 0.6910400390625, 0.83648681640625, 0.98193359375, 1.12738037109375, 1.2728271484375, 1.41827392578125, 1.563720703125, 1.70916748046875, 1.8546142578125, 2.00006103515625, 2.1455078125, 2.29095458984375, 2.4364013671875, 2.58184814453125, 2.727294921875, 2.87274169921875, 3.0181884765625, 3.16363525390625, 3.30908203125, 3.45452880859375, 3.5999755859375, 3.74542236328125, 3.890869140625, 4.03631591796875, 4.1817626953125, 4.32720947265625, 4.47265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 9.0, 6.0, 4.0, 13.0, 12.0, 14.0, 13.0, 23.0, 26.0, 34.0, 42.0, 55.0, 54.0, 53.0, 68.0, 60.0, 66.0, 60.0, 65.0, 58.0, 56.0, 42.0, 20.0, 30.0, 21.0, 12.0, 15.0, 13.0, 15.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5048828125, -1.4627532958984375, -1.420623779296875, -1.3784942626953125, -1.33636474609375, -1.2942352294921875, -1.252105712890625, -1.2099761962890625, -1.1678466796875, -1.1257171630859375, -1.083587646484375, -1.0414581298828125, -0.99932861328125, -0.9571990966796875, -0.915069580078125, -0.8729400634765625, -0.830810546875, -0.7886810302734375, -0.746551513671875, -0.7044219970703125, -0.66229248046875, -0.6201629638671875, -0.578033447265625, -0.5359039306640625, -0.4937744140625, -0.4516448974609375, -0.409515380859375, -0.3673858642578125, -0.32525634765625, -0.2831268310546875, -0.240997314453125, -0.1988677978515625, -0.15673828125, -0.1146087646484375, -0.072479248046875, -0.0303497314453125, 0.01177978515625, 0.0539093017578125, 0.096038818359375, 0.1381683349609375, 0.1802978515625, 0.2224273681640625, 0.264556884765625, 0.3066864013671875, 0.34881591796875, 0.3909454345703125, 0.433074951171875, 0.4752044677734375, 0.517333984375, 0.5594635009765625, 0.601593017578125, 0.6437225341796875, 0.68585205078125, 0.7279815673828125, 0.770111083984375, 0.8122406005859375, 0.8543701171875, 0.8964996337890625, 0.938629150390625, 0.9807586669921875, 1.02288818359375, 1.0650177001953125, 1.107147216796875, 1.1492767333984375, 1.19140625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 8.0, 6.0, 8.0, 10.0, 12.0, 25.0, 14.0, 24.0, 34.0, 26.0, 36.0, 41.0, 55.0, 48.0, 42.0, 54.0, 55.0, 62.0, 65.0, 49.0, 51.0, 42.0, 46.0, 41.0, 34.0, 15.0, 21.0, 24.0, 12.0, 12.0, 6.0, 9.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.650629043579102, -10.352104187011719, -10.053580284118652, -9.75505542755127, -9.456531524658203, -9.15800666809082, -8.859481811523438, -8.560957908630371, -8.262433052062988, -7.963908672332764, -7.665384292602539, -7.366859436035156, -7.068335056304932, -6.769810676574707, -6.471286296844482, -6.172761917114258, -5.874237537384033, -5.575713157653809, -5.277188777923584, -4.978664398193359, -4.680139541625977, -4.381615161895752, -4.083090782165527, -3.7845661640167236, -3.486041784286499, -3.1875174045562744, -2.8889927864074707, -2.590468406677246, -2.2919440269470215, -1.9934194087982178, -1.6948950290679932, -1.3963704109191895, -1.0978460311889648, -0.7993215322494507, -0.5007970929145813, -0.20227265357971191, 0.09625184535980225, 0.3947763442993164, 0.693300724029541, 0.9918253421783447, 1.2903497219085693, 1.5888742208480835, 1.8873987197875977, 2.1859230995178223, 2.484447479248047, 2.7829720973968506, 3.081496477127075, 3.380021095275879, 3.6785454750061035, 3.977069854736328, 4.275594234466553, 4.574118614196777, 4.87264347076416, 5.171167850494385, 5.469692230224609, 5.768217086791992, 6.066740989685059, 6.365265369415283, 6.663789749145508, 6.962314605712891, 7.260838985443115, 7.55936336517334, 7.8578877449035645, 8.156412124633789, 8.454936981201172]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 13.0, 12.0, 19.0, 19.0, 18.0, 26.0, 20.0, 26.0, 32.0, 34.0, 36.0, 37.0, 31.0, 43.0, 49.0, 50.0, 34.0, 37.0, 42.0, 37.0, 40.0, 30.0, 39.0, 37.0, 27.0, 25.0, 29.0, 23.0, 23.0, 16.0, 18.0, 10.0, 8.0, 13.0, 9.0, 9.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.264275074005127, -6.079763412475586, -5.895252227783203, -5.710740566253662, -5.526229381561279, -5.341717720031738, -5.1572065353393555, -4.9726948738098145, -4.788183689117432, -4.603672027587891, -4.419160842895508, -4.234649181365967, -4.050137996673584, -3.865626573562622, -3.68111515045166, -3.496603488922119, -3.3120920658111572, -3.1275806427001953, -2.9430692195892334, -2.7585577964782715, -2.5740463733673096, -2.3895349502563477, -2.2050232887268066, -2.020512104034424, -1.8360005617141724, -1.6514891386032104, -1.4669777154922485, -1.282466173171997, -1.0979547500610352, -0.913443386554718, -0.7289319038391113, -0.5444204807281494, -0.3599090576171875, -0.1753976196050644, 0.009113818407058716, 0.19362527132034302, 0.37813669443130493, 0.5626481175422668, 0.7471596002578735, 0.9316710233688354, 1.1161824464797974, 1.3006938695907593, 1.4852052927017212, 1.6697168350219727, 1.8542282581329346, 2.0387396812438965, 2.2232511043548584, 2.4077625274658203, 2.5922739505767822, 2.776785373687744, 2.961296796798706, 3.145808219909668, 3.33031964302063, 3.514831066131592, 3.699342727661133, 3.8838539123535156, 4.068365573883057, 4.252877235412598, 4.4373884201049805, 4.6219000816345215, 4.806411266326904, 4.990922927856445, 5.175434112548828, 5.359945774078369, 5.544456958770752]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 19.0, 22.0, 27.0, 37.0, 68.0, 103.0, 165.0, 216.0, 318.0, 554.0, 766.0, 1223.0, 1942.0, 3110.0, 5101.0, 8688.0, 15240.0, 27559.0, 51448.0, 101181.0, 207114.0, 427300.0, 767312.0, 963519.0, 758700.0, 424153.0, 209678.0, 103656.0, 52238.0, 27649.0, 14766.0, 8443.0, 4816.0, 2732.0, 1664.0, 1050.0, 610.0, 431.0, 248.0, 145.0, 83.0, 60.0, 41.0, 27.0, 19.0, 14.0, 9.0, 6.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.0078125, -9.7176513671875, -9.427490234375, -9.1373291015625, -8.84716796875, -8.5570068359375, -8.266845703125, -7.9766845703125, -7.6865234375, -7.3963623046875, -7.106201171875, -6.8160400390625, -6.52587890625, -6.2357177734375, -5.945556640625, -5.6553955078125, -5.365234375, -5.0750732421875, -4.784912109375, -4.4947509765625, -4.20458984375, -3.9144287109375, -3.624267578125, -3.3341064453125, -3.0439453125, -2.7537841796875, -2.463623046875, -2.1734619140625, -1.88330078125, -1.5931396484375, -1.302978515625, -1.0128173828125, -0.72265625, -0.4324951171875, -0.142333984375, 0.1478271484375, 0.43798828125, 0.7281494140625, 1.018310546875, 1.3084716796875, 1.5986328125, 1.8887939453125, 2.178955078125, 2.4691162109375, 2.75927734375, 3.0494384765625, 3.339599609375, 3.6297607421875, 3.919921875, 4.2100830078125, 4.500244140625, 4.7904052734375, 5.08056640625, 5.3707275390625, 5.660888671875, 5.9510498046875, 6.2412109375, 6.5313720703125, 6.821533203125, 7.1116943359375, 7.40185546875, 7.6920166015625, 7.982177734375, 8.2723388671875, 8.5625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 5.0, 7.0, 15.0, 11.0, 24.0, 14.0, 15.0, 22.0, 23.0, 32.0, 26.0, 35.0, 40.0, 41.0, 41.0, 43.0, 46.0, 49.0, 42.0, 35.0, 43.0, 31.0, 25.0, 40.0, 31.0, 35.0, 32.0, 29.0, 27.0, 25.0, 17.0, 15.0, 15.0, 11.0, 12.0, 4.0, 13.0, 4.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.1875, -5.01556396484375, -4.8436279296875, -4.67169189453125, -4.499755859375, -4.32781982421875, -4.1558837890625, -3.98394775390625, -3.81201171875, -3.64007568359375, -3.4681396484375, -3.29620361328125, -3.124267578125, -2.95233154296875, -2.7803955078125, -2.60845947265625, -2.4365234375, -2.26458740234375, -2.0926513671875, -1.92071533203125, -1.748779296875, -1.57684326171875, -1.4049072265625, -1.23297119140625, -1.06103515625, -0.88909912109375, -0.7171630859375, -0.54522705078125, -0.373291015625, -0.20135498046875, -0.0294189453125, 0.14251708984375, 0.314453125, 0.48638916015625, 0.6583251953125, 0.83026123046875, 1.002197265625, 1.17413330078125, 1.3460693359375, 1.51800537109375, 1.68994140625, 1.86187744140625, 2.0338134765625, 2.20574951171875, 2.377685546875, 2.54962158203125, 2.7215576171875, 2.89349365234375, 3.0654296875, 3.23736572265625, 3.4093017578125, 3.58123779296875, 3.753173828125, 3.92510986328125, 4.0970458984375, 4.26898193359375, 4.44091796875, 4.61285400390625, 4.7847900390625, 4.95672607421875, 5.128662109375, 5.30059814453125, 5.4725341796875, 5.64447021484375, 5.81640625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 4.0, 18.0, 19.0, 45.0, 47.0, 90.0, 114.0, 198.0, 253.0, 389.0, 617.0, 973.0, 1584.0, 2613.0, 4212.0, 7009.0, 11938.0, 20688.0, 35840.0, 64739.0, 117119.0, 211301.0, 371836.0, 594448.0, 776310.0, 736693.0, 522398.0, 312973.0, 175267.0, 97050.0, 54132.0, 30011.0, 17441.0, 10175.0, 5935.0, 3721.0, 2251.0, 1371.0, 844.0, 554.0, 383.0, 238.0, 149.0, 93.0, 52.0, 50.0, 29.0, 21.0, 8.0, 11.0, 6.0, 7.0, 0.0, 5.0, 3.0, 2.0, 2.0], "bins": [-10.359375, -10.0340576171875, -9.708740234375, -9.3834228515625, -9.05810546875, -8.7327880859375, -8.407470703125, -8.0821533203125, -7.7568359375, -7.4315185546875, -7.106201171875, -6.7808837890625, -6.45556640625, -6.1302490234375, -5.804931640625, -5.4796142578125, -5.154296875, -4.8289794921875, -4.503662109375, -4.1783447265625, -3.85302734375, -3.5277099609375, -3.202392578125, -2.8770751953125, -2.5517578125, -2.2264404296875, -1.901123046875, -1.5758056640625, -1.25048828125, -0.9251708984375, -0.599853515625, -0.2745361328125, 0.05078125, 0.3760986328125, 0.701416015625, 1.0267333984375, 1.35205078125, 1.6773681640625, 2.002685546875, 2.3280029296875, 2.6533203125, 2.9786376953125, 3.303955078125, 3.6292724609375, 3.95458984375, 4.2799072265625, 4.605224609375, 4.9305419921875, 5.255859375, 5.5811767578125, 5.906494140625, 6.2318115234375, 6.55712890625, 6.8824462890625, 7.207763671875, 7.5330810546875, 7.8583984375, 8.1837158203125, 8.509033203125, 8.8343505859375, 9.15966796875, 9.4849853515625, 9.810302734375, 10.1356201171875, 10.4609375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 27.0, 37.0, 47.0, 50.0, 72.0, 70.0, 111.0, 158.0, 150.0, 181.0, 203.0, 264.0, 296.0, 276.0, 294.0, 287.0, 265.0, 241.0, 214.0, 188.0, 132.0, 105.0, 88.0, 71.0, 58.0, 38.0, 38.0, 28.0, 13.0, 17.0, 11.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.73828125, -4.61676025390625, -4.4952392578125, -4.37371826171875, -4.252197265625, -4.13067626953125, -4.0091552734375, -3.88763427734375, -3.76611328125, -3.64459228515625, -3.5230712890625, -3.40155029296875, -3.280029296875, -3.15850830078125, -3.0369873046875, -2.91546630859375, -2.7939453125, -2.67242431640625, -2.5509033203125, -2.42938232421875, -2.307861328125, -2.18634033203125, -2.0648193359375, -1.94329833984375, -1.82177734375, -1.70025634765625, -1.5787353515625, -1.45721435546875, -1.335693359375, -1.21417236328125, -1.0926513671875, -0.97113037109375, -0.849609375, -0.72808837890625, -0.6065673828125, -0.48504638671875, -0.363525390625, -0.24200439453125, -0.1204833984375, 0.00103759765625, 0.12255859375, 0.24407958984375, 0.3656005859375, 0.48712158203125, 0.608642578125, 0.73016357421875, 0.8516845703125, 0.97320556640625, 1.0947265625, 1.21624755859375, 1.3377685546875, 1.45928955078125, 1.580810546875, 1.70233154296875, 1.8238525390625, 1.94537353515625, 2.06689453125, 2.18841552734375, 2.3099365234375, 2.43145751953125, 2.552978515625, 2.67449951171875, 2.7960205078125, 2.91754150390625, 3.0390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 5.0, 6.0, 10.0, 10.0, 17.0, 14.0, 18.0, 32.0, 32.0, 30.0, 41.0, 42.0, 55.0, 56.0, 61.0, 65.0, 65.0, 50.0, 64.0, 46.0, 38.0, 43.0, 37.0, 31.0, 28.0, 24.0, 20.0, 14.0, 11.0, 9.0, 8.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.759474754333496, -13.364616394042969, -12.969757080078125, -12.574898719787598, -12.18004035949707, -11.785181999206543, -11.390323638916016, -10.995464324951172, -10.600605964660645, -10.205747604370117, -9.810888290405273, -9.416029930114746, -9.021171569824219, -8.626313209533691, -8.231454849243164, -7.83659553527832, -7.441737174987793, -7.046878814697266, -6.65201997756958, -6.2571611404418945, -5.862302780151367, -5.46744441986084, -5.072585582733154, -4.677726745605469, -4.282868385314941, -3.888009786605835, -3.4931511878967285, -3.098292589187622, -2.7034339904785156, -2.308575391769409, -1.9137167930603027, -1.5188581943511963, -1.1240005493164062, -0.7291419506072998, -0.33428335189819336, 0.060575246810913086, 0.45543384552001953, 0.850292444229126, 1.2451510429382324, 1.6400096416473389, 2.0348682403564453, 2.4297268390655518, 2.824585437774658, 3.2194440364837646, 3.614302635192871, 4.009160995483398, 4.404019832611084, 4.7988786697387695, 5.193737030029297, 5.588595390319824, 5.98345422744751, 6.378313064575195, 6.773171424865723, 7.16802978515625, 7.5628886222839355, 7.957747459411621, 8.352605819702148, 8.747464179992676, 9.142322540283203, 9.537181854248047, 9.932040214538574, 10.326898574829102, 10.721757888793945, 11.116616249084473, 11.511474609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 6.0, 10.0, 8.0, 16.0, 16.0, 14.0, 19.0, 20.0, 18.0, 27.0, 28.0, 13.0, 36.0, 34.0, 27.0, 50.0, 34.0, 40.0, 37.0, 38.0, 33.0, 42.0, 50.0, 34.0, 35.0, 33.0, 37.0, 28.0, 35.0, 21.0, 24.0, 23.0, 17.0, 18.0, 18.0, 7.0, 13.0, 13.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.569639205932617, -6.363455295562744, -6.157271385192871, -5.95108699798584, -5.744903087615967, -5.538719177246094, -5.332535266876221, -5.126351356506348, -4.920166969299316, -4.713983058929443, -4.50779914855957, -4.301614761352539, -4.095430850982666, -3.889246940612793, -3.68306303024292, -3.4768788814544678, -3.2706949710845947, -3.0645110607147217, -2.8583269119262695, -2.6521430015563965, -2.4459588527679443, -2.2397749423980713, -2.033590793609619, -1.827406883239746, -1.6212228536605835, -1.415038824081421, -1.2088547945022583, -1.0026707649230957, -0.7964867949485779, -0.5903028249740601, -0.38411879539489746, -0.17793476581573486, 0.028249263763427734, 0.23443327844142914, 0.44061729311943054, 0.6468012928962708, 0.8529853224754333, 1.0591692924499512, 1.2653533220291138, 1.4715373516082764, 1.677721381187439, 1.8839054107666016, 2.0900893211364746, 2.2962734699249268, 2.5024573802948, 2.708641529083252, 2.914825439453125, 3.121009349822998, 3.32719349861145, 3.5333774089813232, 3.7395615577697754, 3.9457454681396484, 4.1519293785095215, 4.3581132888793945, 4.564297676086426, 4.770481586456299, 4.976665496826172, 5.182849407196045, 5.389033317565918, 5.595217704772949, 5.801401615142822, 6.007585525512695, 6.213769435882568, 6.419953346252441, 6.626137733459473]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 9.0, 18.0, 23.0, 32.0, 60.0, 67.0, 128.0, 201.0, 292.0, 444.0, 774.0, 1144.0, 2008.0, 3053.0, 5206.0, 8671.0, 14477.0, 24862.0, 42141.0, 69471.0, 110331.0, 155324.0, 178288.0, 153745.0, 108365.0, 67847.0, 41207.0, 24246.0, 14281.0, 8375.0, 5058.0, 3184.0, 1971.0, 1200.0, 724.0, 485.0, 291.0, 183.0, 138.0, 76.0, 43.0, 33.0, 25.0, 13.0, 17.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.806640625, -0.7818069458007812, -0.7569732666015625, -0.7321395874023438, -0.707305908203125, -0.6824722290039062, -0.6576385498046875, -0.6328048706054688, -0.60797119140625, -0.5831375122070312, -0.5583038330078125, -0.5334701538085938, -0.508636474609375, -0.48380279541015625, -0.4589691162109375, -0.43413543701171875, -0.4093017578125, -0.38446807861328125, -0.3596343994140625, -0.33480072021484375, -0.309967041015625, -0.28513336181640625, -0.2602996826171875, -0.23546600341796875, -0.21063232421875, -0.18579864501953125, -0.1609649658203125, -0.13613128662109375, -0.111297607421875, -0.08646392822265625, -0.0616302490234375, -0.03679656982421875, -0.011962890625, 0.01287078857421875, 0.0377044677734375, 0.06253814697265625, 0.087371826171875, 0.11220550537109375, 0.1370391845703125, 0.16187286376953125, 0.18670654296875, 0.21154022216796875, 0.2363739013671875, 0.26120758056640625, 0.286041259765625, 0.31087493896484375, 0.3357086181640625, 0.36054229736328125, 0.3853759765625, 0.41020965576171875, 0.4350433349609375, 0.45987701416015625, 0.484710693359375, 0.5095443725585938, 0.5343780517578125, 0.5592117309570312, 0.58404541015625, 0.6088790893554688, 0.6337127685546875, 0.6585464477539062, 0.683380126953125, 0.7082138061523438, 0.7330474853515625, 0.7578811645507812, 0.78271484375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 8.0, 12.0, 9.0, 10.0, 13.0, 13.0, 23.0, 21.0, 27.0, 34.0, 23.0, 28.0, 27.0, 34.0, 36.0, 36.0, 38.0, 47.0, 47.0, 47.0, 34.0, 29.0, 37.0, 34.0, 35.0, 33.0, 32.0, 28.0, 31.0, 27.0, 26.0, 26.0, 17.0, 12.0, 12.0, 7.0, 10.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.015625, -6.7830810546875, -6.550537109375, -6.3179931640625, -6.08544921875, -5.8529052734375, -5.620361328125, -5.3878173828125, -5.1552734375, -4.9227294921875, -4.690185546875, -4.4576416015625, -4.22509765625, -3.9925537109375, -3.760009765625, -3.5274658203125, -3.294921875, -3.0623779296875, -2.829833984375, -2.5972900390625, -2.36474609375, -2.1322021484375, -1.899658203125, -1.6671142578125, -1.4345703125, -1.2020263671875, -0.969482421875, -0.7369384765625, -0.50439453125, -0.2718505859375, -0.039306640625, 0.1932373046875, 0.42578125, 0.6583251953125, 0.890869140625, 1.1234130859375, 1.35595703125, 1.5885009765625, 1.821044921875, 2.0535888671875, 2.2861328125, 2.5186767578125, 2.751220703125, 2.9837646484375, 3.21630859375, 3.4488525390625, 3.681396484375, 3.9139404296875, 4.146484375, 4.3790283203125, 4.611572265625, 4.8441162109375, 5.07666015625, 5.3092041015625, 5.541748046875, 5.7742919921875, 6.0068359375, 6.2393798828125, 6.471923828125, 6.7044677734375, 6.93701171875, 7.1695556640625, 7.402099609375, 7.6346435546875, 7.8671875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 8.0, 8.0, 10.0, 18.0, 18.0, 24.0, 36.0, 51.0, 47.0, 99.0, 99.0, 133.0, 210.0, 290.0, 451.0, 741.0, 1117.0, 1722.0, 2954.0, 5358.0, 10455.0, 21488.0, 80016.0, 819859.0, 61323.0, 19788.0, 9534.0, 5093.0, 2824.0, 1635.0, 996.0, 647.0, 431.0, 307.0, 240.0, 135.0, 100.0, 77.0, 66.0, 49.0, 26.0, 19.0, 10.0, 16.0, 10.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.517578125, -2.4375, -2.357421875, -2.27734375, -2.197265625, -2.1171875, -2.037109375, -1.95703125, -1.876953125, -1.796875, -1.716796875, -1.63671875, -1.556640625, -1.4765625, -1.396484375, -1.31640625, -1.236328125, -1.15625, -1.076171875, -0.99609375, -0.916015625, -0.8359375, -0.755859375, -0.67578125, -0.595703125, -0.515625, -0.435546875, -0.35546875, -0.275390625, -0.1953125, -0.115234375, -0.03515625, 0.044921875, 0.125, 0.205078125, 0.28515625, 0.365234375, 0.4453125, 0.525390625, 0.60546875, 0.685546875, 0.765625, 0.845703125, 0.92578125, 1.005859375, 1.0859375, 1.166015625, 1.24609375, 1.326171875, 1.40625, 1.486328125, 1.56640625, 1.646484375, 1.7265625, 1.806640625, 1.88671875, 1.966796875, 2.046875, 2.126953125, 2.20703125, 2.287109375, 2.3671875, 2.447265625, 2.52734375, 2.607421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 11.0, 11.0, 8.0, 14.0, 15.0, 25.0, 14.0, 12.0, 17.0, 24.0, 24.0, 26.0, 28.0, 37.0, 32.0, 36.0, 34.0, 29.0, 36.0, 30.0, 40.0, 34.0, 31.0, 35.0, 36.0, 29.0, 35.0, 31.0, 29.0, 29.0, 26.0, 18.0, 22.0, 17.0, 22.0, 14.0, 19.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.69140625, -4.5523681640625, -4.413330078125, -4.2742919921875, -4.13525390625, -3.9962158203125, -3.857177734375, -3.7181396484375, -3.5791015625, -3.4400634765625, -3.301025390625, -3.1619873046875, -3.02294921875, -2.8839111328125, -2.744873046875, -2.6058349609375, -2.466796875, -2.3277587890625, -2.188720703125, -2.0496826171875, -1.91064453125, -1.7716064453125, -1.632568359375, -1.4935302734375, -1.3544921875, -1.2154541015625, -1.076416015625, -0.9373779296875, -0.79833984375, -0.6593017578125, -0.520263671875, -0.3812255859375, -0.2421875, -0.1031494140625, 0.035888671875, 0.1749267578125, 0.31396484375, 0.4530029296875, 0.592041015625, 0.7310791015625, 0.8701171875, 1.0091552734375, 1.148193359375, 1.2872314453125, 1.42626953125, 1.5653076171875, 1.704345703125, 1.8433837890625, 1.982421875, 2.1214599609375, 2.260498046875, 2.3995361328125, 2.53857421875, 2.6776123046875, 2.816650390625, 2.9556884765625, 3.0947265625, 3.2337646484375, 3.372802734375, 3.5118408203125, 3.65087890625, 3.7899169921875, 3.928955078125, 4.0679931640625, 4.20703125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 16.0, 23.0, 28.0, 37.0, 45.0, 88.0, 101.0, 182.0, 284.0, 445.0, 776.0, 1356.0, 2425.0, 4539.0, 8823.0, 18025.0, 47365.0, 884669.0, 43601.0, 17247.0, 8395.0, 4345.0, 2357.0, 1328.0, 756.0, 460.0, 295.0, 185.0, 105.0, 75.0, 58.0, 33.0, 20.0, 19.0, 6.0, 8.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7001953125, -0.677947998046875, -0.65570068359375, -0.633453369140625, -0.6112060546875, -0.588958740234375, -0.56671142578125, -0.544464111328125, -0.522216796875, -0.499969482421875, -0.47772216796875, -0.455474853515625, -0.4332275390625, -0.410980224609375, -0.38873291015625, -0.366485595703125, -0.34423828125, -0.321990966796875, -0.29974365234375, -0.277496337890625, -0.2552490234375, -0.233001708984375, -0.21075439453125, -0.188507080078125, -0.166259765625, -0.144012451171875, -0.12176513671875, -0.099517822265625, -0.0772705078125, -0.055023193359375, -0.03277587890625, -0.010528564453125, 0.01171875, 0.033966064453125, 0.05621337890625, 0.078460693359375, 0.1007080078125, 0.122955322265625, 0.14520263671875, 0.167449951171875, 0.189697265625, 0.211944580078125, 0.23419189453125, 0.256439208984375, 0.2786865234375, 0.300933837890625, 0.32318115234375, 0.345428466796875, 0.36767578125, 0.389923095703125, 0.41217041015625, 0.434417724609375, 0.4566650390625, 0.478912353515625, 0.50115966796875, 0.523406982421875, 0.545654296875, 0.567901611328125, 0.59014892578125, 0.612396240234375, 0.6346435546875, 0.656890869140625, 0.67913818359375, 0.701385498046875, 0.7236328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 1.0, 7.0, 6.0, 4.0, 6.0, 9.0, 8.0, 12.0, 7.0, 15.0, 20.0, 12.0, 19.0, 22.0, 24.0, 25.0, 36.0, 24.0, 33.0, 34.0, 44.0, 39.0, 40.0, 36.0, 31.0, 40.0, 30.0, 36.0, 29.0, 42.0, 34.0, 29.0, 34.0, 28.0, 25.0, 14.0, 18.0, 17.0, 17.0, 19.0, 14.0, 15.0, 5.0, 6.0, 3.0, 8.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3845583200454712e-05, -2.3074448108673096e-05, -2.230331301689148e-05, -2.1532177925109863e-05, -2.0761042833328247e-05, -1.998990774154663e-05, -1.9218772649765015e-05, -1.84476375579834e-05, -1.7676502466201782e-05, -1.6905367374420166e-05, -1.613423228263855e-05, -1.5363097190856934e-05, -1.4591962099075317e-05, -1.3820827007293701e-05, -1.3049691915512085e-05, -1.2278556823730469e-05, -1.1507421731948853e-05, -1.0736286640167236e-05, -9.96515154838562e-06, -9.194016456604004e-06, -8.422881364822388e-06, -7.651746273040771e-06, -6.880611181259155e-06, -6.109476089477539e-06, -5.338340997695923e-06, -4.567205905914307e-06, -3.7960708141326904e-06, -3.0249357223510742e-06, -2.253800630569458e-06, -1.4826655387878418e-06, -7.115304470062256e-07, 5.960464477539063e-08, 8.307397365570068e-07, 1.601874828338623e-06, 2.3730099201202393e-06, 3.1441450119018555e-06, 3.915280103683472e-06, 4.686415195465088e-06, 5.457550287246704e-06, 6.22868537902832e-06, 6.9998204708099365e-06, 7.770955562591553e-06, 8.542090654373169e-06, 9.313225746154785e-06, 1.0084360837936401e-05, 1.0855495929718018e-05, 1.1626631021499634e-05, 1.239776611328125e-05, 1.3168901205062866e-05, 1.3940036296844482e-05, 1.4711171388626099e-05, 1.5482306480407715e-05, 1.625344157218933e-05, 1.7024576663970947e-05, 1.7795711755752563e-05, 1.856684684753418e-05, 1.9337981939315796e-05, 2.0109117031097412e-05, 2.088025212287903e-05, 2.1651387214660645e-05, 2.242252230644226e-05, 2.3193657398223877e-05, 2.3964792490005493e-05, 2.473592758178711e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 16.0, 14.0, 20.0, 33.0, 40.0, 73.0, 91.0, 162.0, 199.0, 307.0, 508.0, 997.0, 1810.0, 3555.0, 7661.0, 17385.0, 41635.0, 103331.0, 235637.0, 317743.0, 184929.0, 76237.0, 30901.0, 13100.0, 5798.0, 2757.0, 1435.0, 836.0, 427.0, 282.0, 195.0, 112.0, 76.0, 62.0, 46.0, 33.0, 27.0, 22.0, 15.0, 12.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.3826026916503906, -0.36750030517578125, -0.3523979187011719, -0.3372955322265625, -0.3221931457519531, -0.30709075927734375, -0.2919883728027344, -0.276885986328125, -0.2617835998535156, -0.24668121337890625, -0.23157882690429688, -0.2164764404296875, -0.20137405395507812, -0.18627166748046875, -0.17116928100585938, -0.15606689453125, -0.14096450805664062, -0.12586212158203125, -0.11075973510742188, -0.0956573486328125, -0.08055496215820312, -0.06545257568359375, -0.050350189208984375, -0.035247802734375, -0.020145416259765625, -0.00504302978515625, 0.010059356689453125, 0.0251617431640625, 0.040264129638671875, 0.05536651611328125, 0.07046890258789062, 0.0855712890625, 0.10067367553710938, 0.11577606201171875, 0.13087844848632812, 0.1459808349609375, 0.16108322143554688, 0.17618560791015625, 0.19128799438476562, 0.206390380859375, 0.22149276733398438, 0.23659515380859375, 0.2516975402832031, 0.2667999267578125, 0.2819023132324219, 0.29700469970703125, 0.3121070861816406, 0.32720947265625, 0.3423118591308594, 0.35741424560546875, 0.3725166320800781, 0.3876190185546875, 0.4027214050292969, 0.41782379150390625, 0.4329261779785156, 0.448028564453125, 0.4631309509277344, 0.47823333740234375, 0.4933357238769531, 0.5084381103515625, 0.5235404968261719, 0.5386428833007812, 0.5537452697753906, 0.56884765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 8.0, 6.0, 13.0, 17.0, 20.0, 19.0, 23.0, 27.0, 34.0, 35.0, 46.0, 60.0, 53.0, 56.0, 59.0, 48.0, 57.0, 53.0, 55.0, 48.0, 37.0, 27.0, 29.0, 19.0, 31.0, 20.0, 24.0, 15.0, 11.0, 12.0, 9.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.092529296875, -0.08972930908203125, -0.0869293212890625, -0.08412933349609375, -0.081329345703125, -0.07852935791015625, -0.0757293701171875, -0.07292938232421875, -0.07012939453125, -0.06732940673828125, -0.0645294189453125, -0.06172943115234375, -0.058929443359375, -0.05612945556640625, -0.0533294677734375, -0.05052947998046875, -0.0477294921875, -0.04492950439453125, -0.0421295166015625, -0.03932952880859375, -0.036529541015625, -0.03372955322265625, -0.0309295654296875, -0.02812957763671875, -0.02532958984375, -0.02252960205078125, -0.0197296142578125, -0.01692962646484375, -0.014129638671875, -0.01132965087890625, -0.0085296630859375, -0.00572967529296875, -0.0029296875, -0.00012969970703125, 0.0026702880859375, 0.00547027587890625, 0.008270263671875, 0.01107025146484375, 0.0138702392578125, 0.01667022705078125, 0.01947021484375, 0.02227020263671875, 0.0250701904296875, 0.02787017822265625, 0.030670166015625, 0.03347015380859375, 0.0362701416015625, 0.03907012939453125, 0.0418701171875, 0.04467010498046875, 0.0474700927734375, 0.05027008056640625, 0.053070068359375, 0.05587005615234375, 0.0586700439453125, 0.06147003173828125, 0.06427001953125, 0.06707000732421875, 0.0698699951171875, 0.07266998291015625, 0.075469970703125, 0.07826995849609375, 0.0810699462890625, 0.08386993408203125, 0.086669921875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 10.0, 14.0, 15.0, 16.0, 27.0, 30.0, 27.0, 41.0, 40.0, 44.0, 54.0, 55.0, 66.0, 58.0, 64.0, 49.0, 66.0, 43.0, 31.0, 49.0, 28.0, 35.0, 25.0, 25.0, 19.0, 13.0, 6.0, 10.0, 7.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.455452919006348, -13.064770698547363, -12.674088478088379, -12.283407211303711, -11.892724990844727, -11.502042770385742, -11.111360549926758, -10.720678329467773, -10.329996109008789, -9.939313888549805, -9.54863166809082, -9.157949447631836, -8.767268180847168, -8.376585960388184, -7.985903739929199, -7.595221519470215, -7.204539775848389, -6.813857555389404, -6.423175811767578, -6.032493591308594, -5.641811370849609, -5.251129150390625, -4.860447406768799, -4.4697651863098145, -4.079083442687988, -3.688401460647583, -3.2977192401885986, -2.9070372581481934, -2.516355037689209, -2.1256730556488037, -1.7349910736083984, -1.344308853149414, -0.9536266326904297, -0.5629445314407349, -0.17226248979568481, 0.21841955184936523, 0.6091016530990601, 0.9997837543487549, 1.3904657363891602, 1.7811479568481445, 2.17182993888855, 2.562511920928955, 2.9531941413879395, 3.3438761234283447, 3.73455810546875, 4.125240325927734, 4.515922546386719, 4.906604766845703, 5.297286510467529, 5.687968730926514, 6.07865047454834, 6.469332695007324, 6.860014915466309, 7.250697135925293, 7.641378879547119, 8.032060623168945, 8.42274284362793, 8.813425064086914, 9.204107284545898, 9.594789505004883, 9.98547077178955, 10.376152992248535, 10.76683521270752, 11.157517433166504, 11.548199653625488]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 3.0, 13.0, 9.0, 17.0, 14.0, 14.0, 21.0, 18.0, 20.0, 28.0, 23.0, 17.0, 33.0, 36.0, 35.0, 38.0, 39.0, 40.0, 39.0, 36.0, 32.0, 46.0, 51.0, 27.0, 39.0, 32.0, 39.0, 29.0, 32.0, 20.0, 23.0, 25.0, 14.0, 17.0, 19.0, 6.0, 13.0, 13.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.5517683029174805, -6.345795631408691, -6.1398234367370605, -5.9338507652282715, -5.727878093719482, -5.521905899047852, -5.3159332275390625, -5.109960556030273, -4.903987884521484, -4.698015213012695, -4.4920430183410645, -4.286070346832275, -4.080097675323486, -3.8741252422332764, -3.6681528091430664, -3.4621801376342773, -3.2562079429626465, -3.0502355098724365, -2.8442628383636475, -2.6382904052734375, -2.4323177337646484, -2.2263453006744385, -2.0203728675842285, -1.814400315284729, -1.6084277629852295, -1.40245521068573, -1.1964826583862305, -0.9905102252960205, -0.784537672996521, -0.5785651206970215, -0.3725926876068115, -0.166620135307312, 0.0393519401550293, 0.24532446265220642, 0.45129698514938354, 0.6572694778442383, 0.8632420301437378, 1.0692145824432373, 1.2751870155334473, 1.4811595678329468, 1.6871321201324463, 1.8931046724319458, 2.0990772247314453, 2.3050496578216553, 2.5110220909118652, 2.7169947624206543, 2.9229671955108643, 3.128939628601074, 3.3349123001098633, 3.5408847332000732, 3.7468574047088623, 3.9528298377990723, 4.158802509307861, 4.364774703979492, 4.570747375488281, 4.77672004699707, 4.982692718505859, 5.188665390014648, 5.394637584686279, 5.600610256195068, 5.806582927703857, 6.012555122375488, 6.218527793884277, 6.424500465393066, 6.630472660064697]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 15.0, 28.0, 21.0, 30.0, 62.0, 76.0, 105.0, 192.0, 239.0, 348.0, 499.0, 773.0, 1181.0, 1806.0, 2907.0, 4703.0, 8132.0, 14097.0, 26150.0, 47564.0, 83948.0, 134435.0, 177946.0, 182407.0, 144607.0, 93684.0, 53896.0, 29445.0, 16049.0, 9009.0, 5171.0, 3129.0, 1947.0, 1312.0, 834.0, 565.0, 393.0, 263.0, 188.0, 114.0, 87.0, 54.0, 42.0, 20.0, 20.0, 16.0, 12.0, 11.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.8046875, -8.5303955078125, -8.256103515625, -7.9818115234375, -7.70751953125, -7.4332275390625, -7.158935546875, -6.8846435546875, -6.6103515625, -6.3360595703125, -6.061767578125, -5.7874755859375, -5.51318359375, -5.2388916015625, -4.964599609375, -4.6903076171875, -4.416015625, -4.1417236328125, -3.867431640625, -3.5931396484375, -3.31884765625, -3.0445556640625, -2.770263671875, -2.4959716796875, -2.2216796875, -1.9473876953125, -1.673095703125, -1.3988037109375, -1.12451171875, -0.8502197265625, -0.575927734375, -0.3016357421875, -0.02734375, 0.2469482421875, 0.521240234375, 0.7955322265625, 1.06982421875, 1.3441162109375, 1.618408203125, 1.8927001953125, 2.1669921875, 2.4412841796875, 2.715576171875, 2.9898681640625, 3.26416015625, 3.5384521484375, 3.812744140625, 4.0870361328125, 4.361328125, 4.6356201171875, 4.909912109375, 5.1842041015625, 5.45849609375, 5.7327880859375, 6.007080078125, 6.2813720703125, 6.5556640625, 6.8299560546875, 7.104248046875, 7.3785400390625, 7.65283203125, 7.9271240234375, 8.201416015625, 8.4757080078125, 8.75]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 12.0, 9.0, 14.0, 11.0, 14.0, 16.0, 24.0, 20.0, 24.0, 29.0, 29.0, 34.0, 32.0, 27.0, 29.0, 39.0, 41.0, 34.0, 39.0, 39.0, 36.0, 30.0, 34.0, 38.0, 43.0, 35.0, 33.0, 21.0, 29.0, 18.0, 21.0, 25.0, 16.0, 18.0, 21.0, 11.0, 13.0, 11.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.73046875, -6.5091552734375, -6.287841796875, -6.0665283203125, -5.84521484375, -5.6239013671875, -5.402587890625, -5.1812744140625, -4.9599609375, -4.7386474609375, -4.517333984375, -4.2960205078125, -4.07470703125, -3.8533935546875, -3.632080078125, -3.4107666015625, -3.189453125, -2.9681396484375, -2.746826171875, -2.5255126953125, -2.30419921875, -2.0828857421875, -1.861572265625, -1.6402587890625, -1.4189453125, -1.1976318359375, -0.976318359375, -0.7550048828125, -0.53369140625, -0.3123779296875, -0.091064453125, 0.1302490234375, 0.3515625, 0.5728759765625, 0.794189453125, 1.0155029296875, 1.23681640625, 1.4581298828125, 1.679443359375, 1.9007568359375, 2.1220703125, 2.3433837890625, 2.564697265625, 2.7860107421875, 3.00732421875, 3.2286376953125, 3.449951171875, 3.6712646484375, 3.892578125, 4.1138916015625, 4.335205078125, 4.5565185546875, 4.77783203125, 4.9991455078125, 5.220458984375, 5.4417724609375, 5.6630859375, 5.8843994140625, 6.105712890625, 6.3270263671875, 6.54833984375, 6.7696533203125, 6.990966796875, 7.2122802734375, 7.43359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 15.0, 22.0, 28.0, 36.0, 46.0, 67.0, 124.0, 162.0, 210.0, 358.0, 541.0, 844.0, 1308.0, 2122.0, 3337.0, 5762.0, 11154.0, 22845.0, 52159.0, 118479.0, 220413.0, 261365.0, 182233.0, 88098.0, 38327.0, 17188.0, 8820.0, 4715.0, 2860.0, 1749.0, 1069.0, 725.0, 427.0, 305.0, 192.0, 144.0, 99.0, 52.0, 55.0, 25.0, 24.0, 12.0, 10.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.34375, -14.8831787109375, -14.422607421875, -13.9620361328125, -13.50146484375, -13.0408935546875, -12.580322265625, -12.1197509765625, -11.6591796875, -11.1986083984375, -10.738037109375, -10.2774658203125, -9.81689453125, -9.3563232421875, -8.895751953125, -8.4351806640625, -7.974609375, -7.5140380859375, -7.053466796875, -6.5928955078125, -6.13232421875, -5.6717529296875, -5.211181640625, -4.7506103515625, -4.2900390625, -3.8294677734375, -3.368896484375, -2.9083251953125, -2.44775390625, -1.9871826171875, -1.526611328125, -1.0660400390625, -0.60546875, -0.1448974609375, 0.315673828125, 0.7762451171875, 1.23681640625, 1.6973876953125, 2.157958984375, 2.6185302734375, 3.0791015625, 3.5396728515625, 4.000244140625, 4.4608154296875, 4.92138671875, 5.3819580078125, 5.842529296875, 6.3031005859375, 6.763671875, 7.2242431640625, 7.684814453125, 8.1453857421875, 8.60595703125, 9.0665283203125, 9.527099609375, 9.9876708984375, 10.4482421875, 10.9088134765625, 11.369384765625, 11.8299560546875, 12.29052734375, 12.7510986328125, 13.211669921875, 13.6722412109375, 14.1328125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 7.0, 6.0, 10.0, 19.0, 14.0, 23.0, 21.0, 18.0, 19.0, 18.0, 19.0, 26.0, 44.0, 27.0, 35.0, 44.0, 39.0, 41.0, 27.0, 53.0, 37.0, 39.0, 36.0, 37.0, 30.0, 31.0, 41.0, 36.0, 29.0, 24.0, 11.0, 18.0, 13.0, 20.0, 13.0, 12.0, 11.0, 8.0, 9.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.30078125, -5.1474609375, -4.994140625, -4.8408203125, -4.6875, -4.5341796875, -4.380859375, -4.2275390625, -4.07421875, -3.9208984375, -3.767578125, -3.6142578125, -3.4609375, -3.3076171875, -3.154296875, -3.0009765625, -2.84765625, -2.6943359375, -2.541015625, -2.3876953125, -2.234375, -2.0810546875, -1.927734375, -1.7744140625, -1.62109375, -1.4677734375, -1.314453125, -1.1611328125, -1.0078125, -0.8544921875, -0.701171875, -0.5478515625, -0.39453125, -0.2412109375, -0.087890625, 0.0654296875, 0.21875, 0.3720703125, 0.525390625, 0.6787109375, 0.83203125, 0.9853515625, 1.138671875, 1.2919921875, 1.4453125, 1.5986328125, 1.751953125, 1.9052734375, 2.05859375, 2.2119140625, 2.365234375, 2.5185546875, 2.671875, 2.8251953125, 2.978515625, 3.1318359375, 3.28515625, 3.4384765625, 3.591796875, 3.7451171875, 3.8984375, 4.0517578125, 4.205078125, 4.3583984375, 4.51171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 8.0, 6.0, 12.0, 15.0, 18.0, 47.0, 50.0, 92.0, 118.0, 209.0, 291.0, 446.0, 682.0, 964.0, 1487.0, 2279.0, 3673.0, 5540.0, 8893.0, 14221.0, 24116.0, 41475.0, 71925.0, 121726.0, 177615.0, 194099.0, 150739.0, 94222.0, 53590.0, 30876.0, 18253.0, 10935.0, 7003.0, 4451.0, 2928.0, 2001.0, 1236.0, 720.0, 513.0, 361.0, 232.0, 169.0, 113.0, 67.0, 50.0, 29.0, 27.0, 17.0, 6.0, 6.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.6484375, -6.4285888671875, -6.208740234375, -5.9888916015625, -5.76904296875, -5.5491943359375, -5.329345703125, -5.1094970703125, -4.8896484375, -4.6697998046875, -4.449951171875, -4.2301025390625, -4.01025390625, -3.7904052734375, -3.570556640625, -3.3507080078125, -3.130859375, -2.9110107421875, -2.691162109375, -2.4713134765625, -2.25146484375, -2.0316162109375, -1.811767578125, -1.5919189453125, -1.3720703125, -1.1522216796875, -0.932373046875, -0.7125244140625, -0.49267578125, -0.2728271484375, -0.052978515625, 0.1668701171875, 0.38671875, 0.6065673828125, 0.826416015625, 1.0462646484375, 1.26611328125, 1.4859619140625, 1.705810546875, 1.9256591796875, 2.1455078125, 2.3653564453125, 2.585205078125, 2.8050537109375, 3.02490234375, 3.2447509765625, 3.464599609375, 3.6844482421875, 3.904296875, 4.1241455078125, 4.343994140625, 4.5638427734375, 4.78369140625, 5.0035400390625, 5.223388671875, 5.4432373046875, 5.6630859375, 5.8829345703125, 6.102783203125, 6.3226318359375, 6.54248046875, 6.7623291015625, 6.982177734375, 7.2020263671875, 7.421875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 15.0, 9.0, 14.0, 25.0, 30.0, 26.0, 28.0, 43.0, 49.0, 53.0, 64.0, 74.0, 65.0, 63.0, 66.0, 54.0, 41.0, 44.0, 39.0, 32.0, 30.0, 23.0, 18.0, 18.0, 7.0, 9.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0006823539733886719, -0.0006618201732635498, -0.0006412863731384277, -0.0006207525730133057, -0.0006002187728881836, -0.0005796849727630615, -0.0005591511726379395, -0.0005386173725128174, -0.0005180835723876953, -0.0004975497722625732, -0.00047701597213745117, -0.0004564821720123291, -0.00043594837188720703, -0.00041541457176208496, -0.0003948807716369629, -0.0003743469715118408, -0.00035381317138671875, -0.0003332793712615967, -0.0003127455711364746, -0.00029221177101135254, -0.00027167797088623047, -0.0002511441707611084, -0.00023061037063598633, -0.00021007657051086426, -0.0001895427703857422, -0.00016900897026062012, -0.00014847517013549805, -0.00012794137001037598, -0.0001074075698852539, -8.687376976013184e-05, -6.633996963500977e-05, -4.5806169509887695e-05, -2.5272369384765625e-05, -4.738569259643555e-06, 1.5795230865478516e-05, 3.6329030990600586e-05, 5.6862831115722656e-05, 7.739663124084473e-05, 9.79304313659668e-05, 0.00011846423149108887, 0.00013899803161621094, 0.000159531831741333, 0.00018006563186645508, 0.00020059943199157715, 0.00022113323211669922, 0.0002416670322418213, 0.00026220083236694336, 0.00028273463249206543, 0.0003032684326171875, 0.00032380223274230957, 0.00034433603286743164, 0.0003648698329925537, 0.0003854036331176758, 0.00040593743324279785, 0.0004264712333679199, 0.000447005033493042, 0.00046753883361816406, 0.00048807263374328613, 0.0005086064338684082, 0.0005291402339935303, 0.0005496740341186523, 0.0005702078342437744, 0.0005907416343688965, 0.0006112754344940186, 0.0006318092346191406]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 20.0, 23.0, 30.0, 49.0, 80.0, 156.0, 198.0, 323.0, 447.0, 807.0, 1241.0, 1956.0, 3018.0, 5184.0, 8589.0, 14171.0, 24929.0, 43293.0, 76179.0, 129863.0, 188642.0, 197682.0, 144733.0, 87379.0, 50112.0, 28230.0, 16387.0, 9754.0, 5806.0, 3439.0, 2191.0, 1292.0, 810.0, 523.0, 355.0, 222.0, 160.0, 85.0, 64.0, 52.0, 30.0, 17.0, 13.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.7520751953125, -6.511962890625, -6.2718505859375, -6.03173828125, -5.7916259765625, -5.551513671875, -5.3114013671875, -5.0712890625, -4.8311767578125, -4.591064453125, -4.3509521484375, -4.11083984375, -3.8707275390625, -3.630615234375, -3.3905029296875, -3.150390625, -2.9102783203125, -2.670166015625, -2.4300537109375, -2.18994140625, -1.9498291015625, -1.709716796875, -1.4696044921875, -1.2294921875, -0.9893798828125, -0.749267578125, -0.5091552734375, -0.26904296875, -0.0289306640625, 0.211181640625, 0.4512939453125, 0.69140625, 0.9315185546875, 1.171630859375, 1.4117431640625, 1.65185546875, 1.8919677734375, 2.132080078125, 2.3721923828125, 2.6123046875, 2.8524169921875, 3.092529296875, 3.3326416015625, 3.57275390625, 3.8128662109375, 4.052978515625, 4.2930908203125, 4.533203125, 4.7733154296875, 5.013427734375, 5.2535400390625, 5.49365234375, 5.7337646484375, 5.973876953125, 6.2139892578125, 6.4541015625, 6.6942138671875, 6.934326171875, 7.1744384765625, 7.41455078125, 7.6546630859375, 7.894775390625, 8.1348876953125, 8.375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 5.0, 11.0, 13.0, 14.0, 18.0, 28.0, 20.0, 26.0, 27.0, 46.0, 48.0, 53.0, 58.0, 67.0, 65.0, 62.0, 58.0, 54.0, 54.0, 54.0, 38.0, 30.0, 24.0, 17.0, 17.0, 19.0, 8.0, 11.0, 2.0, 9.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.99609375, -1.93450927734375, -1.8729248046875, -1.81134033203125, -1.749755859375, -1.68817138671875, -1.6265869140625, -1.56500244140625, -1.50341796875, -1.44183349609375, -1.3802490234375, -1.31866455078125, -1.257080078125, -1.19549560546875, -1.1339111328125, -1.07232666015625, -1.0107421875, -0.94915771484375, -0.8875732421875, -0.82598876953125, -0.764404296875, -0.70281982421875, -0.6412353515625, -0.57965087890625, -0.51806640625, -0.45648193359375, -0.3948974609375, -0.33331298828125, -0.271728515625, -0.21014404296875, -0.1485595703125, -0.08697509765625, -0.025390625, 0.03619384765625, 0.0977783203125, 0.15936279296875, 0.220947265625, 0.28253173828125, 0.3441162109375, 0.40570068359375, 0.46728515625, 0.52886962890625, 0.5904541015625, 0.65203857421875, 0.713623046875, 0.77520751953125, 0.8367919921875, 0.89837646484375, 0.9599609375, 1.02154541015625, 1.0831298828125, 1.14471435546875, 1.206298828125, 1.26788330078125, 1.3294677734375, 1.39105224609375, 1.45263671875, 1.51422119140625, 1.5758056640625, 1.63739013671875, 1.698974609375, 1.76055908203125, 1.8221435546875, 1.88372802734375, 1.9453125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 15.0, 19.0, 24.0, 21.0, 20.0, 40.0, 27.0, 47.0, 49.0, 39.0, 47.0, 61.0, 49.0, 51.0, 60.0, 73.0, 31.0, 33.0, 48.0, 35.0, 31.0, 25.0, 19.0, 12.0, 11.0, 20.0, 17.0, 8.0, 13.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.122962951660156, -11.743892669677734, -11.364823341369629, -10.985753059387207, -10.606683731079102, -10.22761344909668, -9.848543167114258, -9.469472885131836, -9.09040355682373, -8.711333274841309, -8.332263946533203, -7.953193664550781, -7.574123859405518, -7.195054054260254, -6.815983772277832, -6.436913967132568, -6.057844161987305, -5.678774356842041, -5.299704551696777, -4.9206342697143555, -4.541564464569092, -4.162494659423828, -3.7834246158599854, -3.4043545722961426, -3.025284767150879, -2.6462149620056152, -2.2671449184417725, -1.8880749940872192, -1.509005069732666, -1.1299351453781128, -0.7508652210235596, -0.3717951774597168, 0.007274627685546875, 0.3863445520401001, 0.7654144763946533, 1.1444844007492065, 1.5235543251037598, 1.902624249458313, 2.281694173812866, 2.660764217376709, 3.0398340225219727, 3.4189038276672363, 3.797973871231079, 4.177043914794922, 4.5561137199401855, 4.935183525085449, 5.314253807067871, 5.693323612213135, 6.072393417358398, 6.451463222503662, 6.830533027648926, 7.209603309631348, 7.588673114776611, 7.967742919921875, 8.346813201904297, 8.725883483886719, 9.104952812194824, 9.484023094177246, 9.863092422485352, 10.242162704467773, 10.621232986450195, 11.0003023147583, 11.379372596740723, 11.758441925048828, 12.13751220703125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 13.0, 10.0, 11.0, 14.0, 21.0, 21.0, 13.0, 19.0, 24.0, 21.0, 40.0, 30.0, 38.0, 51.0, 43.0, 30.0, 46.0, 35.0, 39.0, 46.0, 30.0, 42.0, 41.0, 29.0, 22.0, 28.0, 27.0, 29.0, 31.0, 17.0, 20.0, 24.0, 11.0, 16.0, 15.0, 15.0, 8.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.735739707946777, -7.48982572555542, -7.2439117431640625, -6.997997760772705, -6.752083778381348, -6.50616979598999, -6.260255813598633, -6.014341831207275, -5.768427848815918, -5.5225138664245605, -5.276599884033203, -5.030685901641846, -4.784771919250488, -4.538857936859131, -4.292943954467773, -4.047029972076416, -3.8011162281036377, -3.5552022457122803, -3.309288263320923, -3.0633742809295654, -2.817460298538208, -2.5715465545654297, -2.3256325721740723, -2.079718589782715, -1.8338044881820679, -1.5878905057907104, -1.341976523399353, -1.0960626602172852, -0.850148618221283, -0.6042346954345703, -0.3583207130432129, -0.11240673065185547, 0.13350725173950195, 0.3794212341308594, 0.6253352165222168, 0.8712491393089294, 1.1171631813049316, 1.3630770444869995, 1.608991026878357, 1.8549050092697144, 2.1008191108703613, 2.3467330932617188, 2.592647075653076, 2.8385610580444336, 3.084475040435791, 3.3303890228271484, 3.576303005218506, 3.8222169876098633, 4.0681304931640625, 4.31404447555542, 4.559958457946777, 4.805872440338135, 5.051786422729492, 5.29770040512085, 5.543614387512207, 5.7895283699035645, 6.035442352294922, 6.281356334686279, 6.527270317077637, 6.773184299468994, 7.019098281860352, 7.265012264251709, 7.510926246643066, 7.756840229034424, 8.002754211425781]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [5.0, 4.0, 10.0, 7.0, 18.0, 28.0, 36.0, 69.0, 87.0, 150.0, 233.0, 367.0, 582.0, 850.0, 1477.0, 2163.0, 3567.0, 6069.0, 10181.0, 17147.0, 30263.0, 52705.0, 97186.0, 180228.0, 335413.0, 581254.0, 807711.0, 798423.0, 562165.0, 321863.0, 172463.0, 91872.0, 50666.0, 28436.0, 16379.0, 9590.0, 5677.0, 3495.0, 2082.0, 1280.0, 766.0, 446.0, 325.0, 183.0, 135.0, 90.0, 54.0, 45.0, 23.0, 11.0, 10.0, 7.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.73388671875, -8.3974609375, -8.06103515625, -7.724609375, -7.38818359375, -7.0517578125, -6.71533203125, -6.37890625, -6.04248046875, -5.7060546875, -5.36962890625, -5.033203125, -4.69677734375, -4.3603515625, -4.02392578125, -3.6875, -3.35107421875, -3.0146484375, -2.67822265625, -2.341796875, -2.00537109375, -1.6689453125, -1.33251953125, -0.99609375, -0.65966796875, -0.3232421875, 0.01318359375, 0.349609375, 0.68603515625, 1.0224609375, 1.35888671875, 1.6953125, 2.03173828125, 2.3681640625, 2.70458984375, 3.041015625, 3.37744140625, 3.7138671875, 4.05029296875, 4.38671875, 4.72314453125, 5.0595703125, 5.39599609375, 5.732421875, 6.06884765625, 6.4052734375, 6.74169921875, 7.078125, 7.41455078125, 7.7509765625, 8.08740234375, 8.423828125, 8.76025390625, 9.0966796875, 9.43310546875, 9.76953125, 10.10595703125, 10.4423828125, 10.77880859375, 11.115234375, 11.45166015625, 11.7880859375, 12.12451171875, 12.4609375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 11.0, 7.0, 10.0, 21.0, 11.0, 17.0, 21.0, 22.0, 31.0, 45.0, 27.0, 27.0, 30.0, 33.0, 43.0, 44.0, 43.0, 47.0, 36.0, 46.0, 42.0, 51.0, 36.0, 33.0, 34.0, 26.0, 31.0, 22.0, 32.0, 22.0, 16.0, 16.0, 12.0, 7.0, 10.0, 8.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.80462646484375, -8.5389404296875, -8.27325439453125, -8.007568359375, -7.74188232421875, -7.4761962890625, -7.21051025390625, -6.94482421875, -6.67913818359375, -6.4134521484375, -6.14776611328125, -5.882080078125, -5.61639404296875, -5.3507080078125, -5.08502197265625, -4.8193359375, -4.55364990234375, -4.2879638671875, -4.02227783203125, -3.756591796875, -3.49090576171875, -3.2252197265625, -2.95953369140625, -2.69384765625, -2.42816162109375, -2.1624755859375, -1.89678955078125, -1.631103515625, -1.36541748046875, -1.0997314453125, -0.83404541015625, -0.568359375, -0.30267333984375, -0.0369873046875, 0.22869873046875, 0.494384765625, 0.76007080078125, 1.0257568359375, 1.29144287109375, 1.55712890625, 1.82281494140625, 2.0885009765625, 2.35418701171875, 2.619873046875, 2.88555908203125, 3.1512451171875, 3.41693115234375, 3.6826171875, 3.94830322265625, 4.2139892578125, 4.47967529296875, 4.745361328125, 5.01104736328125, 5.2767333984375, 5.54241943359375, 5.80810546875, 6.07379150390625, 6.3394775390625, 6.60516357421875, 6.870849609375, 7.13653564453125, 7.4022216796875, 7.66790771484375, 7.93359375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 18.0, 19.0, 37.0, 34.0, 69.0, 96.0, 145.0, 276.0, 357.0, 558.0, 945.0, 1575.0, 2480.0, 3986.0, 6762.0, 11503.0, 20078.0, 35114.0, 64625.0, 118348.0, 219939.0, 399606.0, 654743.0, 843349.0, 738913.0, 477081.0, 269107.0, 145174.0, 78291.0, 42624.0, 24169.0, 13807.0, 8005.0, 4717.0, 2893.0, 1748.0, 1088.0, 673.0, 434.0, 334.0, 183.0, 145.0, 77.0, 53.0, 34.0, 24.0, 13.0, 11.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-16.125, -15.64599609375, -15.1669921875, -14.68798828125, -14.208984375, -13.72998046875, -13.2509765625, -12.77197265625, -12.29296875, -11.81396484375, -11.3349609375, -10.85595703125, -10.376953125, -9.89794921875, -9.4189453125, -8.93994140625, -8.4609375, -7.98193359375, -7.5029296875, -7.02392578125, -6.544921875, -6.06591796875, -5.5869140625, -5.10791015625, -4.62890625, -4.14990234375, -3.6708984375, -3.19189453125, -2.712890625, -2.23388671875, -1.7548828125, -1.27587890625, -0.796875, -0.31787109375, 0.1611328125, 0.64013671875, 1.119140625, 1.59814453125, 2.0771484375, 2.55615234375, 3.03515625, 3.51416015625, 3.9931640625, 4.47216796875, 4.951171875, 5.43017578125, 5.9091796875, 6.38818359375, 6.8671875, 7.34619140625, 7.8251953125, 8.30419921875, 8.783203125, 9.26220703125, 9.7412109375, 10.22021484375, 10.69921875, 11.17822265625, 11.6572265625, 12.13623046875, 12.615234375, 13.09423828125, 13.5732421875, 14.05224609375, 14.53125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 17.0, 20.0, 20.0, 32.0, 38.0, 52.0, 58.0, 58.0, 72.0, 98.0, 137.0, 182.0, 192.0, 227.0, 251.0, 224.0, 255.0, 273.0, 298.0, 246.0, 199.0, 194.0, 186.0, 144.0, 140.0, 108.0, 81.0, 52.0, 49.0, 40.0, 43.0, 30.0, 13.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.36590576171875, -4.2044677734375, -4.04302978515625, -3.881591796875, -3.72015380859375, -3.5587158203125, -3.39727783203125, -3.23583984375, -3.07440185546875, -2.9129638671875, -2.75152587890625, -2.590087890625, -2.42864990234375, -2.2672119140625, -2.10577392578125, -1.9443359375, -1.78289794921875, -1.6214599609375, -1.46002197265625, -1.298583984375, -1.13714599609375, -0.9757080078125, -0.81427001953125, -0.65283203125, -0.49139404296875, -0.3299560546875, -0.16851806640625, -0.007080078125, 0.15435791015625, 0.3157958984375, 0.47723388671875, 0.638671875, 0.80010986328125, 0.9615478515625, 1.12298583984375, 1.284423828125, 1.44586181640625, 1.6072998046875, 1.76873779296875, 1.93017578125, 2.09161376953125, 2.2530517578125, 2.41448974609375, 2.575927734375, 2.73736572265625, 2.8988037109375, 3.06024169921875, 3.2216796875, 3.38311767578125, 3.5445556640625, 3.70599365234375, 3.867431640625, 4.02886962890625, 4.1903076171875, 4.35174560546875, 4.51318359375, 4.67462158203125, 4.8360595703125, 4.99749755859375, 5.158935546875, 5.32037353515625, 5.4818115234375, 5.64324951171875, 5.8046875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 8.0, 5.0, 14.0, 10.0, 14.0, 20.0, 14.0, 27.0, 26.0, 40.0, 35.0, 35.0, 46.0, 54.0, 50.0, 52.0, 53.0, 54.0, 53.0, 47.0, 47.0, 47.0, 37.0, 23.0, 28.0, 39.0, 25.0, 20.0, 14.0, 12.0, 12.0, 4.0, 5.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.755992889404297, -17.209001541137695, -16.662010192871094, -16.115018844604492, -15.56802749633789, -15.021036148071289, -14.474045753479004, -13.927054405212402, -13.3800630569458, -12.8330717086792, -12.286080360412598, -11.739089012145996, -11.192098617553711, -10.64510726928711, -10.098115921020508, -9.551124572753906, -9.004133224487305, -8.457141876220703, -7.910150527954102, -7.363159656524658, -6.816168308258057, -6.269176959991455, -5.722186088562012, -5.17519474029541, -4.628203392028809, -4.081212043762207, -3.5342209339141846, -2.987229824066162, -2.4402384757995605, -1.893247127532959, -1.3462560176849365, -0.7992649078369141, -0.2522735595703125, 0.2947176694869995, 0.8417088985443115, 1.3887001276016235, 1.9356913566589355, 2.482682704925537, 3.0296738147735596, 3.576664924621582, 4.123656272888184, 4.670647621154785, 5.217638969421387, 5.76462984085083, 6.311621189117432, 6.858612537384033, 7.405603408813477, 7.952594757080078, 8.49958610534668, 9.046577453613281, 9.593568801879883, 10.140560150146484, 10.687551498413086, 11.234542846679688, 11.781533241271973, 12.328524589538574, 12.875515937805176, 13.422507286071777, 13.969498634338379, 14.51648998260498, 15.063480377197266, 15.610471725463867, 16.15746307373047, 16.70445442199707, 17.251445770263672]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 8.0, 5.0, 5.0, 6.0, 11.0, 11.0, 10.0, 14.0, 19.0, 19.0, 19.0, 25.0, 18.0, 25.0, 35.0, 27.0, 28.0, 30.0, 43.0, 33.0, 32.0, 38.0, 27.0, 38.0, 38.0, 34.0, 32.0, 34.0, 25.0, 32.0, 23.0, 30.0, 35.0, 26.0, 19.0, 18.0, 16.0, 17.0, 18.0, 16.0, 19.0, 6.0, 11.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.7020845413208, -9.396124839782715, -9.090165138244629, -8.78420639038086, -8.478246688842773, -8.172286987304688, -7.866327285766602, -7.560368061065674, -7.254408836364746, -6.94844913482666, -6.642489910125732, -6.3365302085876465, -6.030570983886719, -5.724611282348633, -5.418651580810547, -5.112692356109619, -4.806732654571533, -4.500772953033447, -4.1948137283325195, -3.8888540267944336, -3.582894802093506, -3.27693510055542, -2.970975637435913, -2.6650161743164062, -2.3590567111968994, -2.0530972480773926, -1.7471377849578857, -1.4411782026290894, -1.1352187395095825, -0.8292592763900757, -0.5232996940612793, -0.21734023094177246, 0.08861923217773438, 0.3945787250995636, 0.7005382180213928, 1.0064977407455444, 1.3124572038650513, 1.618416666984558, 1.9243762493133545, 2.2303357124328613, 2.536295175552368, 2.842254638671875, 3.148214101791382, 3.4541735649108887, 3.7601332664489746, 4.066092491149902, 4.372052192687988, 4.678011894226074, 4.983971118927002, 5.289930820465088, 5.595890045166016, 5.901849746704102, 6.207808971405029, 6.513768672943115, 6.819727897644043, 7.125687599182129, 7.431647300720215, 7.737607002258301, 8.043566703796387, 8.349525451660156, 8.655485153198242, 8.961444854736328, 9.267404556274414, 9.5733642578125, 9.87932300567627]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 9.0, 11.0, 27.0, 27.0, 69.0, 91.0, 125.0, 232.0, 364.0, 584.0, 996.0, 1530.0, 2577.0, 4309.0, 7073.0, 11893.0, 20196.0, 34496.0, 59493.0, 98685.0, 150991.0, 188987.0, 170730.0, 117805.0, 73009.0, 42597.0, 25169.0, 14509.0, 8687.0, 5158.0, 3199.0, 1912.0, 1131.0, 690.0, 431.0, 269.0, 159.0, 94.0, 79.0, 48.0, 30.0, 20.0, 15.0, 10.0, 4.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-1.4033203125, -1.3603973388671875, -1.317474365234375, -1.2745513916015625, -1.23162841796875, -1.1887054443359375, -1.145782470703125, -1.1028594970703125, -1.0599365234375, -1.0170135498046875, -0.974090576171875, -0.9311676025390625, -0.88824462890625, -0.8453216552734375, -0.802398681640625, -0.7594757080078125, -0.716552734375, -0.6736297607421875, -0.630706787109375, -0.5877838134765625, -0.54486083984375, -0.5019378662109375, -0.459014892578125, -0.4160919189453125, -0.3731689453125, -0.3302459716796875, -0.287322998046875, -0.2444000244140625, -0.20147705078125, -0.1585540771484375, -0.115631103515625, -0.0727081298828125, -0.02978515625, 0.0131378173828125, 0.056060791015625, 0.0989837646484375, 0.14190673828125, 0.1848297119140625, 0.227752685546875, 0.2706756591796875, 0.3135986328125, 0.3565216064453125, 0.399444580078125, 0.4423675537109375, 0.48529052734375, 0.5282135009765625, 0.571136474609375, 0.6140594482421875, 0.656982421875, 0.6999053955078125, 0.742828369140625, 0.7857513427734375, 0.82867431640625, 0.8715972900390625, 0.914520263671875, 0.9574432373046875, 1.0003662109375, 1.0432891845703125, 1.086212158203125, 1.1291351318359375, 1.17205810546875, 1.2149810791015625, 1.257904052734375, 1.3008270263671875, 1.34375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 7.0, 4.0, 7.0, 10.0, 8.0, 15.0, 12.0, 15.0, 17.0, 21.0, 31.0, 27.0, 30.0, 34.0, 27.0, 38.0, 36.0, 35.0, 44.0, 44.0, 49.0, 30.0, 32.0, 37.0, 33.0, 32.0, 38.0, 33.0, 32.0, 26.0, 34.0, 24.0, 18.0, 18.0, 18.0, 18.0, 12.0, 12.0, 9.0, 5.0, 8.0, 4.0, 0.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.4921875, -12.1234130859375, -11.754638671875, -11.3858642578125, -11.01708984375, -10.6483154296875, -10.279541015625, -9.9107666015625, -9.5419921875, -9.1732177734375, -8.804443359375, -8.4356689453125, -8.06689453125, -7.6981201171875, -7.329345703125, -6.9605712890625, -6.591796875, -6.2230224609375, -5.854248046875, -5.4854736328125, -5.11669921875, -4.7479248046875, -4.379150390625, -4.0103759765625, -3.6416015625, -3.2728271484375, -2.904052734375, -2.5352783203125, -2.16650390625, -1.7977294921875, -1.428955078125, -1.0601806640625, -0.69140625, -0.3226318359375, 0.046142578125, 0.4149169921875, 0.78369140625, 1.1524658203125, 1.521240234375, 1.8900146484375, 2.2587890625, 2.6275634765625, 2.996337890625, 3.3651123046875, 3.73388671875, 4.1026611328125, 4.471435546875, 4.8402099609375, 5.208984375, 5.5777587890625, 5.946533203125, 6.3153076171875, 6.68408203125, 7.0528564453125, 7.421630859375, 7.7904052734375, 8.1591796875, 8.5279541015625, 8.896728515625, 9.2655029296875, 9.63427734375, 10.0030517578125, 10.371826171875, 10.7406005859375, 11.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 11.0, 20.0, 35.0, 33.0, 46.0, 78.0, 104.0, 118.0, 214.0, 298.0, 435.0, 776.0, 1276.0, 2116.0, 3972.0, 7776.0, 16320.0, 42024.0, 786443.0, 137701.0, 24650.0, 11268.0, 5604.0, 2917.0, 1628.0, 981.0, 580.0, 362.0, 221.0, 175.0, 114.0, 80.0, 43.0, 41.0, 21.0, 16.0, 12.0, 11.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.849609375, -3.715728759765625, -3.58184814453125, -3.447967529296875, -3.3140869140625, -3.180206298828125, -3.04632568359375, -2.912445068359375, -2.778564453125, -2.644683837890625, -2.51080322265625, -2.376922607421875, -2.2430419921875, -2.109161376953125, -1.97528076171875, -1.841400146484375, -1.70751953125, -1.573638916015625, -1.43975830078125, -1.305877685546875, -1.1719970703125, -1.038116455078125, -0.90423583984375, -0.770355224609375, -0.636474609375, -0.502593994140625, -0.36871337890625, -0.234832763671875, -0.1009521484375, 0.032928466796875, 0.16680908203125, 0.300689697265625, 0.4345703125, 0.568450927734375, 0.70233154296875, 0.836212158203125, 0.9700927734375, 1.103973388671875, 1.23785400390625, 1.371734619140625, 1.505615234375, 1.639495849609375, 1.77337646484375, 1.907257080078125, 2.0411376953125, 2.175018310546875, 2.30889892578125, 2.442779541015625, 2.57666015625, 2.710540771484375, 2.84442138671875, 2.978302001953125, 3.1121826171875, 3.246063232421875, 3.37994384765625, 3.513824462890625, 3.647705078125, 3.781585693359375, 3.91546630859375, 4.049346923828125, 4.1832275390625, 4.317108154296875, 4.45098876953125, 4.584869384765625, 4.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 7.0, 5.0, 12.0, 15.0, 16.0, 20.0, 23.0, 18.0, 27.0, 25.0, 28.0, 26.0, 30.0, 37.0, 38.0, 36.0, 40.0, 33.0, 38.0, 41.0, 41.0, 45.0, 37.0, 40.0, 39.0, 48.0, 28.0, 29.0, 22.0, 29.0, 24.0, 20.0, 20.0, 16.0, 6.0, 7.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.7265625, -7.4775390625, -7.228515625, -6.9794921875, -6.73046875, -6.4814453125, -6.232421875, -5.9833984375, -5.734375, -5.4853515625, -5.236328125, -4.9873046875, -4.73828125, -4.4892578125, -4.240234375, -3.9912109375, -3.7421875, -3.4931640625, -3.244140625, -2.9951171875, -2.74609375, -2.4970703125, -2.248046875, -1.9990234375, -1.75, -1.5009765625, -1.251953125, -1.0029296875, -0.75390625, -0.5048828125, -0.255859375, -0.0068359375, 0.2421875, 0.4912109375, 0.740234375, 0.9892578125, 1.23828125, 1.4873046875, 1.736328125, 1.9853515625, 2.234375, 2.4833984375, 2.732421875, 2.9814453125, 3.23046875, 3.4794921875, 3.728515625, 3.9775390625, 4.2265625, 4.4755859375, 4.724609375, 4.9736328125, 5.22265625, 5.4716796875, 5.720703125, 5.9697265625, 6.21875, 6.4677734375, 6.716796875, 6.9658203125, 7.21484375, 7.4638671875, 7.712890625, 7.9619140625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 9.0, 5.0, 17.0, 15.0, 25.0, 30.0, 49.0, 57.0, 96.0, 129.0, 170.0, 254.0, 382.0, 517.0, 836.0, 1167.0, 1884.0, 2714.0, 4381.0, 7050.0, 11797.0, 22009.0, 73907.0, 841025.0, 36589.0, 17271.0, 9673.0, 5833.0, 3620.0, 2292.0, 1498.0, 989.0, 617.0, 484.0, 378.0, 243.0, 170.0, 101.0, 81.0, 63.0, 32.0, 30.0, 23.0, 14.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8271484375, -0.79986572265625, -0.7725830078125, -0.74530029296875, -0.718017578125, -0.69073486328125, -0.6634521484375, -0.63616943359375, -0.60888671875, -0.58160400390625, -0.5543212890625, -0.52703857421875, -0.499755859375, -0.47247314453125, -0.4451904296875, -0.41790771484375, -0.390625, -0.36334228515625, -0.3360595703125, -0.30877685546875, -0.281494140625, -0.25421142578125, -0.2269287109375, -0.19964599609375, -0.17236328125, -0.14508056640625, -0.1177978515625, -0.09051513671875, -0.063232421875, -0.03594970703125, -0.0086669921875, 0.01861572265625, 0.0458984375, 0.07318115234375, 0.1004638671875, 0.12774658203125, 0.155029296875, 0.18231201171875, 0.2095947265625, 0.23687744140625, 0.26416015625, 0.29144287109375, 0.3187255859375, 0.34600830078125, 0.373291015625, 0.40057373046875, 0.4278564453125, 0.45513916015625, 0.482421875, 0.50970458984375, 0.5369873046875, 0.56427001953125, 0.591552734375, 0.61883544921875, 0.6461181640625, 0.67340087890625, 0.70068359375, 0.72796630859375, 0.7552490234375, 0.78253173828125, 0.809814453125, 0.83709716796875, 0.8643798828125, 0.89166259765625, 0.9189453125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 5.0, 1.0, 8.0, 8.0, 7.0, 5.0, 19.0, 20.0, 12.0, 11.0, 18.0, 24.0, 21.0, 26.0, 37.0, 34.0, 36.0, 41.0, 58.0, 48.0, 30.0, 54.0, 54.0, 47.0, 36.0, 39.0, 36.0, 40.0, 27.0, 32.0, 35.0, 27.0, 21.0, 9.0, 11.0, 18.0, 11.0, 8.0, 8.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5762786865234375e-05, -3.473460674285889e-05, -3.37064266204834e-05, -3.267824649810791e-05, -3.165006637573242e-05, -3.0621886253356934e-05, -2.9593706130981445e-05, -2.8565526008605957e-05, -2.753734588623047e-05, -2.650916576385498e-05, -2.5480985641479492e-05, -2.4452805519104004e-05, -2.3424625396728516e-05, -2.2396445274353027e-05, -2.136826515197754e-05, -2.034008502960205e-05, -1.9311904907226562e-05, -1.8283724784851074e-05, -1.7255544662475586e-05, -1.6227364540100098e-05, -1.519918441772461e-05, -1.4171004295349121e-05, -1.3142824172973633e-05, -1.2114644050598145e-05, -1.1086463928222656e-05, -1.0058283805847168e-05, -9.03010368347168e-06, -8.001923561096191e-06, -6.973743438720703e-06, -5.945563316345215e-06, -4.9173831939697266e-06, -3.889203071594238e-06, -2.86102294921875e-06, -1.8328428268432617e-06, -8.046627044677734e-07, 2.2351741790771484e-07, 1.2516975402832031e-06, 2.2798776626586914e-06, 3.3080577850341797e-06, 4.336237907409668e-06, 5.364418029785156e-06, 6.3925981521606445e-06, 7.420778274536133e-06, 8.448958396911621e-06, 9.47713851928711e-06, 1.0505318641662598e-05, 1.1533498764038086e-05, 1.2561678886413574e-05, 1.3589859008789062e-05, 1.461803913116455e-05, 1.564621925354004e-05, 1.6674399375915527e-05, 1.7702579498291016e-05, 1.8730759620666504e-05, 1.9758939743041992e-05, 2.078711986541748e-05, 2.181529998779297e-05, 2.2843480110168457e-05, 2.3871660232543945e-05, 2.4899840354919434e-05, 2.5928020477294922e-05, 2.695620059967041e-05, 2.79843807220459e-05, 2.9012560844421387e-05, 3.0040740966796875e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 10.0, 5.0, 14.0, 21.0, 30.0, 30.0, 61.0, 102.0, 148.0, 265.0, 351.0, 525.0, 790.0, 1276.0, 2000.0, 3231.0, 5389.0, 8569.0, 14668.0, 25077.0, 42856.0, 73323.0, 121559.0, 179500.0, 195575.0, 147362.0, 92709.0, 54384.0, 31865.0, 18355.0, 10925.0, 6657.0, 4012.0, 2469.0, 1560.0, 1006.0, 661.0, 404.0, 287.0, 200.0, 119.0, 76.0, 46.0, 31.0, 21.0, 20.0, 8.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5256805419921875, -0.509857177734375, -0.4940338134765625, -0.47821044921875, -0.4623870849609375, -0.446563720703125, -0.4307403564453125, -0.4149169921875, -0.3990936279296875, -0.383270263671875, -0.3674468994140625, -0.35162353515625, -0.3358001708984375, -0.319976806640625, -0.3041534423828125, -0.288330078125, -0.2725067138671875, -0.256683349609375, -0.2408599853515625, -0.22503662109375, -0.2092132568359375, -0.193389892578125, -0.1775665283203125, -0.1617431640625, -0.1459197998046875, -0.130096435546875, -0.1142730712890625, -0.09844970703125, -0.0826263427734375, -0.066802978515625, -0.0509796142578125, -0.03515625, -0.0193328857421875, -0.003509521484375, 0.0123138427734375, 0.02813720703125, 0.0439605712890625, 0.059783935546875, 0.0756072998046875, 0.0914306640625, 0.1072540283203125, 0.123077392578125, 0.1389007568359375, 0.15472412109375, 0.1705474853515625, 0.186370849609375, 0.2021942138671875, 0.218017578125, 0.2338409423828125, 0.249664306640625, 0.2654876708984375, 0.28131103515625, 0.2971343994140625, 0.312957763671875, 0.3287811279296875, 0.3446044921875, 0.3604278564453125, 0.376251220703125, 0.3920745849609375, 0.40789794921875, 0.4237213134765625, 0.439544677734375, 0.4553680419921875, 0.47119140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 14.0, 13.0, 8.0, 18.0, 16.0, 15.0, 19.0, 39.0, 39.0, 47.0, 55.0, 55.0, 64.0, 68.0, 64.0, 72.0, 55.0, 65.0, 52.0, 41.0, 21.0, 23.0, 29.0, 19.0, 19.0, 13.0, 9.0, 4.0, 6.0, 9.0, 6.0, 2.0, 1.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18789291381835938, -0.18267059326171875, -0.17744827270507812, -0.1722259521484375, -0.16700363159179688, -0.16178131103515625, -0.15655899047851562, -0.151336669921875, -0.14611434936523438, -0.14089202880859375, -0.13566970825195312, -0.1304473876953125, -0.12522506713867188, -0.12000274658203125, -0.11478042602539062, -0.10955810546875, -0.10433578491210938, -0.09911346435546875, -0.09389114379882812, -0.0886688232421875, -0.08344650268554688, -0.07822418212890625, -0.07300186157226562, -0.067779541015625, -0.06255722045898438, -0.05733489990234375, -0.052112579345703125, -0.0468902587890625, -0.041667938232421875, -0.03644561767578125, -0.031223297119140625, -0.0260009765625, -0.020778656005859375, -0.01555633544921875, -0.010334014892578125, -0.0051116943359375, 0.000110626220703125, 0.00533294677734375, 0.010555267333984375, 0.015777587890625, 0.020999908447265625, 0.02622222900390625, 0.031444549560546875, 0.0366668701171875, 0.041889190673828125, 0.04711151123046875, 0.052333831787109375, 0.05755615234375, 0.06277847290039062, 0.06800079345703125, 0.07322311401367188, 0.0784454345703125, 0.08366775512695312, 0.08889007568359375, 0.09411239624023438, 0.099334716796875, 0.10455703735351562, 0.10977935791015625, 0.11500167846679688, 0.1202239990234375, 0.12544631958007812, 0.13066864013671875, 0.13589096069335938, 0.14111328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 6.0, 14.0, 11.0, 13.0, 20.0, 15.0, 19.0, 26.0, 37.0, 37.0, 36.0, 44.0, 47.0, 55.0, 50.0, 54.0, 48.0, 47.0, 54.0, 41.0, 49.0, 42.0, 30.0, 26.0, 35.0, 30.0, 19.0, 18.0, 16.0, 8.0, 7.0, 7.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.071125030517578, -16.5330867767334, -15.995046615600586, -15.457008361816406, -14.91896915435791, -14.380929946899414, -13.842891693115234, -13.304852485656738, -12.766813278198242, -12.228774070739746, -11.69073486328125, -11.15269660949707, -10.614657402038574, -10.076618194580078, -9.538579940795898, -9.000540733337402, -8.462501525878906, -7.92446231842041, -7.386423587799072, -6.848384857177734, -6.310345649719238, -5.772306442260742, -5.234267711639404, -4.696228981018066, -4.15818977355957, -3.6201508045196533, -3.0821118354797363, -2.5440728664398193, -2.0060338973999023, -1.4679949283599854, -0.9299559593200684, -0.39191699028015137, 0.14612388610839844, 0.6841628551483154, 1.2222018241882324, 1.7602407932281494, 2.2982797622680664, 2.8363187313079834, 3.3743577003479004, 3.9123966693878174, 4.450435638427734, 4.9884748458862305, 5.526513576507568, 6.064552307128906, 6.602591514587402, 7.140630722045898, 7.678669452667236, 8.216708183288574, 8.75474739074707, 9.292786598205566, 9.830825805664062, 10.368864059448242, 10.906903266906738, 11.444942474365234, 11.982980728149414, 12.52101993560791, 13.059059143066406, 13.597098350524902, 14.135137557983398, 14.673175811767578, 15.211215019226074, 15.74925422668457, 16.28729248046875, 16.825332641601562, 17.363370895385742]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 7.0, 4.0, 6.0, 5.0, 6.0, 13.0, 10.0, 10.0, 13.0, 19.0, 18.0, 18.0, 27.0, 18.0, 25.0, 32.0, 31.0, 27.0, 29.0, 46.0, 32.0, 31.0, 37.0, 35.0, 33.0, 37.0, 36.0, 28.0, 37.0, 24.0, 34.0, 25.0, 28.0, 34.0, 26.0, 19.0, 16.0, 18.0, 18.0, 16.0, 15.0, 19.0, 7.0, 11.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.865306854248047, -9.556503295898438, -9.247699737548828, -8.938896179199219, -8.63009262084961, -8.321290016174316, -8.012486457824707, -7.703682899475098, -7.394879341125488, -7.086075782775879, -6.7772722244262695, -6.468469142913818, -6.159665584564209, -5.8508620262146, -5.542058944702148, -5.233255386352539, -4.92445182800293, -4.61564826965332, -4.306844711303711, -3.9980416297912598, -3.6892380714416504, -3.380434513092041, -3.0716311931610107, -2.7628278732299805, -2.454024314880371, -2.1452207565307617, -1.8364174365997314, -1.5276139974594116, -1.2188105583190918, -0.910007119178772, -0.6012036800384521, -0.2924003601074219, 0.016402244567871094, 0.3252056837081909, 0.6340091228485107, 0.9428125619888306, 1.2516160011291504, 1.5604194402694702, 1.86922287940979, 2.1780261993408203, 2.4868297576904297, 2.795633316040039, 3.1044366359710693, 3.4132399559020996, 3.722043514251709, 4.030847072601318, 4.3396501541137695, 4.648453712463379, 4.957257270812988, 5.266060829162598, 5.574864387512207, 5.883667469024658, 6.192471027374268, 6.501274585723877, 6.810077667236328, 7.1188812255859375, 7.427684783935547, 7.736488342285156, 8.045291900634766, 8.354095458984375, 8.662899017333984, 8.971701622009277, 9.280505180358887, 9.589308738708496, 9.898112297058105]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 16.0, 15.0, 24.0, 33.0, 70.0, 83.0, 162.0, 247.0, 390.0, 630.0, 1089.0, 1913.0, 3379.0, 6409.0, 11348.0, 21308.0, 38771.0, 68895.0, 113305.0, 161112.0, 184051.0, 162827.0, 114693.0, 70139.0, 39483.0, 21756.0, 11647.0, 6384.0, 3496.0, 1967.0, 1159.0, 662.0, 416.0, 230.0, 162.0, 92.0, 59.0, 36.0, 28.0, 18.0, 8.0, 15.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-12.015625, -11.6461181640625, -11.276611328125, -10.9071044921875, -10.53759765625, -10.1680908203125, -9.798583984375, -9.4290771484375, -9.0595703125, -8.6900634765625, -8.320556640625, -7.9510498046875, -7.58154296875, -7.2120361328125, -6.842529296875, -6.4730224609375, -6.103515625, -5.7340087890625, -5.364501953125, -4.9949951171875, -4.62548828125, -4.2559814453125, -3.886474609375, -3.5169677734375, -3.1474609375, -2.7779541015625, -2.408447265625, -2.0389404296875, -1.66943359375, -1.2999267578125, -0.930419921875, -0.5609130859375, -0.19140625, 0.1781005859375, 0.547607421875, 0.9171142578125, 1.28662109375, 1.6561279296875, 2.025634765625, 2.3951416015625, 2.7646484375, 3.1341552734375, 3.503662109375, 3.8731689453125, 4.24267578125, 4.6121826171875, 4.981689453125, 5.3511962890625, 5.720703125, 6.0902099609375, 6.459716796875, 6.8292236328125, 7.19873046875, 7.5682373046875, 7.937744140625, 8.3072509765625, 8.6767578125, 9.0462646484375, 9.415771484375, 9.7852783203125, 10.15478515625, 10.5242919921875, 10.893798828125, 11.2633056640625, 11.6328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 9.0, 10.0, 16.0, 9.0, 18.0, 23.0, 27.0, 23.0, 36.0, 24.0, 25.0, 40.0, 43.0, 39.0, 38.0, 45.0, 47.0, 46.0, 46.0, 40.0, 44.0, 34.0, 37.0, 43.0, 26.0, 28.0, 36.0, 28.0, 14.0, 23.0, 17.0, 12.0, 13.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.0390625, -12.6461181640625, -12.253173828125, -11.8602294921875, -11.46728515625, -11.0743408203125, -10.681396484375, -10.2884521484375, -9.8955078125, -9.5025634765625, -9.109619140625, -8.7166748046875, -8.32373046875, -7.9307861328125, -7.537841796875, -7.1448974609375, -6.751953125, -6.3590087890625, -5.966064453125, -5.5731201171875, -5.18017578125, -4.7872314453125, -4.394287109375, -4.0013427734375, -3.6083984375, -3.2154541015625, -2.822509765625, -2.4295654296875, -2.03662109375, -1.6436767578125, -1.250732421875, -0.8577880859375, -0.46484375, -0.0718994140625, 0.321044921875, 0.7139892578125, 1.10693359375, 1.4998779296875, 1.892822265625, 2.2857666015625, 2.6787109375, 3.0716552734375, 3.464599609375, 3.8575439453125, 4.25048828125, 4.6434326171875, 5.036376953125, 5.4293212890625, 5.822265625, 6.2152099609375, 6.608154296875, 7.0010986328125, 7.39404296875, 7.7869873046875, 8.179931640625, 8.5728759765625, 8.9658203125, 9.3587646484375, 9.751708984375, 10.1446533203125, 10.53759765625, 10.9305419921875, 11.323486328125, 11.7164306640625, 12.109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 7.0, 19.0, 21.0, 37.0, 48.0, 74.0, 107.0, 169.0, 247.0, 374.0, 612.0, 1005.0, 1660.0, 2869.0, 4783.0, 8542.0, 15858.0, 29247.0, 56062.0, 103252.0, 172553.0, 217229.0, 183935.0, 114379.0, 62566.0, 32618.0, 17423.0, 9641.0, 5345.0, 3053.0, 1798.0, 1060.0, 679.0, 458.0, 270.0, 174.0, 108.0, 83.0, 55.0, 43.0, 31.0, 17.0, 15.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-19.125, -18.5380859375, -17.951171875, -17.3642578125, -16.77734375, -16.1904296875, -15.603515625, -15.0166015625, -14.4296875, -13.8427734375, -13.255859375, -12.6689453125, -12.08203125, -11.4951171875, -10.908203125, -10.3212890625, -9.734375, -9.1474609375, -8.560546875, -7.9736328125, -7.38671875, -6.7998046875, -6.212890625, -5.6259765625, -5.0390625, -4.4521484375, -3.865234375, -3.2783203125, -2.69140625, -2.1044921875, -1.517578125, -0.9306640625, -0.34375, 0.2431640625, 0.830078125, 1.4169921875, 2.00390625, 2.5908203125, 3.177734375, 3.7646484375, 4.3515625, 4.9384765625, 5.525390625, 6.1123046875, 6.69921875, 7.2861328125, 7.873046875, 8.4599609375, 9.046875, 9.6337890625, 10.220703125, 10.8076171875, 11.39453125, 11.9814453125, 12.568359375, 13.1552734375, 13.7421875, 14.3291015625, 14.916015625, 15.5029296875, 16.08984375, 16.6767578125, 17.263671875, 17.8505859375, 18.4375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 13.0, 12.0, 10.0, 16.0, 18.0, 17.0, 13.0, 20.0, 33.0, 21.0, 30.0, 38.0, 42.0, 44.0, 44.0, 48.0, 43.0, 37.0, 47.0, 48.0, 44.0, 47.0, 35.0, 33.0, 24.0, 32.0, 15.0, 33.0, 21.0, 27.0, 18.0, 10.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9375, -6.701904296875, -6.46630859375, -6.230712890625, -5.9951171875, -5.759521484375, -5.52392578125, -5.288330078125, -5.052734375, -4.817138671875, -4.58154296875, -4.345947265625, -4.1103515625, -3.874755859375, -3.63916015625, -3.403564453125, -3.16796875, -2.932373046875, -2.69677734375, -2.461181640625, -2.2255859375, -1.989990234375, -1.75439453125, -1.518798828125, -1.283203125, -1.047607421875, -0.81201171875, -0.576416015625, -0.3408203125, -0.105224609375, 0.13037109375, 0.365966796875, 0.6015625, 0.837158203125, 1.07275390625, 1.308349609375, 1.5439453125, 1.779541015625, 2.01513671875, 2.250732421875, 2.486328125, 2.721923828125, 2.95751953125, 3.193115234375, 3.4287109375, 3.664306640625, 3.89990234375, 4.135498046875, 4.37109375, 4.606689453125, 4.84228515625, 5.077880859375, 5.3134765625, 5.549072265625, 5.78466796875, 6.020263671875, 6.255859375, 6.491455078125, 6.72705078125, 6.962646484375, 7.1982421875, 7.433837890625, 7.66943359375, 7.905029296875, 8.140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 9.0, 11.0, 26.0, 31.0, 45.0, 53.0, 89.0, 134.0, 175.0, 230.0, 340.0, 515.0, 681.0, 947.0, 1463.0, 2214.0, 3277.0, 5222.0, 8441.0, 13862.0, 23301.0, 39998.0, 68952.0, 112389.0, 161351.0, 182344.0, 156916.0, 106713.0, 64578.0, 37127.0, 21955.0, 12818.0, 7762.0, 4865.0, 3041.0, 2000.0, 1394.0, 954.0, 705.0, 477.0, 336.0, 221.0, 168.0, 104.0, 79.0, 77.0, 46.0, 34.0, 22.0, 25.0, 8.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0], "bins": [-9.578125, -9.2828369140625, -8.987548828125, -8.6922607421875, -8.39697265625, -8.1016845703125, -7.806396484375, -7.5111083984375, -7.2158203125, -6.9205322265625, -6.625244140625, -6.3299560546875, -6.03466796875, -5.7393798828125, -5.444091796875, -5.1488037109375, -4.853515625, -4.5582275390625, -4.262939453125, -3.9676513671875, -3.67236328125, -3.3770751953125, -3.081787109375, -2.7864990234375, -2.4912109375, -2.1959228515625, -1.900634765625, -1.6053466796875, -1.31005859375, -1.0147705078125, -0.719482421875, -0.4241943359375, -0.12890625, 0.1663818359375, 0.461669921875, 0.7569580078125, 1.05224609375, 1.3475341796875, 1.642822265625, 1.9381103515625, 2.2333984375, 2.5286865234375, 2.823974609375, 3.1192626953125, 3.41455078125, 3.7098388671875, 4.005126953125, 4.3004150390625, 4.595703125, 4.8909912109375, 5.186279296875, 5.4815673828125, 5.77685546875, 6.0721435546875, 6.367431640625, 6.6627197265625, 6.9580078125, 7.2532958984375, 7.548583984375, 7.8438720703125, 8.13916015625, 8.4344482421875, 8.729736328125, 9.0250244140625, 9.3203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 10.0, 13.0, 22.0, 16.0, 22.0, 38.0, 52.0, 55.0, 46.0, 69.0, 80.0, 81.0, 66.0, 69.0, 71.0, 43.0, 48.0, 38.0, 27.0, 24.0, 17.0, 13.0, 13.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.0016374588012695312, -0.0015962719917297363, -0.0015550851821899414, -0.0015138983726501465, -0.0014727115631103516, -0.0014315247535705566, -0.0013903379440307617, -0.0013491511344909668, -0.0013079643249511719, -0.001266777515411377, -0.001225590705871582, -0.0011844038963317871, -0.0011432170867919922, -0.0011020302772521973, -0.0010608434677124023, -0.0010196566581726074, -0.0009784698486328125, -0.0009372830390930176, -0.0008960962295532227, -0.0008549094200134277, -0.0008137226104736328, -0.0007725358009338379, -0.000731348991394043, -0.000690162181854248, -0.0006489753723144531, -0.0006077885627746582, -0.0005666017532348633, -0.0005254149436950684, -0.00048422813415527344, -0.0004430413246154785, -0.0004018545150756836, -0.00036066770553588867, -0.00031948089599609375, -0.00027829408645629883, -0.0002371072769165039, -0.00019592046737670898, -0.00015473365783691406, -0.00011354684829711914, -7.236003875732422e-05, -3.11732292175293e-05, 1.0013580322265625e-05, 5.120038986206055e-05, 9.238719940185547e-05, 0.0001335740089416504, 0.0001747608184814453, 0.00021594762802124023, 0.00025713443756103516, 0.0002983212471008301, 0.000339508056640625, 0.0003806948661804199, 0.00042188167572021484, 0.00046306848526000977, 0.0005042552947998047, 0.0005454421043395996, 0.0005866289138793945, 0.0006278157234191895, 0.0006690025329589844, 0.0007101893424987793, 0.0007513761520385742, 0.0007925629615783691, 0.0008337497711181641, 0.000874936580657959, 0.0009161233901977539, 0.0009573101997375488, 0.0009984970092773438]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 10.0, 22.0, 27.0, 36.0, 61.0, 76.0, 107.0, 143.0, 228.0, 354.0, 479.0, 786.0, 1113.0, 1630.0, 2717.0, 4018.0, 6463.0, 10238.0, 17417.0, 29917.0, 51659.0, 87266.0, 137393.0, 178373.0, 176341.0, 133329.0, 84709.0, 49992.0, 28935.0, 16909.0, 10116.0, 6105.0, 4069.0, 2532.0, 1671.0, 1074.0, 738.0, 482.0, 311.0, 214.0, 141.0, 119.0, 72.0, 47.0, 31.0, 36.0, 15.0, 6.0, 4.0, 10.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.578125, -9.296142578125, -9.01416015625, -8.732177734375, -8.4501953125, -8.168212890625, -7.88623046875, -7.604248046875, -7.322265625, -7.040283203125, -6.75830078125, -6.476318359375, -6.1943359375, -5.912353515625, -5.63037109375, -5.348388671875, -5.06640625, -4.784423828125, -4.50244140625, -4.220458984375, -3.9384765625, -3.656494140625, -3.37451171875, -3.092529296875, -2.810546875, -2.528564453125, -2.24658203125, -1.964599609375, -1.6826171875, -1.400634765625, -1.11865234375, -0.836669921875, -0.5546875, -0.272705078125, 0.00927734375, 0.291259765625, 0.5732421875, 0.855224609375, 1.13720703125, 1.419189453125, 1.701171875, 1.983154296875, 2.26513671875, 2.547119140625, 2.8291015625, 3.111083984375, 3.39306640625, 3.675048828125, 3.95703125, 4.239013671875, 4.52099609375, 4.802978515625, 5.0849609375, 5.366943359375, 5.64892578125, 5.930908203125, 6.212890625, 6.494873046875, 6.77685546875, 7.058837890625, 7.3408203125, 7.622802734375, 7.90478515625, 8.186767578125, 8.46875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 7.0, 6.0, 6.0, 8.0, 11.0, 20.0, 21.0, 24.0, 24.0, 38.0, 36.0, 52.0, 61.0, 71.0, 65.0, 72.0, 51.0, 55.0, 56.0, 48.0, 41.0, 45.0, 28.0, 25.0, 16.0, 16.0, 12.0, 15.0, 15.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.455078125, -2.377197265625, -2.29931640625, -2.221435546875, -2.1435546875, -2.065673828125, -1.98779296875, -1.909912109375, -1.83203125, -1.754150390625, -1.67626953125, -1.598388671875, -1.5205078125, -1.442626953125, -1.36474609375, -1.286865234375, -1.208984375, -1.131103515625, -1.05322265625, -0.975341796875, -0.8974609375, -0.819580078125, -0.74169921875, -0.663818359375, -0.5859375, -0.508056640625, -0.43017578125, -0.352294921875, -0.2744140625, -0.196533203125, -0.11865234375, -0.040771484375, 0.037109375, 0.114990234375, 0.19287109375, 0.270751953125, 0.3486328125, 0.426513671875, 0.50439453125, 0.582275390625, 0.66015625, 0.738037109375, 0.81591796875, 0.893798828125, 0.9716796875, 1.049560546875, 1.12744140625, 1.205322265625, 1.283203125, 1.361083984375, 1.43896484375, 1.516845703125, 1.5947265625, 1.672607421875, 1.75048828125, 1.828369140625, 1.90625, 1.984130859375, 2.06201171875, 2.139892578125, 2.2177734375, 2.295654296875, 2.37353515625, 2.451416015625, 2.529296875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 3.0, 3.0, 8.0, 8.0, 8.0, 17.0, 16.0, 21.0, 23.0, 23.0, 26.0, 36.0, 42.0, 41.0, 31.0, 52.0, 52.0, 53.0, 67.0, 49.0, 54.0, 49.0, 52.0, 37.0, 36.0, 31.0, 30.0, 28.0, 19.0, 17.0, 13.0, 11.0, 11.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.077926635742188, -20.463621139526367, -19.849315643310547, -19.235010147094727, -18.620704650878906, -18.006399154663086, -17.392093658447266, -16.777786254882812, -16.163482666015625, -15.549177169799805, -14.934871673583984, -14.320566177368164, -13.706260681152344, -13.091955184936523, -12.477648735046387, -11.863343238830566, -11.24903678894043, -10.63473129272461, -10.020425796508789, -9.406120300292969, -8.791814804077148, -8.177509307861328, -7.563202857971191, -6.948897361755371, -6.334591865539551, -5.7202863693237305, -5.10598087310791, -4.491674900054932, -3.8773694038391113, -3.263063907623291, -2.6487581729888916, -2.034452438354492, -1.4201488494873047, -0.8058432340621948, -0.19153761863708496, 0.4227679967880249, 1.0370736122131348, 1.651379108428955, 2.2656848430633545, 2.879990577697754, 3.494296073913574, 4.1086015701293945, 4.722907066345215, 5.337213039398193, 5.951518535614014, 6.565824031829834, 7.1801300048828125, 7.794435501098633, 8.408740997314453, 9.023046493530273, 9.637351989746094, 10.251657485961914, 10.865962982177734, 11.480268478393555, 12.094574928283691, 12.708880424499512, 13.323185920715332, 13.937491416931152, 14.551796913146973, 15.166102409362793, 15.78040885925293, 16.39471435546875, 17.00901985168457, 17.62332534790039, 18.23763084411621]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 7.0, 10.0, 15.0, 17.0, 12.0, 10.0, 15.0, 21.0, 19.0, 33.0, 29.0, 26.0, 34.0, 33.0, 37.0, 47.0, 34.0, 38.0, 39.0, 40.0, 55.0, 27.0, 31.0, 34.0, 27.0, 36.0, 36.0, 27.0, 29.0, 23.0, 27.0, 12.0, 13.0, 13.0, 7.0, 18.0, 7.0, 7.0, 5.0, 7.0, 5.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.295456886291504, -12.856975555419922, -12.41849422454834, -11.980012893676758, -11.541531562805176, -11.103050231933594, -10.664569854736328, -10.22608757019043, -9.787607192993164, -9.349125862121582, -8.91064453125, -8.472163200378418, -8.033681869506836, -7.595200538635254, -7.15671968460083, -6.718238353729248, -6.279756546020508, -5.841275215148926, -5.402793884277344, -4.964312553405762, -4.52583122253418, -4.087349891662598, -3.648869037628174, -3.210387706756592, -2.7719063758850098, -2.3334250450134277, -1.8949438333511353, -1.4564626216888428, -1.0179812908172607, -0.5794999599456787, -0.14101886749267578, 0.29746246337890625, 0.7359437942504883, 1.1744251251220703, 1.6129063367843628, 2.0513875484466553, 2.4898688793182373, 2.9283502101898193, 3.3668313026428223, 3.8053126335144043, 4.243793964385986, 4.682275295257568, 5.12075662612915, 5.559237480163574, 5.997718811035156, 6.436200141906738, 6.87468147277832, 7.313162803649902, 7.751644134521484, 8.190125465393066, 8.628606796264648, 9.06708812713623, 9.505569458007812, 9.944050788879395, 10.382532119750977, 10.821012496948242, 11.25949478149414, 11.697976112365723, 12.136457443237305, 12.574938774108887, 13.013420104980469, 13.45190143585205, 13.890382766723633, 14.328863143920898, 14.76734447479248]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 4.0, 6.0, 13.0, 8.0, 23.0, 24.0, 29.0, 42.0, 49.0, 74.0, 90.0, 130.0, 185.0, 258.0, 410.0, 593.0, 1104.0, 1882.0, 4602.0, 496139.0, 10543.0, 3664.0, 1690.0, 909.0, 598.0, 325.0, 210.0, 174.0, 121.0, 111.0, 64.0, 33.0, 30.0, 28.0, 22.0, 25.0, 16.0, 9.0, 5.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.6606140136719, -263.2204895019531, -253.78036499023438, -244.34024047851562, -234.90011596679688, -225.45999145507812, -216.0198516845703, -206.57972717285156, -197.1396026611328, -187.69947814941406, -178.2593536376953, -168.81922912597656, -159.37908935546875, -149.93896484375, -140.49884033203125, -131.0587158203125, -121.61859130859375, -112.178466796875, -102.73834228515625, -93.29821014404297, -83.85808563232422, -74.41796112060547, -64.97782897949219, -55.53770446777344, -46.09757995605469, -36.65745544433594, -27.217327117919922, -17.77720069885254, -8.337074279785156, 1.1030502319335938, 10.54317855834961, 19.983306884765625, 29.423431396484375, 38.863555908203125, 48.30368423461914, 57.743812561035156, 67.1839370727539, 76.62406158447266, 86.06419372558594, 95.50431823730469, 104.94444274902344, 114.38456726074219, 123.82469177246094, 133.2648162841797, 142.7049560546875, 152.14508056640625, 161.585205078125, 171.02532958984375, 180.4654541015625, 189.90557861328125, 199.345703125, 208.78582763671875, 218.2259521484375, 227.66607666015625, 237.10621643066406, 246.5463409423828, 255.98646545410156, 265.4266052246094, 274.8667297363281, 284.3068542480469, 293.7469787597656, 303.1871032714844, 312.6272277832031, 322.0673522949219, 331.5074768066406]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 10.0, 12.0, 14.0, 18.0, 14.0, 6.0, 19.0, 18.0, 22.0, 30.0, 31.0, 27.0, 39.0, 31.0, 39.0, 40.0, 33.0, 32.0, 43.0, 1076.0, 44.0, 31.0, 28.0, 37.0, 26.0, 37.0, 30.0, 33.0, 21.0, 29.0, 19.0, 20.0, 9.0, 17.0, 10.0, 15.0, 4.0, 8.0, 4.0, 7.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-412.3919372558594, -398.66351318359375, -384.93511962890625, -371.20672607421875, -357.4783020019531, -343.7498779296875, -330.021484375, -316.2930908203125, -302.5646667480469, -288.83624267578125, -275.10784912109375, -261.37945556640625, -247.65103149414062, -233.92262268066406, -220.1942138671875, -206.46580505371094, -192.73739624023438, -179.0089874267578, -165.28057861328125, -151.5521697998047, -137.82376098632812, -124.09535217285156, -110.366943359375, -96.63853454589844, -82.91012573242188, -69.18171691894531, -55.45330810546875, -41.72489929199219, -27.996490478515625, -14.268081665039062, -0.5396728515625, 13.188735961914062, 26.917144775390625, 40.64555358886719, 54.37396240234375, 68.10237121582031, 81.83078002929688, 95.55918884277344, 109.28759765625, 123.01600646972656, 136.74441528320312, 150.4728240966797, 164.20123291015625, 177.9296417236328, 191.65805053710938, 205.38645935058594, 219.1148681640625, 232.84327697753906, 246.57168579101562, 260.30010986328125, 274.02850341796875, 287.75689697265625, 301.4853210449219, 315.2137451171875, 328.942138671875, 342.6705322265625, 356.3989562988281, 370.12738037109375, 383.85577392578125, 397.58416748046875, 411.3125915527344, 425.041015625, 438.7694091796875, 452.497802734375, 466.2262268066406]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 6.0, 4.0, 9.0, 12.0, 6.0, 11.0, 10.0, 15.0, 26.0, 31.0, 28.0, 35.0, 50.0, 83.0, 110.0, 157.0, 258.0, 328.0, 512.0, 690.0, 926.0, 1171.0, 1581.0, 2182.0, 3398.0, 4810.0, 11404.0, 31146528.0, 52135.0, 10468.0, 7266.0, 6639.0, 1471.0, 632.0, 417.0, 279.0, 247.0, 168.0, 126.0, 108.0, 85.0, 41.0, 22.0, 8.0, 7.0, 0.0, 0.0, 1.0], "bins": [-690.6199951171875, -674.8472900390625, -659.0745849609375, -643.3018798828125, -627.5291137695312, -611.7564086914062, -595.9837036132812, -580.2109985351562, -564.4382934570312, -548.6655883789062, -532.8928833007812, -517.1201171875, -501.3474426269531, -485.57470703125, -469.802001953125, -454.029296875, -438.2565612792969, -422.4838562011719, -406.71112060546875, -390.93841552734375, -375.16571044921875, -359.39300537109375, -343.6202697753906, -327.8475646972656, -312.0748291015625, -296.3021240234375, -280.5293884277344, -264.7566833496094, -248.98397827148438, -233.2112579345703, -217.43853759765625, -201.66583251953125, -185.89309692382812, -170.12037658691406, -154.34767150878906, -138.574951171875, -122.80223846435547, -107.02952575683594, -91.25680541992188, -75.48409271240234, -59.71138000488281, -43.93866729736328, -28.165950775146484, -12.393234252929688, 3.3794784545898438, 19.152191162109375, 34.92491149902344, 50.69762420654297, 66.4703369140625, 82.24304962158203, 98.01576232910156, 113.78848266601562, 129.56118774414062, 145.3339080810547, 161.10662841796875, 176.87933349609375, 192.6520538330078, 208.42477416992188, 224.19747924804688, 239.97019958496094, 255.742919921875, 271.515625, 287.288330078125, 303.0610656738281, 318.8337707519531]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 20.0, 23.0, 20.0, 40.0, 43.0, 57.0, 62.0, 93.0, 99.0, 88.0, 80.0, 83.0, 54.0, 51.0, 33.0, 34.0, 17.0, 20.0, 17.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-550.7784423828125, -535.5905151367188, -520.402587890625, -505.21466064453125, -490.0267028808594, -474.8387756347656, -459.6508483886719, -444.4629211425781, -429.27496337890625, -414.0870361328125, -398.89910888671875, -383.711181640625, -368.5232238769531, -353.3352966308594, -338.1473693847656, -322.9594421386719, -307.7715148925781, -292.5835876464844, -277.3956604003906, -262.20770263671875, -247.019775390625, -231.83184814453125, -216.6439208984375, -201.45599365234375, -186.26805114746094, -171.0801239013672, -155.89218139648438, -140.70425415039062, -125.51631927490234, -110.32838439941406, -95.14045715332031, -79.95252227783203, -64.76458740234375, -49.57665252685547, -34.38872146606445, -19.200790405273438, -4.012855529785156, 11.175079345703125, 26.363006591796875, 41.550941467285156, 56.73887634277344, 71.92681121826172, 87.11474609375, 102.30267333984375, 117.49060821533203, 132.6785430908203, 147.86647033691406, 163.05441284179688, 178.24234008789062, 193.43026733398438, 208.6182098388672, 223.80613708496094, 238.99407958984375, 254.1820068359375, 269.36993408203125, 284.557861328125, 299.74578857421875, 314.9337158203125, 330.12164306640625, 345.3095703125, 360.4975280761719, 375.6854553222656, 390.8733825683594, 406.0613098144531, 421.249267578125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 7.0, 4.0, 13.0, 11.0, 12.0, 16.0, 15.0, 7.0, 23.0, 21.0, 30.0, 30.0, 35.0, 49.0, 58.0, 71.0, 85.0, 69.0, 77.0, 55.0, 37.0, 36.0, 31.0, 28.0, 22.0, 28.0, 15.0, 13.0, 13.0, 9.0, 9.0, 20.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-474.1795654296875, -460.4901428222656, -446.80072021484375, -433.111328125, -419.4219055175781, -405.73248291015625, -392.0430908203125, -378.3536682128906, -364.66424560546875, -350.9748229980469, -337.285400390625, -323.59600830078125, -309.9065856933594, -296.2171630859375, -282.52777099609375, -268.8383483886719, -255.14892578125, -241.45950317382812, -227.7700958251953, -214.0806884765625, -200.39126586914062, -186.70184326171875, -173.01243591308594, -159.32302856445312, -145.63360595703125, -131.94418334960938, -118.25477600097656, -104.56536102294922, -90.87594604492188, -77.18653106689453, -63.49711608886719, -49.807701110839844, -36.118255615234375, -22.42884063720703, -8.739425659179688, 4.949989318847656, 18.639404296875, 32.328819274902344, 46.01823425292969, 59.70764923095703, 73.39706420898438, 87.08647918701172, 100.77589416503906, 114.4653091430664, 128.15472412109375, 141.84414672851562, 155.53355407714844, 169.22296142578125, 182.91238403320312, 196.601806640625, 210.2912139892578, 223.98062133789062, 237.6700439453125, 251.35946655273438, 265.04888916015625, 278.73828125, 292.4277038574219, 306.11712646484375, 319.8065185546875, 333.4959411621094, 347.18536376953125, 360.8747863769531, 374.564208984375, 388.25360107421875, 401.9430236816406]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 12.0, 12.0, 27.0, 39.0, 63.0, 91.0, 125.0, 198.0, 280.0, 422.0, 666.0, 972.0, 1409.0, 2289.0, 3595.0, 5950.0, 9764.0, 17205.0, 31923.0, 61449.0, 123836.0, 264246.0, 607553.0, 1620773.0, 789513.0, 336472.0, 153290.0, 74528.0, 38695.0, 20849.0, 11672.0, 6685.0, 3998.0, 2374.0, 1374.0, 784.0, 444.0, 283.0, 178.0, 91.0, 51.0, 47.0, 26.0, 13.0, 8.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.313232421875, -9.00927734375, -8.705322265625, -8.4013671875, -8.097412109375, -7.79345703125, -7.489501953125, -7.185546875, -6.881591796875, -6.57763671875, -6.273681640625, -5.9697265625, -5.665771484375, -5.36181640625, -5.057861328125, -4.75390625, -4.449951171875, -4.14599609375, -3.842041015625, -3.5380859375, -3.234130859375, -2.93017578125, -2.626220703125, -2.322265625, -2.018310546875, -1.71435546875, -1.410400390625, -1.1064453125, -0.802490234375, -0.49853515625, -0.194580078125, 0.109375, 0.413330078125, 0.71728515625, 1.021240234375, 1.3251953125, 1.629150390625, 1.93310546875, 2.237060546875, 2.541015625, 2.844970703125, 3.14892578125, 3.452880859375, 3.7568359375, 4.060791015625, 4.36474609375, 4.668701171875, 4.97265625, 5.276611328125, 5.58056640625, 5.884521484375, 6.1884765625, 6.492431640625, 6.79638671875, 7.100341796875, 7.404296875, 7.708251953125, 8.01220703125, 8.316162109375, 8.6201171875, 8.924072265625, 9.22802734375, 9.531982421875, 9.8359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 3.0, 13.0, 18.0, 7.0, 19.0, 13.0, 20.0, 26.0, 40.0, 54.0, 44.0, 41.0, 59.0, 62.0, 64.0, 62.0, 65.0, 60.0, 62.0, 38.0, 46.0, 25.0, 24.0, 24.0, 19.0, 16.0, 8.0, 9.0, 6.0, 6.0, 7.0, 2.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8542861938476562, -0.8282012939453125, -0.8021163940429688, -0.776031494140625, -0.7499465942382812, -0.7238616943359375, -0.6977767944335938, -0.67169189453125, -0.6456069946289062, -0.6195220947265625, -0.5934371948242188, -0.567352294921875, -0.5412673950195312, -0.5151824951171875, -0.48909759521484375, -0.4630126953125, -0.43692779541015625, -0.4108428955078125, -0.38475799560546875, -0.358673095703125, -0.33258819580078125, -0.3065032958984375, -0.28041839599609375, -0.25433349609375, -0.22824859619140625, -0.2021636962890625, -0.17607879638671875, -0.149993896484375, -0.12390899658203125, -0.0978240966796875, -0.07173919677734375, -0.045654296875, -0.01956939697265625, 0.0065155029296875, 0.03260040283203125, 0.058685302734375, 0.08477020263671875, 0.1108551025390625, 0.13694000244140625, 0.16302490234375, 0.18910980224609375, 0.2151947021484375, 0.24127960205078125, 0.267364501953125, 0.29344940185546875, 0.3195343017578125, 0.34561920166015625, 0.3717041015625, 0.39778900146484375, 0.4238739013671875, 0.44995880126953125, 0.476043701171875, 0.5021286010742188, 0.5282135009765625, 0.5542984008789062, 0.58038330078125, 0.6064682006835938, 0.6325531005859375, 0.6586380004882812, 0.684722900390625, 0.7108078002929688, 0.7368927001953125, 0.7629776000976562, 0.7890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 1.0, 5.0, 15.0, 19.0, 19.0, 27.0, 48.0, 47.0, 92.0, 133.0, 199.0, 337.0, 635.0, 1200.0, 2583.0, 6389.0, 17607.0, 55745.0, 199260.0, 735735.0, 1958032.0, 877025.0, 239232.0, 66075.0, 20448.0, 7354.0, 2967.0, 1358.0, 690.0, 371.0, 217.0, 124.0, 93.0, 55.0, 37.0, 24.0, 10.0, 13.0, 11.0, 10.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.7890625, -10.4857177734375, -10.182373046875, -9.8790283203125, -9.57568359375, -9.2723388671875, -8.968994140625, -8.6656494140625, -8.3623046875, -8.0589599609375, -7.755615234375, -7.4522705078125, -7.14892578125, -6.8455810546875, -6.542236328125, -6.2388916015625, -5.935546875, -5.6322021484375, -5.328857421875, -5.0255126953125, -4.72216796875, -4.4188232421875, -4.115478515625, -3.8121337890625, -3.5087890625, -3.2054443359375, -2.902099609375, -2.5987548828125, -2.29541015625, -1.9920654296875, -1.688720703125, -1.3853759765625, -1.08203125, -0.7786865234375, -0.475341796875, -0.1719970703125, 0.13134765625, 0.4346923828125, 0.738037109375, 1.0413818359375, 1.3447265625, 1.6480712890625, 1.951416015625, 2.2547607421875, 2.55810546875, 2.8614501953125, 3.164794921875, 3.4681396484375, 3.771484375, 4.0748291015625, 4.378173828125, 4.6815185546875, 4.98486328125, 5.2882080078125, 5.591552734375, 5.8948974609375, 6.1982421875, 6.5015869140625, 6.804931640625, 7.1082763671875, 7.41162109375, 7.7149658203125, 8.018310546875, 8.3216552734375, 8.625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 17.0, 34.0, 46.0, 45.0, 81.0, 91.0, 104.0, 115.0, 180.0, 194.0, 282.0, 289.0, 417.0, 485.0, 322.0, 266.0, 235.0, 189.0, 144.0, 114.0, 86.0, 83.0, 61.0, 33.0, 42.0, 16.0, 15.0, 19.0, 10.0, 7.0, 5.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.408966064453125, -2.31988525390625, -2.230804443359375, -2.1417236328125, -2.052642822265625, -1.96356201171875, -1.874481201171875, -1.785400390625, -1.696319580078125, -1.60723876953125, -1.518157958984375, -1.4290771484375, -1.339996337890625, -1.25091552734375, -1.161834716796875, -1.07275390625, -0.983673095703125, -0.89459228515625, -0.805511474609375, -0.7164306640625, -0.627349853515625, -0.53826904296875, -0.449188232421875, -0.360107421875, -0.271026611328125, -0.18194580078125, -0.092864990234375, -0.0037841796875, 0.085296630859375, 0.17437744140625, 0.263458251953125, 0.3525390625, 0.441619873046875, 0.53070068359375, 0.619781494140625, 0.7088623046875, 0.797943115234375, 0.88702392578125, 0.976104736328125, 1.065185546875, 1.154266357421875, 1.24334716796875, 1.332427978515625, 1.4215087890625, 1.510589599609375, 1.59967041015625, 1.688751220703125, 1.77783203125, 1.866912841796875, 1.95599365234375, 2.045074462890625, 2.1341552734375, 2.223236083984375, 2.31231689453125, 2.401397705078125, 2.490478515625, 2.579559326171875, 2.66864013671875, 2.757720947265625, 2.8468017578125, 2.935882568359375, 3.02496337890625, 3.114044189453125, 3.203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 5.0, 11.0, 9.0, 12.0, 19.0, 22.0, 35.0, 40.0, 53.0, 65.0, 64.0, 65.0, 67.0, 87.0, 65.0, 80.0, 62.0, 60.0, 41.0, 37.0, 16.0, 15.0, 13.0, 9.0, 9.0, 6.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.275325775146484, -27.48114585876465, -26.686967849731445, -25.89278793334961, -25.098608016967773, -24.30443000793457, -23.510250091552734, -22.71607208251953, -21.921892166137695, -21.12771224975586, -20.333534240722656, -19.53935432434082, -18.745174407958984, -17.95099639892578, -17.156816482543945, -16.36263656616211, -15.56845760345459, -14.77427864074707, -13.980098724365234, -13.185919761657715, -12.391740798950195, -11.59756088256836, -10.80338191986084, -10.00920295715332, -9.215023040771484, -8.420844078063965, -7.626664638519287, -6.832485198974609, -6.03830623626709, -5.244126796722412, -4.449947357177734, -3.655768394470215, -2.8615894317626953, -2.0674102306365967, -1.2732309103012085, -0.4790515899658203, 0.3151276111602783, 1.109306812286377, 1.9034862518310547, 2.697665214538574, 3.491844654083252, 4.28602409362793, 5.080203056335449, 5.874382495880127, 6.668561935424805, 7.462740898132324, 8.256919860839844, 9.05109977722168, 9.8452787399292, 10.639457702636719, 11.433637619018555, 12.227816581726074, 13.021995544433594, 13.81617546081543, 14.61035442352295, 15.404533386230469, 16.198713302612305, 16.99289321899414, 17.787071228027344, 18.58125114440918, 19.375431060791016, 20.16960906982422, 20.963788986206055, 21.75796890258789, 22.552146911621094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 5.0, 8.0, 14.0, 12.0, 7.0, 20.0, 16.0, 13.0, 22.0, 30.0, 37.0, 33.0, 40.0, 36.0, 40.0, 40.0, 44.0, 54.0, 40.0, 39.0, 33.0, 28.0, 35.0, 46.0, 39.0, 39.0, 32.0, 15.0, 22.0, 34.0, 13.0, 18.0, 14.0, 5.0, 10.0, 7.0, 5.0, 12.0, 5.0, 3.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-16.215167999267578, -15.719022750854492, -15.222877502441406, -14.72673225402832, -14.230587005615234, -13.734441757202148, -13.238296508789062, -12.742151260375977, -12.24600601196289, -11.749860763549805, -11.253715515136719, -10.757570266723633, -10.261425018310547, -9.765279769897461, -9.269134521484375, -8.772989273071289, -8.276844024658203, -7.780698776245117, -7.284553527832031, -6.788408279418945, -6.292263031005859, -5.796117782592773, -5.2999725341796875, -4.803827285766602, -4.307682037353516, -3.8115367889404297, -3.3153915405273438, -2.819246292114258, -2.323101043701172, -1.826955795288086, -1.330810546875, -0.8346652984619141, -0.3385200500488281, 0.1576251983642578, 0.6537704467773438, 1.1499156951904297, 1.6460609436035156, 2.1422061920166016, 2.6383514404296875, 3.1344966888427734, 3.6306419372558594, 4.126787185668945, 4.622932434082031, 5.119077682495117, 5.615222930908203, 6.111368179321289, 6.607513427734375, 7.103658676147461, 7.599803924560547, 8.095949172973633, 8.592094421386719, 9.088239669799805, 9.58438491821289, 10.080530166625977, 10.576675415039062, 11.072820663452148, 11.568965911865234, 12.06511116027832, 12.561256408691406, 13.057401657104492, 13.553546905517578, 14.049692153930664, 14.54583740234375, 15.041982650756836, 15.538127899169922]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 7.0, 2.0, 4.0, 8.0, 9.0, 9.0, 22.0, 32.0, 33.0, 53.0, 73.0, 127.0, 150.0, 233.0, 371.0, 507.0, 845.0, 1300.0, 2082.0, 3552.0, 6047.0, 10742.0, 20464.0, 40791.0, 86796.0, 187705.0, 304868.0, 198050.0, 91642.0, 42811.0, 21433.0, 11550.0, 6435.0, 3712.0, 2208.0, 1355.0, 886.0, 554.0, 363.0, 205.0, 155.0, 112.0, 70.0, 49.0, 33.0, 27.0, 25.0, 17.0, 11.0, 4.0, 9.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-5.91796875, -5.736083984375, -5.55419921875, -5.372314453125, -5.1904296875, -5.008544921875, -4.82666015625, -4.644775390625, -4.462890625, -4.281005859375, -4.09912109375, -3.917236328125, -3.7353515625, -3.553466796875, -3.37158203125, -3.189697265625, -3.0078125, -2.825927734375, -2.64404296875, -2.462158203125, -2.2802734375, -2.098388671875, -1.91650390625, -1.734619140625, -1.552734375, -1.370849609375, -1.18896484375, -1.007080078125, -0.8251953125, -0.643310546875, -0.46142578125, -0.279541015625, -0.09765625, 0.084228515625, 0.26611328125, 0.447998046875, 0.6298828125, 0.811767578125, 0.99365234375, 1.175537109375, 1.357421875, 1.539306640625, 1.72119140625, 1.903076171875, 2.0849609375, 2.266845703125, 2.44873046875, 2.630615234375, 2.8125, 2.994384765625, 3.17626953125, 3.358154296875, 3.5400390625, 3.721923828125, 3.90380859375, 4.085693359375, 4.267578125, 4.449462890625, 4.63134765625, 4.813232421875, 4.9951171875, 5.177001953125, 5.35888671875, 5.540771484375, 5.72265625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 0.0, 2.0, 4.0, 3.0, 7.0, 3.0, 10.0, 8.0, 10.0, 22.0, 18.0, 18.0, 26.0, 36.0, 31.0, 36.0, 64.0, 55.0, 53.0, 47.0, 55.0, 61.0, 57.0, 59.0, 44.0, 32.0, 37.0, 48.0, 26.0, 21.0, 19.0, 19.0, 15.0, 13.0, 8.0, 4.0, 9.0, 6.0, 4.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0234375, -0.9931640625, -0.962890625, -0.9326171875, -0.90234375, -0.8720703125, -0.841796875, -0.8115234375, -0.78125, -0.7509765625, -0.720703125, -0.6904296875, -0.66015625, -0.6298828125, -0.599609375, -0.5693359375, -0.5390625, -0.5087890625, -0.478515625, -0.4482421875, -0.41796875, -0.3876953125, -0.357421875, -0.3271484375, -0.296875, -0.2666015625, -0.236328125, -0.2060546875, -0.17578125, -0.1455078125, -0.115234375, -0.0849609375, -0.0546875, -0.0244140625, 0.005859375, 0.0361328125, 0.06640625, 0.0966796875, 0.126953125, 0.1572265625, 0.1875, 0.2177734375, 0.248046875, 0.2783203125, 0.30859375, 0.3388671875, 0.369140625, 0.3994140625, 0.4296875, 0.4599609375, 0.490234375, 0.5205078125, 0.55078125, 0.5810546875, 0.611328125, 0.6416015625, 0.671875, 0.7021484375, 0.732421875, 0.7626953125, 0.79296875, 0.8232421875, 0.853515625, 0.8837890625, 0.9140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 12.0, 8.0, 8.0, 16.0, 25.0, 24.0, 44.0, 69.0, 100.0, 200.0, 357.0, 641.0, 1296.0, 2770.0, 6974.0, 20730.0, 84097.0, 496751.0, 348553.0, 59587.0, 15989.0, 5595.0, 2295.0, 1076.0, 544.0, 300.0, 176.0, 108.0, 66.0, 35.0, 23.0, 21.0, 9.0, 6.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.99609375, -7.73724365234375, -7.4783935546875, -7.21954345703125, -6.960693359375, -6.70184326171875, -6.4429931640625, -6.18414306640625, -5.92529296875, -5.66644287109375, -5.4075927734375, -5.14874267578125, -4.889892578125, -4.63104248046875, -4.3721923828125, -4.11334228515625, -3.8544921875, -3.59564208984375, -3.3367919921875, -3.07794189453125, -2.819091796875, -2.56024169921875, -2.3013916015625, -2.04254150390625, -1.78369140625, -1.52484130859375, -1.2659912109375, -1.00714111328125, -0.748291015625, -0.48944091796875, -0.2305908203125, 0.02825927734375, 0.287109375, 0.54595947265625, 0.8048095703125, 1.06365966796875, 1.322509765625, 1.58135986328125, 1.8402099609375, 2.09906005859375, 2.35791015625, 2.61676025390625, 2.8756103515625, 3.13446044921875, 3.393310546875, 3.65216064453125, 3.9110107421875, 4.16986083984375, 4.4287109375, 4.68756103515625, 4.9464111328125, 5.20526123046875, 5.464111328125, 5.72296142578125, 5.9818115234375, 6.24066162109375, 6.49951171875, 6.75836181640625, 7.0172119140625, 7.27606201171875, 7.534912109375, 7.79376220703125, 8.0526123046875, 8.31146240234375, 8.5703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0, 10.0, 10.0, 14.0, 19.0, 13.0, 11.0, 15.0, 21.0, 30.0, 21.0, 36.0, 28.0, 27.0, 36.0, 28.0, 38.0, 38.0, 39.0, 32.0, 41.0, 35.0, 32.0, 43.0, 27.0, 29.0, 41.0, 38.0, 27.0, 20.0, 27.0, 22.0, 23.0, 17.0, 17.0, 8.0, 6.0, 7.0, 7.0, 7.0, 6.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.763671875, -3.645416259765625, -3.52716064453125, -3.408905029296875, -3.2906494140625, -3.172393798828125, -3.05413818359375, -2.935882568359375, -2.817626953125, -2.699371337890625, -2.58111572265625, -2.462860107421875, -2.3446044921875, -2.226348876953125, -2.10809326171875, -1.989837646484375, -1.87158203125, -1.753326416015625, -1.63507080078125, -1.516815185546875, -1.3985595703125, -1.280303955078125, -1.16204833984375, -1.043792724609375, -0.925537109375, -0.807281494140625, -0.68902587890625, -0.570770263671875, -0.4525146484375, -0.334259033203125, -0.21600341796875, -0.097747802734375, 0.0205078125, 0.138763427734375, 0.25701904296875, 0.375274658203125, 0.4935302734375, 0.611785888671875, 0.73004150390625, 0.848297119140625, 0.966552734375, 1.084808349609375, 1.20306396484375, 1.321319580078125, 1.4395751953125, 1.557830810546875, 1.67608642578125, 1.794342041015625, 1.91259765625, 2.030853271484375, 2.14910888671875, 2.267364501953125, 2.3856201171875, 2.503875732421875, 2.62213134765625, 2.740386962890625, 2.858642578125, 2.976898193359375, 3.09515380859375, 3.213409423828125, 3.3316650390625, 3.449920654296875, 3.56817626953125, 3.686431884765625, 3.8046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 7.0, 7.0, 15.0, 38.0, 73.0, 133.0, 322.0, 1689.0, 38011.0, 1000172.0, 6875.0, 762.0, 252.0, 89.0, 36.0, 24.0, 12.0, 12.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3125, -63.69140625, -62.0703125, -60.44921875, -58.828125, -57.20703125, -55.5859375, -53.96484375, -52.34375, -50.72265625, -49.1015625, -47.48046875, -45.859375, -44.23828125, -42.6171875, -40.99609375, -39.375, -37.75390625, -36.1328125, -34.51171875, -32.890625, -31.26953125, -29.6484375, -28.02734375, -26.40625, -24.78515625, -23.1640625, -21.54296875, -19.921875, -18.30078125, -16.6796875, -15.05859375, -13.4375, -11.81640625, -10.1953125, -8.57421875, -6.953125, -5.33203125, -3.7109375, -2.08984375, -0.46875, 1.15234375, 2.7734375, 4.39453125, 6.015625, 7.63671875, 9.2578125, 10.87890625, 12.5, 14.12109375, 15.7421875, 17.36328125, 18.984375, 20.60546875, 22.2265625, 23.84765625, 25.46875, 27.08984375, 28.7109375, 30.33203125, 31.953125, 33.57421875, 35.1953125, 36.81640625, 38.4375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 15.0, 20.0, 30.0, 51.0, 50.0, 58.0, 78.0, 91.0, 89.0, 96.0, 95.0, 74.0, 49.0, 34.0, 29.0, 34.0, 13.0, 18.0, 10.0, 10.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042724609375, -0.0004123672842979431, -0.00039748847484588623, -0.00038260966539382935, -0.00036773085594177246, -0.0003528520464897156, -0.0003379732370376587, -0.0003230944275856018, -0.0003082156181335449, -0.00029333680868148804, -0.00027845799922943115, -0.00026357918977737427, -0.0002487003803253174, -0.0002338215708732605, -0.0002189427614212036, -0.00020406395196914673, -0.00018918514251708984, -0.00017430633306503296, -0.00015942752361297607, -0.0001445487141609192, -0.0001296699047088623, -0.00011479109525680542, -9.991228580474854e-05, -8.503347635269165e-05, -7.015466690063477e-05, -5.527585744857788e-05, -4.0397047996520996e-05, -2.551823854446411e-05, -1.0639429092407227e-05, 4.239380359649658e-06, 1.9118189811706543e-05, 3.399699926376343e-05, 4.887580871582031e-05, 6.37546181678772e-05, 7.863342761993408e-05, 9.351223707199097e-05, 0.00010839104652404785, 0.00012326985597610474, 0.00013814866542816162, 0.0001530274748802185, 0.0001679062843322754, 0.00018278509378433228, 0.00019766390323638916, 0.00021254271268844604, 0.00022742152214050293, 0.00024230033159255981, 0.0002571791410446167, 0.0002720579504966736, 0.00028693675994873047, 0.00030181556940078735, 0.00031669437885284424, 0.0003315731883049011, 0.000346451997756958, 0.0003613308072090149, 0.0003762096166610718, 0.00039108842611312866, 0.00040596723556518555, 0.00042084604501724243, 0.0004357248544692993, 0.0004506036639213562, 0.0004654824733734131, 0.00048036128282546997, 0.0004952400922775269, 0.0005101189017295837, 0.0005249977111816406]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 5.0, 13.0, 21.0, 14.0, 23.0, 41.0, 46.0, 68.0, 108.0, 143.0, 223.0, 422.0, 706.0, 1335.0, 2847.0, 6937.0, 21371.0, 101802.0, 614353.0, 241318.0, 37880.0, 10630.0, 4083.0, 1885.0, 871.0, 512.0, 284.0, 182.0, 125.0, 84.0, 47.0, 40.0, 34.0, 26.0, 13.0, 15.0, 6.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.03125, -8.7166748046875, -8.402099609375, -8.0875244140625, -7.77294921875, -7.4583740234375, -7.143798828125, -6.8292236328125, -6.5146484375, -6.2000732421875, -5.885498046875, -5.5709228515625, -5.25634765625, -4.9417724609375, -4.627197265625, -4.3126220703125, -3.998046875, -3.6834716796875, -3.368896484375, -3.0543212890625, -2.73974609375, -2.4251708984375, -2.110595703125, -1.7960205078125, -1.4814453125, -1.1668701171875, -0.852294921875, -0.5377197265625, -0.22314453125, 0.0914306640625, 0.406005859375, 0.7205810546875, 1.03515625, 1.3497314453125, 1.664306640625, 1.9788818359375, 2.29345703125, 2.6080322265625, 2.922607421875, 3.2371826171875, 3.5517578125, 3.8663330078125, 4.180908203125, 4.4954833984375, 4.81005859375, 5.1246337890625, 5.439208984375, 5.7537841796875, 6.068359375, 6.3829345703125, 6.697509765625, 7.0120849609375, 7.32666015625, 7.6412353515625, 7.955810546875, 8.2703857421875, 8.5849609375, 8.8995361328125, 9.214111328125, 9.5286865234375, 9.84326171875, 10.1578369140625, 10.472412109375, 10.7869873046875, 11.1015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 18.0, 28.0, 37.0, 52.0, 112.0, 154.0, 184.0, 166.0, 98.0, 44.0, 30.0, 21.0, 7.0, 6.0, 7.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.46875, -9.20721435546875, -8.9456787109375, -8.68414306640625, -8.422607421875, -8.16107177734375, -7.8995361328125, -7.63800048828125, -7.37646484375, -7.11492919921875, -6.8533935546875, -6.59185791015625, -6.330322265625, -6.06878662109375, -5.8072509765625, -5.54571533203125, -5.2841796875, -5.02264404296875, -4.7611083984375, -4.49957275390625, -4.238037109375, -3.97650146484375, -3.7149658203125, -3.45343017578125, -3.19189453125, -2.93035888671875, -2.6688232421875, -2.40728759765625, -2.145751953125, -1.88421630859375, -1.6226806640625, -1.36114501953125, -1.099609375, -0.83807373046875, -0.5765380859375, -0.31500244140625, -0.053466796875, 0.20806884765625, 0.4696044921875, 0.73114013671875, 0.99267578125, 1.25421142578125, 1.5157470703125, 1.77728271484375, 2.038818359375, 2.30035400390625, 2.5618896484375, 2.82342529296875, 3.0849609375, 3.34649658203125, 3.6080322265625, 3.86956787109375, 4.131103515625, 4.39263916015625, 4.6541748046875, 4.91571044921875, 5.17724609375, 5.43878173828125, 5.7003173828125, 5.96185302734375, 6.223388671875, 6.48492431640625, 6.7464599609375, 7.00799560546875, 7.26953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 14.0, 18.0, 62.0, 248.0, 390.0, 163.0, 63.0, 18.0, 7.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.04808807373047, -68.29481506347656, -63.54153823852539, -58.788265228271484, -54.03498840332031, -49.281715393066406, -44.5284423828125, -39.77516555786133, -35.02189254760742, -30.268617630004883, -25.515342712402344, -20.762069702148438, -16.0087947845459, -11.25551986694336, -6.502246856689453, -1.7489700317382812, 3.004302978515625, 7.757577419281006, 12.510851860046387, 17.26412582397461, 22.01740074157715, 26.770675659179688, 31.523948669433594, 36.277225494384766, 41.03049850463867, 45.78377151489258, 50.53704833984375, 55.290321350097656, 60.04359436035156, 64.796875, 69.55014038085938, 74.30342102050781, 79.05668640136719, 83.8099594116211, 88.563232421875, 93.31651306152344, 98.06978607177734, 102.82305908203125, 107.57633209228516, 112.32960510253906, 117.0828857421875, 121.8361587524414, 126.58943176269531, 131.34271240234375, 136.09597778320312, 140.84925842285156, 145.6025390625, 150.35580444335938, 155.10906982421875, 159.8623504638672, 164.61561584472656, 169.368896484375, 174.12216186523438, 178.8754425048828, 183.62872314453125, 188.38198852539062, 193.13526916503906, 197.8885498046875, 202.64181518554688, 207.3950958251953, 212.1483612060547, 216.90164184570312, 221.6549072265625, 226.40818786621094, 231.16146850585938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 6.0, 10.0, 15.0, 24.0, 27.0, 45.0, 64.0, 102.0, 134.0, 141.0, 132.0, 94.0, 74.0, 42.0, 28.0, 8.0, 13.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.29398345947266, -88.3702392578125, -85.44650268554688, -82.52275848388672, -79.59901428222656, -76.67527770996094, -73.75153350830078, -70.82778930664062, -67.904052734375, -64.98030853271484, -62.05657196044922, -59.13282775878906, -56.20908737182617, -53.28534698486328, -50.361602783203125, -47.437862396240234, -44.514122009277344, -41.59038162231445, -38.66664123535156, -35.742897033691406, -32.819156646728516, -29.895416259765625, -26.9716739654541, -24.047931671142578, -21.124191284179688, -18.200450897216797, -15.276708602905273, -12.352967262268066, -9.42922592163086, -6.505484580993652, -3.5817432403564453, -0.6580009460449219, 2.2657318115234375, 5.1894731521606445, 8.113214492797852, 11.036955833435059, 13.960697174072266, 16.884437561035156, 19.80817985534668, 22.731922149658203, 25.655662536621094, 28.579402923583984, 31.503145217895508, 34.42688751220703, 37.35062789916992, 40.27436828613281, 43.19811248779297, 46.12185287475586, 49.04559326171875, 51.96933364868164, 54.89307403564453, 57.81681823730469, 60.74055862426758, 63.66429901123047, 66.58804321289062, 69.51177978515625, 72.4355239868164, 75.35926818847656, 78.28300476074219, 81.20674896240234, 84.1304931640625, 87.05422973632812, 89.97797393798828, 92.90171813964844, 95.82545471191406]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 12.0, 9.0, 12.0, 17.0, 31.0, 47.0, 76.0, 105.0, 214.0, 358.0, 579.0, 1131.0, 2268.0, 4944.0, 11589.0, 30242.0, 94326.0, 424416.0, 3273166.0, 244358.0, 66140.0, 22919.0, 9320.0, 4120.0, 1868.0, 890.0, 490.0, 219.0, 168.0, 83.0, 48.0, 39.0, 25.0, 21.0, 12.0, 7.0, 8.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.5625, -22.810791015625, -22.05908203125, -21.307373046875, -20.5556640625, -19.803955078125, -19.05224609375, -18.300537109375, -17.548828125, -16.797119140625, -16.04541015625, -15.293701171875, -14.5419921875, -13.790283203125, -13.03857421875, -12.286865234375, -11.53515625, -10.783447265625, -10.03173828125, -9.280029296875, -8.5283203125, -7.776611328125, -7.02490234375, -6.273193359375, -5.521484375, -4.769775390625, -4.01806640625, -3.266357421875, -2.5146484375, -1.762939453125, -1.01123046875, -0.259521484375, 0.4921875, 1.243896484375, 1.99560546875, 2.747314453125, 3.4990234375, 4.250732421875, 5.00244140625, 5.754150390625, 6.505859375, 7.257568359375, 8.00927734375, 8.760986328125, 9.5126953125, 10.264404296875, 11.01611328125, 11.767822265625, 12.51953125, 13.271240234375, 14.02294921875, 14.774658203125, 15.5263671875, 16.278076171875, 17.02978515625, 17.781494140625, 18.533203125, 19.284912109375, 20.03662109375, 20.788330078125, 21.5400390625, 22.291748046875, 23.04345703125, 23.795166015625, 24.546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 8.0, 11.0, 19.0, 17.0, 27.0, 30.0, 28.0, 45.0, 54.0, 67.0, 55.0, 74.0, 70.0, 66.0, 56.0, 57.0, 66.0, 44.0, 39.0, 37.0, 26.0, 22.0, 14.0, 13.0, 7.0, 10.0, 5.0, 8.0, 8.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9886627197265625, -0.949005126953125, -0.9093475341796875, -0.86968994140625, -0.8300323486328125, -0.790374755859375, -0.7507171630859375, -0.7110595703125, -0.6714019775390625, -0.631744384765625, -0.5920867919921875, -0.55242919921875, -0.5127716064453125, -0.473114013671875, -0.4334564208984375, -0.393798828125, -0.3541412353515625, -0.314483642578125, -0.2748260498046875, -0.23516845703125, -0.1955108642578125, -0.155853271484375, -0.1161956787109375, -0.0765380859375, -0.0368804931640625, 0.002777099609375, 0.0424346923828125, 0.08209228515625, 0.1217498779296875, 0.161407470703125, 0.2010650634765625, 0.24072265625, 0.2803802490234375, 0.320037841796875, 0.3596954345703125, 0.39935302734375, 0.4390106201171875, 0.478668212890625, 0.5183258056640625, 0.5579833984375, 0.5976409912109375, 0.637298583984375, 0.6769561767578125, 0.71661376953125, 0.7562713623046875, 0.795928955078125, 0.8355865478515625, 0.875244140625, 0.9149017333984375, 0.954559326171875, 0.9942169189453125, 1.03387451171875, 1.0735321044921875, 1.113189697265625, 1.1528472900390625, 1.1925048828125, 1.2321624755859375, 1.271820068359375, 1.3114776611328125, 1.35113525390625, 1.3907928466796875, 1.430450439453125, 1.4701080322265625, 1.509765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 13.0, 24.0, 27.0, 48.0, 57.0, 80.0, 135.0, 201.0, 305.0, 535.0, 891.0, 1513.0, 2807.0, 5225.0, 10036.0, 20916.0, 44031.0, 100203.0, 256582.0, 1094945.0, 2180721.0, 278093.0, 106710.0, 46070.0, 21353.0, 10510.0, 5333.0, 2782.0, 1620.0, 930.0, 574.0, 370.0, 235.0, 132.0, 88.0, 54.0, 27.0, 23.0, 17.0, 17.0, 17.0, 12.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.8828125, -14.432373046875, -13.98193359375, -13.531494140625, -13.0810546875, -12.630615234375, -12.18017578125, -11.729736328125, -11.279296875, -10.828857421875, -10.37841796875, -9.927978515625, -9.4775390625, -9.027099609375, -8.57666015625, -8.126220703125, -7.67578125, -7.225341796875, -6.77490234375, -6.324462890625, -5.8740234375, -5.423583984375, -4.97314453125, -4.522705078125, -4.072265625, -3.621826171875, -3.17138671875, -2.720947265625, -2.2705078125, -1.820068359375, -1.36962890625, -0.919189453125, -0.46875, -0.018310546875, 0.43212890625, 0.882568359375, 1.3330078125, 1.783447265625, 2.23388671875, 2.684326171875, 3.134765625, 3.585205078125, 4.03564453125, 4.486083984375, 4.9365234375, 5.386962890625, 5.83740234375, 6.287841796875, 6.73828125, 7.188720703125, 7.63916015625, 8.089599609375, 8.5400390625, 8.990478515625, 9.44091796875, 9.891357421875, 10.341796875, 10.792236328125, 11.24267578125, 11.693115234375, 12.1435546875, 12.593994140625, 13.04443359375, 13.494873046875, 13.9453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 6.0, 7.0, 19.0, 22.0, 28.0, 30.0, 45.0, 57.0, 65.0, 66.0, 107.0, 119.0, 153.0, 267.0, 557.0, 1416.0, 326.0, 184.0, 156.0, 107.0, 67.0, 64.0, 44.0, 46.0, 29.0, 23.0, 16.0, 12.0, 6.0, 1.0, 6.0, 1.0, 7.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.12109375, -3.026947021484375, -2.93280029296875, -2.838653564453125, -2.7445068359375, -2.650360107421875, -2.55621337890625, -2.462066650390625, -2.367919921875, -2.273773193359375, -2.17962646484375, -2.085479736328125, -1.9913330078125, -1.897186279296875, -1.80303955078125, -1.708892822265625, -1.61474609375, -1.520599365234375, -1.42645263671875, -1.332305908203125, -1.2381591796875, -1.144012451171875, -1.04986572265625, -0.955718994140625, -0.861572265625, -0.767425537109375, -0.67327880859375, -0.579132080078125, -0.4849853515625, -0.390838623046875, -0.29669189453125, -0.202545166015625, -0.1083984375, -0.014251708984375, 0.07989501953125, 0.174041748046875, 0.2681884765625, 0.362335205078125, 0.45648193359375, 0.550628662109375, 0.644775390625, 0.738922119140625, 0.83306884765625, 0.927215576171875, 1.0213623046875, 1.115509033203125, 1.20965576171875, 1.303802490234375, 1.39794921875, 1.492095947265625, 1.58624267578125, 1.680389404296875, 1.7745361328125, 1.868682861328125, 1.96282958984375, 2.056976318359375, 2.151123046875, 2.245269775390625, 2.33941650390625, 2.433563232421875, 2.5277099609375, 2.621856689453125, 2.71600341796875, 2.810150146484375, 2.904296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 3.0, 6.0, 10.0, 10.0, 6.0, 25.0, 21.0, 47.0, 67.0, 96.0, 120.0, 139.0, 113.0, 95.0, 78.0, 46.0, 39.0, 24.0, 11.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.469757080078125, -22.664220809936523, -21.858684539794922, -21.05314826965332, -20.24761199951172, -19.442075729370117, -18.636539459228516, -17.831003189086914, -17.025466918945312, -16.21993064880371, -15.41439437866211, -14.608858108520508, -13.803321838378906, -12.997785568237305, -12.192249298095703, -11.386713027954102, -10.581177711486816, -9.775641441345215, -8.970105171203613, -8.164568901062012, -7.35903263092041, -6.553496837615967, -5.747960567474365, -4.942424297332764, -4.136888027191162, -3.3313517570495605, -2.525815486907959, -1.7202794551849365, -0.914743185043335, -0.1092071533203125, 0.6963291168212891, 1.5018653869628906, 2.307401657104492, 3.1129379272460938, 3.9184741973876953, 4.724010467529297, 5.529546737670898, 6.335082530975342, 7.140618801116943, 7.946155071258545, 8.751691818237305, 9.557228088378906, 10.362764358520508, 11.16830062866211, 11.973836898803711, 12.779373168945312, 13.584909439086914, 14.390445709228516, 15.1959810256958, 16.001516342163086, 16.807052612304688, 17.61258888244629, 18.41812515258789, 19.223661422729492, 20.029197692871094, 20.834733963012695, 21.640270233154297, 22.4458065032959, 23.2513427734375, 24.0568790435791, 24.862415313720703, 25.667951583862305, 26.473487854003906, 27.279024124145508, 28.08456039428711]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 11.0, 10.0, 22.0, 26.0, 28.0, 20.0, 33.0, 26.0, 45.0, 45.0, 52.0, 43.0, 67.0, 47.0, 52.0, 68.0, 52.0, 49.0, 41.0, 46.0, 33.0, 23.0, 29.0, 29.0, 16.0, 11.0, 9.0, 7.0, 11.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.70572566986084, -13.225020408630371, -12.744315147399902, -12.263609886169434, -11.782905578613281, -11.302200317382812, -10.821495056152344, -10.340789794921875, -9.860084533691406, -9.379379272460938, -8.898674011230469, -8.41796875, -7.9372639656066895, -7.456558704376221, -6.97585391998291, -6.495148658752441, -6.014443397521973, -5.533738136291504, -5.053032875061035, -4.572328090667725, -4.091622829437256, -3.610917568206787, -3.1302125453948975, -2.649507522583008, -2.168802261352539, -1.6880971193313599, -1.2073919773101807, -0.7266868352890015, -0.24598169326782227, 0.23472356796264648, 0.7154285907745361, 1.1961336135864258, 1.6768379211425781, 2.157543182373047, 2.6382482051849365, 3.118953227996826, 3.599658489227295, 4.080363750457764, 4.561068534851074, 5.041773796081543, 5.522479057312012, 6.0031843185424805, 6.483889579772949, 6.96459436416626, 7.4452996253967285, 7.926004886627197, 8.406709671020508, 8.887414932250977, 9.368120193481445, 9.848825454711914, 10.329530715942383, 10.810235977172852, 11.29094123840332, 11.771646499633789, 12.252350807189941, 12.73305606842041, 13.213761329650879, 13.694466590881348, 14.175171852111816, 14.655877113342285, 15.136581420898438, 15.617286682128906, 16.097991943359375, 16.578697204589844, 17.059402465820312]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 6.0, 9.0, 6.0, 8.0, 30.0, 37.0, 49.0, 94.0, 120.0, 229.0, 383.0, 678.0, 1350.0, 2630.0, 5040.0, 11658.0, 30493.0, 110833.0, 552842.0, 246600.0, 52898.0, 17690.0, 7391.0, 3464.0, 1811.0, 928.0, 521.0, 282.0, 177.0, 100.0, 56.0, 53.0, 19.0, 17.0, 12.0, 10.0, 5.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.734375, -21.090087890625, -20.44580078125, -19.801513671875, -19.1572265625, -18.512939453125, -17.86865234375, -17.224365234375, -16.580078125, -15.935791015625, -15.29150390625, -14.647216796875, -14.0029296875, -13.358642578125, -12.71435546875, -12.070068359375, -11.42578125, -10.781494140625, -10.13720703125, -9.492919921875, -8.8486328125, -8.204345703125, -7.56005859375, -6.915771484375, -6.271484375, -5.627197265625, -4.98291015625, -4.338623046875, -3.6943359375, -3.050048828125, -2.40576171875, -1.761474609375, -1.1171875, -0.472900390625, 0.17138671875, 0.815673828125, 1.4599609375, 2.104248046875, 2.74853515625, 3.392822265625, 4.037109375, 4.681396484375, 5.32568359375, 5.969970703125, 6.6142578125, 7.258544921875, 7.90283203125, 8.547119140625, 9.19140625, 9.835693359375, 10.47998046875, 11.124267578125, 11.7685546875, 12.412841796875, 13.05712890625, 13.701416015625, 14.345703125, 14.989990234375, 15.63427734375, 16.278564453125, 16.9228515625, 17.567138671875, 18.21142578125, 18.855712890625, 19.5]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 9.0, 14.0, 13.0, 25.0, 25.0, 23.0, 40.0, 35.0, 51.0, 51.0, 45.0, 51.0, 61.0, 39.0, 53.0, 59.0, 59.0, 52.0, 39.0, 40.0, 44.0, 25.0, 23.0, 19.0, 14.0, 10.0, 15.0, 13.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2275390625, -1.1898345947265625, -1.152130126953125, -1.1144256591796875, -1.07672119140625, -1.0390167236328125, -1.001312255859375, -0.9636077880859375, -0.9259033203125, -0.8881988525390625, -0.850494384765625, -0.8127899169921875, -0.77508544921875, -0.7373809814453125, -0.699676513671875, -0.6619720458984375, -0.624267578125, -0.5865631103515625, -0.548858642578125, -0.5111541748046875, -0.47344970703125, -0.4357452392578125, -0.398040771484375, -0.3603363037109375, -0.3226318359375, -0.2849273681640625, -0.247222900390625, -0.2095184326171875, -0.17181396484375, -0.1341094970703125, -0.096405029296875, -0.0587005615234375, -0.02099609375, 0.0167083740234375, 0.054412841796875, 0.0921173095703125, 0.12982177734375, 0.1675262451171875, 0.205230712890625, 0.2429351806640625, 0.2806396484375, 0.3183441162109375, 0.356048583984375, 0.3937530517578125, 0.43145751953125, 0.4691619873046875, 0.506866455078125, 0.5445709228515625, 0.582275390625, 0.6199798583984375, 0.657684326171875, 0.6953887939453125, 0.73309326171875, 0.7707977294921875, 0.808502197265625, 0.8462066650390625, 0.8839111328125, 0.9216156005859375, 0.959320068359375, 0.9970245361328125, 1.03472900390625, 1.0724334716796875, 1.110137939453125, 1.1478424072265625, 1.185546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 9.0, 4.0, 11.0, 26.0, 47.0, 290.0, 3531.0, 504185.0, 536521.0, 3451.0, 281.0, 44.0, 15.0, 14.0, 10.0, 13.0, 7.0, 5.0, 6.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.3125, -59.123046875, -56.93359375, -54.744140625, -52.5546875, -50.365234375, -48.17578125, -45.986328125, -43.796875, -41.607421875, -39.41796875, -37.228515625, -35.0390625, -32.849609375, -30.66015625, -28.470703125, -26.28125, -24.091796875, -21.90234375, -19.712890625, -17.5234375, -15.333984375, -13.14453125, -10.955078125, -8.765625, -6.576171875, -4.38671875, -2.197265625, -0.0078125, 2.181640625, 4.37109375, 6.560546875, 8.75, 10.939453125, 13.12890625, 15.318359375, 17.5078125, 19.697265625, 21.88671875, 24.076171875, 26.265625, 28.455078125, 30.64453125, 32.833984375, 35.0234375, 37.212890625, 39.40234375, 41.591796875, 43.78125, 45.970703125, 48.16015625, 50.349609375, 52.5390625, 54.728515625, 56.91796875, 59.107421875, 61.296875, 63.486328125, 65.67578125, 67.865234375, 70.0546875, 72.244140625, 74.43359375, 76.623046875, 78.8125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 5.0, 10.0, 2.0, 9.0, 7.0, 17.0, 13.0, 18.0, 20.0, 23.0, 23.0, 24.0, 31.0, 46.0, 38.0, 31.0, 47.0, 32.0, 40.0, 36.0, 48.0, 45.0, 48.0, 44.0, 38.0, 43.0, 37.0, 29.0, 27.0, 34.0, 18.0, 22.0, 10.0, 13.0, 14.0, 12.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.28094482421875, -5.1165771484375, -4.95220947265625, -4.787841796875, -4.62347412109375, -4.4591064453125, -4.29473876953125, -4.13037109375, -3.96600341796875, -3.8016357421875, -3.63726806640625, -3.472900390625, -3.30853271484375, -3.1441650390625, -2.97979736328125, -2.8154296875, -2.65106201171875, -2.4866943359375, -2.32232666015625, -2.157958984375, -1.99359130859375, -1.8292236328125, -1.66485595703125, -1.50048828125, -1.33612060546875, -1.1717529296875, -1.00738525390625, -0.843017578125, -0.67864990234375, -0.5142822265625, -0.34991455078125, -0.185546875, -0.02117919921875, 0.1431884765625, 0.30755615234375, 0.471923828125, 0.63629150390625, 0.8006591796875, 0.96502685546875, 1.12939453125, 1.29376220703125, 1.4581298828125, 1.62249755859375, 1.786865234375, 1.95123291015625, 2.1156005859375, 2.27996826171875, 2.4443359375, 2.60870361328125, 2.7730712890625, 2.93743896484375, 3.101806640625, 3.26617431640625, 3.4305419921875, 3.59490966796875, 3.75927734375, 3.92364501953125, 4.0880126953125, 4.25238037109375, 4.416748046875, 4.58111572265625, 4.7454833984375, 4.90985107421875, 5.07421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 4.0, 4.0, 0.0, 5.0, 11.0, 7.0, 11.0, 10.0, 13.0, 37.0, 122.0, 514.0, 14516.0, 1029814.0, 3027.0, 286.0, 74.0, 22.0, 20.0, 12.0, 5.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.4873046875, -100.287109375, -97.0869140625, -93.88671875, -90.6865234375, -87.486328125, -84.2861328125, -81.0859375, -77.8857421875, -74.685546875, -71.4853515625, -68.28515625, -65.0849609375, -61.884765625, -58.6845703125, -55.484375, -52.2841796875, -49.083984375, -45.8837890625, -42.68359375, -39.4833984375, -36.283203125, -33.0830078125, -29.8828125, -26.6826171875, -23.482421875, -20.2822265625, -17.08203125, -13.8818359375, -10.681640625, -7.4814453125, -4.28125, -1.0810546875, 2.119140625, 5.3193359375, 8.51953125, 11.7197265625, 14.919921875, 18.1201171875, 21.3203125, 24.5205078125, 27.720703125, 30.9208984375, 34.12109375, 37.3212890625, 40.521484375, 43.7216796875, 46.921875, 50.1220703125, 53.322265625, 56.5224609375, 59.72265625, 62.9228515625, 66.123046875, 69.3232421875, 72.5234375, 75.7236328125, 78.923828125, 82.1240234375, 85.32421875, 88.5244140625, 91.724609375, 94.9248046875, 98.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 10.0, 14.0, 33.0, 34.0, 64.0, 105.0, 172.0, 173.0, 145.0, 81.0, 55.0, 36.0, 19.0, 8.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010538101196289062, -0.0010282471776008606, -0.001002684235572815, -0.0009771212935447693, -0.0009515583515167236, -0.000925995409488678, -0.0009004324674606323, -0.0008748695254325867, -0.000849306583404541, -0.0008237436413764954, -0.0007981806993484497, -0.000772617757320404, -0.0007470548152923584, -0.0007214918732643127, -0.0006959289312362671, -0.0006703659892082214, -0.0006448030471801758, -0.0006192401051521301, -0.0005936771631240845, -0.0005681142210960388, -0.0005425512790679932, -0.0005169883370399475, -0.0004914253950119019, -0.0004658624529838562, -0.00044029951095581055, -0.0004147365689277649, -0.00038917362689971924, -0.0003636106848716736, -0.00033804774284362793, -0.0003124848008155823, -0.0002869218587875366, -0.00026135891675949097, -0.0002357959747314453, -0.00021023303270339966, -0.000184670090675354, -0.00015910714864730835, -0.0001335442066192627, -0.00010798126459121704, -8.241832256317139e-05, -5.685538053512573e-05, -3.129243850708008e-05, -5.729496479034424e-06, 1.983344554901123e-05, 4.5396387577056885e-05, 7.095932960510254e-05, 9.65222716331482e-05, 0.00012208521366119385, 0.0001476481556892395, 0.00017321109771728516, 0.0001987740397453308, 0.00022433698177337646, 0.0002498999238014221, 0.0002754628658294678, 0.00030102580785751343, 0.0003265887498855591, 0.00035215169191360474, 0.0003777146339416504, 0.00040327757596969604, 0.0004288405179977417, 0.00045440346002578735, 0.000479966402053833, 0.0005055293440818787, 0.0005310922861099243, 0.00055665522813797, 0.0005822181701660156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 2.0, 3.0, 6.0, 13.0, 9.0, 22.0, 36.0, 62.0, 83.0, 111.0, 196.0, 349.0, 557.0, 1004.0, 2134.0, 5179.0, 16617.0, 143552.0, 807262.0, 54095.0, 10036.0, 3595.0, 1627.0, 833.0, 455.0, 276.0, 150.0, 100.0, 63.0, 43.0, 33.0, 16.0, 12.0, 10.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34375, -34.21533203125, -33.0869140625, -31.95849609375, -30.830078125, -29.70166015625, -28.5732421875, -27.44482421875, -26.31640625, -25.18798828125, -24.0595703125, -22.93115234375, -21.802734375, -20.67431640625, -19.5458984375, -18.41748046875, -17.2890625, -16.16064453125, -15.0322265625, -13.90380859375, -12.775390625, -11.64697265625, -10.5185546875, -9.39013671875, -8.26171875, -7.13330078125, -6.0048828125, -4.87646484375, -3.748046875, -2.61962890625, -1.4912109375, -0.36279296875, 0.765625, 1.89404296875, 3.0224609375, 4.15087890625, 5.279296875, 6.40771484375, 7.5361328125, 8.66455078125, 9.79296875, 10.92138671875, 12.0498046875, 13.17822265625, 14.306640625, 15.43505859375, 16.5634765625, 17.69189453125, 18.8203125, 19.94873046875, 21.0771484375, 22.20556640625, 23.333984375, 24.46240234375, 25.5908203125, 26.71923828125, 27.84765625, 28.97607421875, 30.1044921875, 31.23291015625, 32.361328125, 33.48974609375, 34.6181640625, 35.74658203125, 36.875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 10.0, 9.0, 11.0, 9.0, 22.0, 27.0, 28.0, 29.0, 56.0, 72.0, 92.0, 142.0, 89.0, 92.0, 64.0, 62.0, 46.0, 33.0, 24.0, 17.0, 13.0, 16.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.47772216796875, -9.2210693359375, -8.96441650390625, -8.707763671875, -8.45111083984375, -8.1944580078125, -7.93780517578125, -7.68115234375, -7.42449951171875, -7.1678466796875, -6.91119384765625, -6.654541015625, -6.39788818359375, -6.1412353515625, -5.88458251953125, -5.6279296875, -5.37127685546875, -5.1146240234375, -4.85797119140625, -4.601318359375, -4.34466552734375, -4.0880126953125, -3.83135986328125, -3.57470703125, -3.31805419921875, -3.0614013671875, -2.80474853515625, -2.548095703125, -2.29144287109375, -2.0347900390625, -1.77813720703125, -1.521484375, -1.26483154296875, -1.0081787109375, -0.75152587890625, -0.494873046875, -0.23822021484375, 0.0184326171875, 0.27508544921875, 0.53173828125, 0.78839111328125, 1.0450439453125, 1.30169677734375, 1.558349609375, 1.81500244140625, 2.0716552734375, 2.32830810546875, 2.5849609375, 2.84161376953125, 3.0982666015625, 3.35491943359375, 3.611572265625, 3.86822509765625, 4.1248779296875, 4.38153076171875, 4.63818359375, 4.89483642578125, 5.1514892578125, 5.40814208984375, 5.664794921875, 5.92144775390625, 6.1781005859375, 6.43475341796875, 6.69140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 20.0, 36.0, 62.0, 119.0, 166.0, 172.0, 178.0, 94.0, 61.0, 30.0, 18.0, 13.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.8785400390625, -99.69815063476562, -96.51775360107422, -93.33736419677734, -90.15696716308594, -86.97657775878906, -83.79618835449219, -80.61579895019531, -77.4354019165039, -74.25501251220703, -71.07461547851562, -67.89422607421875, -64.71383666992188, -61.53343963623047, -58.353050231933594, -55.17265701293945, -51.99226379394531, -48.81187057495117, -45.63147735595703, -42.451087951660156, -39.270694732666016, -36.090301513671875, -32.909912109375, -29.72951889038086, -26.54912567138672, -23.368732452392578, -20.18834114074707, -17.007949829101562, -13.827556610107422, -10.647164344787598, -7.466772079467773, -4.286380767822266, -1.105987548828125, 2.074404716491699, 5.254796981811523, 8.435189247131348, 11.615581512451172, 14.795973777770996, 17.97636604309082, 21.156757354736328, 24.33715057373047, 27.51754379272461, 30.697935104370117, 33.878326416015625, 37.058719635009766, 40.239112854003906, 43.41950225830078, 46.59989547729492, 49.78028869628906, 52.9606819152832, 56.141075134277344, 59.32146453857422, 62.50185775756836, 65.6822509765625, 68.86264038085938, 72.04302978515625, 75.22342681884766, 78.40381622314453, 81.58421325683594, 84.76460266113281, 87.94499206542969, 91.1253890991211, 94.30577850341797, 97.48617553710938, 100.66656494140625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 6.0, 4.0, 8.0, 10.0, 18.0, 10.0, 8.0, 16.0, 20.0, 20.0, 30.0, 35.0, 42.0, 45.0, 41.0, 52.0, 49.0, 62.0, 60.0, 58.0, 60.0, 40.0, 34.0, 32.0, 41.0, 30.0, 26.0, 27.0, 22.0, 21.0, 11.0, 13.0, 8.0, 9.0, 4.0, 10.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.935176849365234, -40.591121673583984, -39.247066497802734, -37.903011322021484, -36.558956146240234, -35.21490478515625, -33.870849609375, -32.52679443359375, -31.1827392578125, -29.83868408203125, -28.49462890625, -27.15057373046875, -25.806520462036133, -24.462465286254883, -23.118410110473633, -21.774356842041016, -20.430299758911133, -19.086244583129883, -17.742189407348633, -16.398136138916016, -15.054080963134766, -13.710025787353516, -12.365970611572266, -11.021916389465332, -9.677861213684082, -8.333806037902832, -6.989751815795898, -5.645696640014648, -4.301641941070557, -2.957587242126465, -1.6135320663452148, -0.26947784423828125, 1.0745773315429688, 2.4186320304870605, 3.7626869678497314, 5.106741905212402, 6.450796604156494, 7.794851303100586, 9.138906478881836, 10.48296070098877, 11.82701587677002, 13.17107105255127, 14.515125274658203, 15.859180450439453, 17.203235626220703, 18.547290802001953, 19.891345977783203, 21.23539924621582, 22.57945442199707, 23.92350959777832, 25.26756477355957, 26.611618041992188, 27.955673217773438, 29.299728393554688, 30.643783569335938, 31.987838745117188, 33.33189392089844, 34.67594909667969, 36.02000427246094, 37.36405944824219, 38.70811462402344, 40.05216979980469, 41.39622497558594, 42.74027633666992, 44.08433151245117]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 9.0, 11.0, 14.0, 15.0, 25.0, 44.0, 52.0, 77.0, 134.0, 182.0, 280.0, 472.0, 870.0, 1637.0, 3189.0, 7330.0, 18273.0, 60448.0, 408501.0, 3539880.0, 105648.0, 28027.0, 10079.0, 4295.0, 2085.0, 1125.0, 647.0, 372.0, 198.0, 141.0, 67.0, 38.0, 27.0, 21.0, 16.0, 11.0, 7.0, 0.0, 2.0, 5.0], "bins": [-48.3125, -47.19384765625, -46.0751953125, -44.95654296875, -43.837890625, -42.71923828125, -41.6005859375, -40.48193359375, -39.36328125, -38.24462890625, -37.1259765625, -36.00732421875, -34.888671875, -33.77001953125, -32.6513671875, -31.53271484375, -30.4140625, -29.29541015625, -28.1767578125, -27.05810546875, -25.939453125, -24.82080078125, -23.7021484375, -22.58349609375, -21.46484375, -20.34619140625, -19.2275390625, -18.10888671875, -16.990234375, -15.87158203125, -14.7529296875, -13.63427734375, -12.515625, -11.39697265625, -10.2783203125, -9.15966796875, -8.041015625, -6.92236328125, -5.8037109375, -4.68505859375, -3.56640625, -2.44775390625, -1.3291015625, -0.21044921875, 0.908203125, 2.02685546875, 3.1455078125, 4.26416015625, 5.3828125, 6.50146484375, 7.6201171875, 8.73876953125, 9.857421875, 10.97607421875, 12.0947265625, 13.21337890625, 14.33203125, 15.45068359375, 16.5693359375, 17.68798828125, 18.806640625, 19.92529296875, 21.0439453125, 22.16259765625, 23.28125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 13.0, 10.0, 14.0, 18.0, 24.0, 30.0, 43.0, 42.0, 34.0, 39.0, 41.0, 44.0, 44.0, 37.0, 48.0, 53.0, 55.0, 53.0, 53.0, 43.0, 26.0, 29.0, 29.0, 31.0, 16.0, 22.0, 19.0, 13.0, 8.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.04296875, -1.0087890625, -0.974609375, -0.9404296875, -0.90625, -0.8720703125, -0.837890625, -0.8037109375, -0.76953125, -0.7353515625, -0.701171875, -0.6669921875, -0.6328125, -0.5986328125, -0.564453125, -0.5302734375, -0.49609375, -0.4619140625, -0.427734375, -0.3935546875, -0.359375, -0.3251953125, -0.291015625, -0.2568359375, -0.22265625, -0.1884765625, -0.154296875, -0.1201171875, -0.0859375, -0.0517578125, -0.017578125, 0.0166015625, 0.05078125, 0.0849609375, 0.119140625, 0.1533203125, 0.1875, 0.2216796875, 0.255859375, 0.2900390625, 0.32421875, 0.3583984375, 0.392578125, 0.4267578125, 0.4609375, 0.4951171875, 0.529296875, 0.5634765625, 0.59765625, 0.6318359375, 0.666015625, 0.7001953125, 0.734375, 0.7685546875, 0.802734375, 0.8369140625, 0.87109375, 0.9052734375, 0.939453125, 0.9736328125, 1.0078125, 1.0419921875, 1.076171875, 1.1103515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 19.0, 15.0, 32.0, 38.0, 55.0, 94.0, 197.0, 1091.0, 27140.0, 4054593.0, 108060.0, 2324.0, 302.0, 107.0, 55.0, 46.0, 27.0, 21.0, 25.0, 12.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.625, -141.5400390625, -137.455078125, -133.3701171875, -129.28515625, -125.2001953125, -121.115234375, -117.0302734375, -112.9453125, -108.8603515625, -104.775390625, -100.6904296875, -96.60546875, -92.5205078125, -88.435546875, -84.3505859375, -80.265625, -76.1806640625, -72.095703125, -68.0107421875, -63.92578125, -59.8408203125, -55.755859375, -51.6708984375, -47.5859375, -43.5009765625, -39.416015625, -35.3310546875, -31.24609375, -27.1611328125, -23.076171875, -18.9912109375, -14.90625, -10.8212890625, -6.736328125, -2.6513671875, 1.43359375, 5.5185546875, 9.603515625, 13.6884765625, 17.7734375, 21.8583984375, 25.943359375, 30.0283203125, 34.11328125, 38.1982421875, 42.283203125, 46.3681640625, 50.453125, 54.5380859375, 58.623046875, 62.7080078125, 66.79296875, 70.8779296875, 74.962890625, 79.0478515625, 83.1328125, 87.2177734375, 91.302734375, 95.3876953125, 99.47265625, 103.5576171875, 107.642578125, 111.7275390625, 115.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 16.0, 15.0, 12.0, 12.0, 27.0, 43.0, 40.0, 55.0, 68.0, 107.0, 152.0, 297.0, 1835.0, 572.0, 225.0, 149.0, 104.0, 75.0, 56.0, 35.0, 38.0, 28.0, 25.0, 15.0, 11.0, 6.0, 5.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.919677734375, -3.80029296875, -3.680908203125, -3.5615234375, -3.442138671875, -3.32275390625, -3.203369140625, -3.083984375, -2.964599609375, -2.84521484375, -2.725830078125, -2.6064453125, -2.487060546875, -2.36767578125, -2.248291015625, -2.12890625, -2.009521484375, -1.89013671875, -1.770751953125, -1.6513671875, -1.531982421875, -1.41259765625, -1.293212890625, -1.173828125, -1.054443359375, -0.93505859375, -0.815673828125, -0.6962890625, -0.576904296875, -0.45751953125, -0.338134765625, -0.21875, -0.099365234375, 0.02001953125, 0.139404296875, 0.2587890625, 0.378173828125, 0.49755859375, 0.616943359375, 0.736328125, 0.855712890625, 0.97509765625, 1.094482421875, 1.2138671875, 1.333251953125, 1.45263671875, 1.572021484375, 1.69140625, 1.810791015625, 1.93017578125, 2.049560546875, 2.1689453125, 2.288330078125, 2.40771484375, 2.527099609375, 2.646484375, 2.765869140625, 2.88525390625, 3.004638671875, 3.1240234375, 3.243408203125, 3.36279296875, 3.482177734375, 3.6015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 33.0, 94.0, 219.0, 252.0, 230.0, 97.0, 39.0, 19.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.35034942626953, -114.00067901611328, -111.65100860595703, -109.30133819580078, -106.95167541503906, -104.60200500488281, -102.25233459472656, -99.90266418457031, -97.55299377441406, -95.20332336425781, -92.85365295410156, -90.50398254394531, -88.15431213378906, -85.80464935302734, -83.4549789428711, -81.10530853271484, -78.7556381225586, -76.40596771240234, -74.0562973022461, -71.70662689208984, -69.35696411132812, -67.00729370117188, -64.65762329101562, -62.307952880859375, -59.958282470703125, -57.608612060546875, -55.258941650390625, -52.90927505493164, -50.55960464477539, -48.20993423461914, -45.860267639160156, -43.510597229003906, -41.16092300415039, -38.81125259399414, -36.461585998535156, -34.111915588378906, -31.762245178222656, -29.412574768066406, -27.06290626525879, -24.713237762451172, -22.363567352294922, -20.013896942138672, -17.664228439331055, -15.314558982849121, -12.964889526367188, -10.615220069885254, -8.26555061340332, -5.915882110595703, -3.566211700439453, -1.2165422439575195, 1.133127212524414, 3.4827966690063477, 5.832466125488281, 8.182135581970215, 10.531805038452148, 12.881473541259766, 15.231143951416016, 17.580814361572266, 19.930482864379883, 22.2801513671875, 24.62982177734375, 26.9794921875, 29.329160690307617, 31.678829193115234, 34.028499603271484]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 9.0, 7.0, 6.0, 13.0, 12.0, 18.0, 14.0, 20.0, 26.0, 20.0, 39.0, 40.0, 41.0, 46.0, 47.0, 59.0, 48.0, 59.0, 48.0, 56.0, 49.0, 49.0, 35.0, 44.0, 34.0, 33.0, 34.0, 13.0, 21.0, 12.0, 17.0, 6.0, 6.0, 4.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.313941955566406, -19.796260833740234, -19.278579711914062, -18.76089859008789, -18.24321746826172, -17.72553825378418, -17.207857131958008, -16.690176010131836, -16.172494888305664, -15.654813766479492, -15.13713264465332, -14.619452476501465, -14.101771354675293, -13.584090232849121, -13.066410064697266, -12.548728942871094, -12.031047821044922, -11.51336669921875, -10.995685577392578, -10.478005409240723, -9.96032428741455, -9.442643165588379, -8.924962997436523, -8.407281875610352, -7.88960075378418, -7.371919631958008, -6.854238986968994, -6.3365583419799805, -5.818877220153809, -5.301196098327637, -4.783515453338623, -4.265834808349609, -3.7481517791748047, -3.230470895767212, -2.712790012359619, -2.1951091289520264, -1.6774282455444336, -1.1597473621368408, -0.642066478729248, -0.12438559532165527, 0.3932952880859375, 0.9109761714935303, 1.428657054901123, 1.9463379383087158, 2.4640188217163086, 2.9816997051239014, 3.499380588531494, 4.017061233520508, 4.53474235534668, 5.052423477172852, 5.570104122161865, 6.087784767150879, 6.605465888977051, 7.123147010803223, 7.640827655792236, 8.15850830078125, 8.676189422607422, 9.193870544433594, 9.711551666259766, 10.229231834411621, 10.746912956237793, 11.264594078063965, 11.78227424621582, 12.299955368041992, 12.817636489868164]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 9.0, 6.0, 12.0, 15.0, 27.0, 36.0, 45.0, 74.0, 122.0, 201.0, 399.0, 772.0, 1826.0, 4183.0, 10409.0, 27349.0, 72314.0, 181080.0, 328241.0, 247460.0, 106891.0, 40813.0, 15424.0, 5996.0, 2545.0, 1136.0, 510.0, 260.0, 136.0, 81.0, 51.0, 31.0, 18.0, 24.0, 18.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.9954833984375, -15.490966796875, -14.9864501953125, -14.48193359375, -13.9774169921875, -13.472900390625, -12.9683837890625, -12.4638671875, -11.9593505859375, -11.454833984375, -10.9503173828125, -10.44580078125, -9.9412841796875, -9.436767578125, -8.9322509765625, -8.427734375, -7.9232177734375, -7.418701171875, -6.9141845703125, -6.40966796875, -5.9051513671875, -5.400634765625, -4.8961181640625, -4.3916015625, -3.8870849609375, -3.382568359375, -2.8780517578125, -2.37353515625, -1.8690185546875, -1.364501953125, -0.8599853515625, -0.35546875, 0.1490478515625, 0.653564453125, 1.1580810546875, 1.66259765625, 2.1671142578125, 2.671630859375, 3.1761474609375, 3.6806640625, 4.1851806640625, 4.689697265625, 5.1942138671875, 5.69873046875, 6.2032470703125, 6.707763671875, 7.2122802734375, 7.716796875, 8.2213134765625, 8.725830078125, 9.2303466796875, 9.73486328125, 10.2393798828125, 10.743896484375, 11.2484130859375, 11.7529296875, 12.2574462890625, 12.761962890625, 13.2664794921875, 13.77099609375, 14.2755126953125, 14.780029296875, 15.2845458984375, 15.7890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 19.0, 22.0, 26.0, 34.0, 42.0, 40.0, 47.0, 60.0, 58.0, 78.0, 72.0, 64.0, 66.0, 70.0, 50.0, 43.0, 36.0, 33.0, 28.0, 24.0, 20.0, 8.0, 13.0, 6.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9848175048828125, -0.937408447265625, -0.8899993896484375, -0.84259033203125, -0.7951812744140625, -0.747772216796875, -0.7003631591796875, -0.6529541015625, -0.6055450439453125, -0.558135986328125, -0.5107269287109375, -0.46331787109375, -0.4159088134765625, -0.368499755859375, -0.3210906982421875, -0.273681640625, -0.2262725830078125, -0.178863525390625, -0.1314544677734375, -0.08404541015625, -0.0366363525390625, 0.010772705078125, 0.0581817626953125, 0.1055908203125, 0.1529998779296875, 0.200408935546875, 0.2478179931640625, 0.29522705078125, 0.3426361083984375, 0.390045166015625, 0.4374542236328125, 0.48486328125, 0.5322723388671875, 0.579681396484375, 0.6270904541015625, 0.67449951171875, 0.7219085693359375, 0.769317626953125, 0.8167266845703125, 0.8641357421875, 0.9115447998046875, 0.958953857421875, 1.0063629150390625, 1.05377197265625, 1.1011810302734375, 1.148590087890625, 1.1959991455078125, 1.243408203125, 1.2908172607421875, 1.338226318359375, 1.3856353759765625, 1.43304443359375, 1.4804534912109375, 1.527862548828125, 1.5752716064453125, 1.6226806640625, 1.6700897216796875, 1.717498779296875, 1.7649078369140625, 1.81231689453125, 1.8597259521484375, 1.907135009765625, 1.9545440673828125, 2.001953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 7.0, 7.0, 11.0, 23.0, 22.0, 34.0, 47.0, 66.0, 99.0, 121.0, 176.0, 223.0, 294.0, 465.0, 695.0, 1155.0, 1915.0, 2974.0, 5253.0, 10005.0, 19032.0, 37685.0, 76001.0, 145713.0, 234711.0, 227561.0, 137425.0, 71082.0, 35463.0, 17946.0, 9463.0, 5082.0, 2887.0, 1702.0, 1052.0, 655.0, 459.0, 268.0, 191.0, 150.0, 116.0, 71.0, 73.0, 43.0, 46.0, 22.0, 13.0, 11.0, 13.0, 11.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.703125, -11.3369140625, -10.970703125, -10.6044921875, -10.23828125, -9.8720703125, -9.505859375, -9.1396484375, -8.7734375, -8.4072265625, -8.041015625, -7.6748046875, -7.30859375, -6.9423828125, -6.576171875, -6.2099609375, -5.84375, -5.4775390625, -5.111328125, -4.7451171875, -4.37890625, -4.0126953125, -3.646484375, -3.2802734375, -2.9140625, -2.5478515625, -2.181640625, -1.8154296875, -1.44921875, -1.0830078125, -0.716796875, -0.3505859375, 0.015625, 0.3818359375, 0.748046875, 1.1142578125, 1.48046875, 1.8466796875, 2.212890625, 2.5791015625, 2.9453125, 3.3115234375, 3.677734375, 4.0439453125, 4.41015625, 4.7763671875, 5.142578125, 5.5087890625, 5.875, 6.2412109375, 6.607421875, 6.9736328125, 7.33984375, 7.7060546875, 8.072265625, 8.4384765625, 8.8046875, 9.1708984375, 9.537109375, 9.9033203125, 10.26953125, 10.6357421875, 11.001953125, 11.3681640625, 11.734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 3.0, 10.0, 15.0, 14.0, 16.0, 19.0, 18.0, 17.0, 20.0, 25.0, 34.0, 30.0, 38.0, 28.0, 47.0, 50.0, 44.0, 38.0, 38.0, 38.0, 47.0, 38.0, 39.0, 39.0, 42.0, 31.0, 33.0, 29.0, 19.0, 25.0, 31.0, 14.0, 11.0, 3.0, 11.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.23046875, -7.01580810546875, -6.8011474609375, -6.58648681640625, -6.371826171875, -6.15716552734375, -5.9425048828125, -5.72784423828125, -5.51318359375, -5.29852294921875, -5.0838623046875, -4.86920166015625, -4.654541015625, -4.43988037109375, -4.2252197265625, -4.01055908203125, -3.7958984375, -3.58123779296875, -3.3665771484375, -3.15191650390625, -2.937255859375, -2.72259521484375, -2.5079345703125, -2.29327392578125, -2.07861328125, -1.86395263671875, -1.6492919921875, -1.43463134765625, -1.219970703125, -1.00531005859375, -0.7906494140625, -0.57598876953125, -0.361328125, -0.14666748046875, 0.0679931640625, 0.28265380859375, 0.497314453125, 0.71197509765625, 0.9266357421875, 1.14129638671875, 1.35595703125, 1.57061767578125, 1.7852783203125, 1.99993896484375, 2.214599609375, 2.42926025390625, 2.6439208984375, 2.85858154296875, 3.0732421875, 3.28790283203125, 3.5025634765625, 3.71722412109375, 3.931884765625, 4.14654541015625, 4.3612060546875, 4.57586669921875, 4.79052734375, 5.00518798828125, 5.2198486328125, 5.43450927734375, 5.649169921875, 5.86383056640625, 6.0784912109375, 6.29315185546875, 6.5078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 20.0, 17.0, 41.0, 33.0, 50.0, 101.0, 124.0, 190.0, 265.0, 431.0, 685.0, 1198.0, 2165.0, 4552.0, 9781.0, 23252.0, 64868.0, 184044.0, 358032.0, 249316.0, 91650.0, 32524.0, 12905.0, 5672.0, 2761.0, 1455.0, 886.0, 524.0, 307.0, 197.0, 126.0, 92.0, 71.0, 58.0, 34.0, 26.0, 18.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.140625, -9.8302001953125, -9.519775390625, -9.2093505859375, -8.89892578125, -8.5885009765625, -8.278076171875, -7.9676513671875, -7.6572265625, -7.3468017578125, -7.036376953125, -6.7259521484375, -6.41552734375, -6.1051025390625, -5.794677734375, -5.4842529296875, -5.173828125, -4.8634033203125, -4.552978515625, -4.2425537109375, -3.93212890625, -3.6217041015625, -3.311279296875, -3.0008544921875, -2.6904296875, -2.3800048828125, -2.069580078125, -1.7591552734375, -1.44873046875, -1.1383056640625, -0.827880859375, -0.5174560546875, -0.20703125, 0.1033935546875, 0.413818359375, 0.7242431640625, 1.03466796875, 1.3450927734375, 1.655517578125, 1.9659423828125, 2.2763671875, 2.5867919921875, 2.897216796875, 3.2076416015625, 3.51806640625, 3.8284912109375, 4.138916015625, 4.4493408203125, 4.759765625, 5.0701904296875, 5.380615234375, 5.6910400390625, 6.00146484375, 6.3118896484375, 6.622314453125, 6.9327392578125, 7.2431640625, 7.5535888671875, 7.864013671875, 8.1744384765625, 8.48486328125, 8.7952880859375, 9.105712890625, 9.4161376953125, 9.7265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 8.0, 15.0, 14.0, 16.0, 25.0, 36.0, 41.0, 49.0, 53.0, 64.0, 68.0, 65.0, 80.0, 79.0, 75.0, 45.0, 65.0, 42.0, 28.0, 25.0, 24.0, 13.0, 11.0, 12.0, 6.0, 4.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00141143798828125, -0.0013714134693145752, -0.0013313889503479004, -0.0012913644313812256, -0.0012513399124145508, -0.001211315393447876, -0.0011712908744812012, -0.0011312663555145264, -0.0010912418365478516, -0.0010512173175811768, -0.001011192798614502, -0.0009711682796478271, -0.0009311437606811523, -0.0008911192417144775, -0.0008510947227478027, -0.0008110702037811279, -0.0007710456848144531, -0.0007310211658477783, -0.0006909966468811035, -0.0006509721279144287, -0.0006109476089477539, -0.0005709230899810791, -0.0005308985710144043, -0.0004908740520477295, -0.0004508495330810547, -0.0004108250141143799, -0.0003708004951477051, -0.0003307759761810303, -0.00029075145721435547, -0.00025072693824768066, -0.00021070241928100586, -0.00017067790031433105, -0.00013065338134765625, -9.062886238098145e-05, -5.060434341430664e-05, -1.0579824447631836e-05, 2.944469451904297e-05, 6.946921348571777e-05, 0.00010949373245239258, 0.00014951825141906738, 0.0001895427703857422, 0.000229567289352417, 0.0002695918083190918, 0.0003096163272857666, 0.0003496408462524414, 0.0003896653652191162, 0.000429689884185791, 0.0004697144031524658, 0.0005097389221191406, 0.0005497634410858154, 0.0005897879600524902, 0.000629812479019165, 0.0006698369979858398, 0.0007098615169525146, 0.0007498860359191895, 0.0007899105548858643, 0.0008299350738525391, 0.0008699595928192139, 0.0009099841117858887, 0.0009500086307525635, 0.0009900331497192383, 0.001030057668685913, 0.0010700821876525879, 0.0011101067066192627, 0.0011501312255859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 1.0, 4.0, 7.0, 8.0, 13.0, 15.0, 27.0, 34.0, 45.0, 64.0, 96.0, 155.0, 249.0, 422.0, 665.0, 1121.0, 2201.0, 4000.0, 8237.0, 19262.0, 52741.0, 161113.0, 378570.0, 272310.0, 90992.0, 30996.0, 12442.0, 5902.0, 2900.0, 1625.0, 866.0, 528.0, 329.0, 202.0, 120.0, 103.0, 55.0, 43.0, 21.0, 20.0, 9.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-11.078125, -10.7398681640625, -10.401611328125, -10.0633544921875, -9.72509765625, -9.3868408203125, -9.048583984375, -8.7103271484375, -8.3720703125, -8.0338134765625, -7.695556640625, -7.3572998046875, -7.01904296875, -6.6807861328125, -6.342529296875, -6.0042724609375, -5.666015625, -5.3277587890625, -4.989501953125, -4.6512451171875, -4.31298828125, -3.9747314453125, -3.636474609375, -3.2982177734375, -2.9599609375, -2.6217041015625, -2.283447265625, -1.9451904296875, -1.60693359375, -1.2686767578125, -0.930419921875, -0.5921630859375, -0.25390625, 0.0843505859375, 0.422607421875, 0.7608642578125, 1.09912109375, 1.4373779296875, 1.775634765625, 2.1138916015625, 2.4521484375, 2.7904052734375, 3.128662109375, 3.4669189453125, 3.80517578125, 4.1434326171875, 4.481689453125, 4.8199462890625, 5.158203125, 5.4964599609375, 5.834716796875, 6.1729736328125, 6.51123046875, 6.8494873046875, 7.187744140625, 7.5260009765625, 7.8642578125, 8.2025146484375, 8.540771484375, 8.8790283203125, 9.21728515625, 9.5555419921875, 9.893798828125, 10.2320556640625, 10.5703125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 4.0, 7.0, 10.0, 14.0, 13.0, 20.0, 22.0, 30.0, 22.0, 45.0, 45.0, 57.0, 48.0, 53.0, 64.0, 72.0, 72.0, 60.0, 59.0, 39.0, 42.0, 39.0, 23.0, 31.0, 21.0, 19.0, 9.0, 11.0, 12.0, 6.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.83502197265625, -4.6856689453125, -4.53631591796875, -4.386962890625, -4.23760986328125, -4.0882568359375, -3.93890380859375, -3.78955078125, -3.64019775390625, -3.4908447265625, -3.34149169921875, -3.192138671875, -3.04278564453125, -2.8934326171875, -2.74407958984375, -2.5947265625, -2.44537353515625, -2.2960205078125, -2.14666748046875, -1.997314453125, -1.84796142578125, -1.6986083984375, -1.54925537109375, -1.39990234375, -1.25054931640625, -1.1011962890625, -0.95184326171875, -0.802490234375, -0.65313720703125, -0.5037841796875, -0.35443115234375, -0.205078125, -0.05572509765625, 0.0936279296875, 0.24298095703125, 0.392333984375, 0.54168701171875, 0.6910400390625, 0.84039306640625, 0.98974609375, 1.13909912109375, 1.2884521484375, 1.43780517578125, 1.587158203125, 1.73651123046875, 1.8858642578125, 2.03521728515625, 2.1845703125, 2.33392333984375, 2.4832763671875, 2.63262939453125, 2.781982421875, 2.93133544921875, 3.0806884765625, 3.23004150390625, 3.37939453125, 3.52874755859375, 3.6781005859375, 3.82745361328125, 3.976806640625, 4.12615966796875, 4.2755126953125, 4.42486572265625, 4.57421875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 3.0, 10.0, 7.0, 12.0, 10.0, 25.0, 34.0, 55.0, 78.0, 103.0, 114.0, 128.0, 121.0, 78.0, 69.0, 57.0, 23.0, 21.0, 20.0, 7.0, 12.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.85691833496094, -89.43411254882812, -86.01130676269531, -82.5885009765625, -79.16569519042969, -75.74288940429688, -72.32007598876953, -68.89727020263672, -65.4744644165039, -62.051658630371094, -58.62885284423828, -55.2060432434082, -51.78323745727539, -48.36043167114258, -44.9376220703125, -41.51481628417969, -38.092010498046875, -34.66920471191406, -31.246397018432617, -27.823589324951172, -24.40078353881836, -20.977977752685547, -17.5551700592041, -14.132362365722656, -10.709556579589844, -7.286749839782715, -3.863943099975586, -0.44113636016845703, 2.981670379638672, 6.404476165771484, 9.82728385925293, 13.250091552734375, 16.672897338867188, 20.095703125, 23.518510818481445, 26.94131851196289, 30.364124298095703, 33.786930084228516, 37.209739685058594, 40.632545471191406, 44.05535125732422, 47.47815704345703, 50.900962829589844, 54.32377243041992, 57.746578216552734, 61.16938400268555, 64.59219360351562, 68.01499938964844, 71.43780517578125, 74.86061096191406, 78.28341674804688, 81.70622253417969, 85.1290283203125, 88.55183410644531, 91.97464752197266, 95.39745330810547, 98.82025909423828, 102.2430648803711, 105.6658706665039, 109.08867645263672, 112.51148986816406, 115.93429565429688, 119.35710144042969, 122.7799072265625, 126.20271301269531]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 12.0, 9.0, 17.0, 10.0, 38.0, 33.0, 40.0, 49.0, 75.0, 74.0, 56.0, 76.0, 70.0, 77.0, 66.0, 60.0, 45.0, 37.0, 39.0, 23.0, 25.0, 19.0, 12.0, 11.0, 3.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.665313720703125, -58.071136474609375, -55.47695541381836, -52.882774353027344, -50.288597106933594, -47.694419860839844, -45.10023880004883, -42.50605773925781, -39.91188049316406, -37.31770324707031, -34.7235221862793, -32.12934112548828, -29.53516387939453, -26.94098472595215, -24.346805572509766, -21.752626419067383, -19.158447265625, -16.564268112182617, -13.970088958740234, -11.375909805297852, -8.781730651855469, -6.187551498413086, -3.593372344970703, -0.9991931915283203, 1.5949859619140625, 4.189165115356445, 6.783344268798828, 9.377523422241211, 11.971702575683594, 14.565881729125977, 17.16006088256836, 19.754240036010742, 22.348426818847656, 24.94260597229004, 27.536785125732422, 30.130964279174805, 32.72514343261719, 35.31932067871094, 37.91350173950195, 40.50768280029297, 43.10186004638672, 45.69603729248047, 48.290218353271484, 50.8843994140625, 53.47857666015625, 56.07275390625, 58.666934967041016, 61.26111602783203, 63.85529327392578, 66.44947052001953, 69.04365539550781, 71.63783264160156, 74.23200988769531, 76.82618713378906, 79.42036437988281, 82.0145492553711, 84.60872650146484, 87.2029037475586, 89.79708862304688, 92.39126586914062, 94.98544311523438, 97.57962036132812, 100.17379760742188, 102.76798248291016, 105.3621597290039]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 11.0, 16.0, 32.0, 41.0, 63.0, 139.0, 260.0, 769.0, 4390.0, 49761.0, 3927023.0, 195983.0, 12674.0, 2039.0, 586.0, 227.0, 97.0, 64.0, 46.0, 21.0, 14.0, 10.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.9375, -90.548828125, -87.16015625, -83.771484375, -80.3828125, -76.994140625, -73.60546875, -70.216796875, -66.828125, -63.439453125, -60.05078125, -56.662109375, -53.2734375, -49.884765625, -46.49609375, -43.107421875, -39.71875, -36.330078125, -32.94140625, -29.552734375, -26.1640625, -22.775390625, -19.38671875, -15.998046875, -12.609375, -9.220703125, -5.83203125, -2.443359375, 0.9453125, 4.333984375, 7.72265625, 11.111328125, 14.5, 17.888671875, 21.27734375, 24.666015625, 28.0546875, 31.443359375, 34.83203125, 38.220703125, 41.609375, 44.998046875, 48.38671875, 51.775390625, 55.1640625, 58.552734375, 61.94140625, 65.330078125, 68.71875, 72.107421875, 75.49609375, 78.884765625, 82.2734375, 85.662109375, 89.05078125, 92.439453125, 95.828125, 99.216796875, 102.60546875, 105.994140625, 109.3828125, 112.771484375, 116.16015625, 119.548828125, 122.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 13.0, 27.0, 24.0, 38.0, 53.0, 66.0, 57.0, 70.0, 84.0, 105.0, 87.0, 71.0, 65.0, 49.0, 53.0, 43.0, 29.0, 20.0, 12.0, 4.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.9500732421875, -1.870849609375, -1.7916259765625, -1.71240234375, -1.6331787109375, -1.553955078125, -1.4747314453125, -1.3955078125, -1.3162841796875, -1.237060546875, -1.1578369140625, -1.07861328125, -0.9993896484375, -0.920166015625, -0.8409423828125, -0.76171875, -0.6824951171875, -0.603271484375, -0.5240478515625, -0.44482421875, -0.3656005859375, -0.286376953125, -0.2071533203125, -0.1279296875, -0.0487060546875, 0.030517578125, 0.1097412109375, 0.18896484375, 0.2681884765625, 0.347412109375, 0.4266357421875, 0.505859375, 0.5850830078125, 0.664306640625, 0.7435302734375, 0.82275390625, 0.9019775390625, 0.981201171875, 1.0604248046875, 1.1396484375, 1.2188720703125, 1.298095703125, 1.3773193359375, 1.45654296875, 1.5357666015625, 1.614990234375, 1.6942138671875, 1.7734375, 1.8526611328125, 1.931884765625, 2.0111083984375, 2.09033203125, 2.1695556640625, 2.248779296875, 2.3280029296875, 2.4072265625, 2.4864501953125, 2.565673828125, 2.6448974609375, 2.72412109375, 2.8033447265625, 2.882568359375, 2.9617919921875, 3.041015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 31.0, 24.0, 57.0, 92.0, 163.0, 380.0, 1082.0, 3551.0, 14766.0, 80039.0, 961414.0, 3007361.0, 101362.0, 17732.0, 4256.0, 1163.0, 384.0, 191.0, 84.0, 60.0, 31.0, 12.0, 15.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.96875, -52.173828125, -50.37890625, -48.583984375, -46.7890625, -44.994140625, -43.19921875, -41.404296875, -39.609375, -37.814453125, -36.01953125, -34.224609375, -32.4296875, -30.634765625, -28.83984375, -27.044921875, -25.25, -23.455078125, -21.66015625, -19.865234375, -18.0703125, -16.275390625, -14.48046875, -12.685546875, -10.890625, -9.095703125, -7.30078125, -5.505859375, -3.7109375, -1.916015625, -0.12109375, 1.673828125, 3.46875, 5.263671875, 7.05859375, 8.853515625, 10.6484375, 12.443359375, 14.23828125, 16.033203125, 17.828125, 19.623046875, 21.41796875, 23.212890625, 25.0078125, 26.802734375, 28.59765625, 30.392578125, 32.1875, 33.982421875, 35.77734375, 37.572265625, 39.3671875, 41.162109375, 42.95703125, 44.751953125, 46.546875, 48.341796875, 50.13671875, 51.931640625, 53.7265625, 55.521484375, 57.31640625, 59.111328125, 60.90625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 8.0, 11.0, 6.0, 14.0, 13.0, 19.0, 39.0, 43.0, 56.0, 90.0, 90.0, 126.0, 206.0, 494.0, 1862.0, 365.0, 210.0, 106.0, 83.0, 75.0, 35.0, 29.0, 16.0, 19.0, 15.0, 17.0, 8.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -6.02227783203125, -5.8101806640625, -5.59808349609375, -5.385986328125, -5.17388916015625, -4.9617919921875, -4.74969482421875, -4.53759765625, -4.32550048828125, -4.1134033203125, -3.90130615234375, -3.689208984375, -3.47711181640625, -3.2650146484375, -3.05291748046875, -2.8408203125, -2.62872314453125, -2.4166259765625, -2.20452880859375, -1.992431640625, -1.78033447265625, -1.5682373046875, -1.35614013671875, -1.14404296875, -0.93194580078125, -0.7198486328125, -0.50775146484375, -0.295654296875, -0.08355712890625, 0.1285400390625, 0.34063720703125, 0.552734375, 0.76483154296875, 0.9769287109375, 1.18902587890625, 1.401123046875, 1.61322021484375, 1.8253173828125, 2.03741455078125, 2.24951171875, 2.46160888671875, 2.6737060546875, 2.88580322265625, 3.097900390625, 3.30999755859375, 3.5220947265625, 3.73419189453125, 3.9462890625, 4.15838623046875, 4.3704833984375, 4.58258056640625, 4.794677734375, 5.00677490234375, 5.2188720703125, 5.43096923828125, 5.64306640625, 5.85516357421875, 6.0672607421875, 6.27935791015625, 6.491455078125, 6.70355224609375, 6.9156494140625, 7.12774658203125, 7.33984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 16.0, 14.0, 27.0, 35.0, 51.0, 73.0, 103.0, 129.0, 119.0, 116.0, 106.0, 74.0, 41.0, 26.0, 15.0, 20.0, 6.0, 4.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.21955108642578, -30.569355010986328, -28.919158935546875, -27.268962860107422, -25.6187686920166, -23.96857261657715, -22.318376541137695, -20.668182373046875, -19.017986297607422, -17.36779022216797, -15.717595100402832, -14.067399024963379, -12.417203903198242, -10.767007827758789, -9.116811752319336, -7.466616630554199, -5.81641960144043, -4.166224002838135, -2.5160281658172607, -0.8658323287963867, 0.7843632698059082, 2.434558868408203, 4.084754943847656, 5.734950065612793, 7.385146141052246, 9.0353422164917, 10.685537338256836, 12.335733413696289, 13.985929489135742, 15.636124610900879, 17.286319732666016, 18.93651580810547, 20.586711883544922, 22.236907958984375, 23.887104034423828, 25.53730010986328, 27.1874942779541, 28.837690353393555, 30.487886428833008, 32.13808059692383, 33.78827667236328, 35.438472747802734, 37.08866882324219, 38.73886489868164, 40.389060974121094, 42.03925323486328, 43.689453125, 45.33964538574219, 46.989845275878906, 48.64004135131836, 50.29023742675781, 51.940433502197266, 53.59062957763672, 55.240821838378906, 56.891021728515625, 58.54121398925781, 60.191410064697266, 61.84160614013672, 63.49180221557617, 65.14199829101562, 66.79219055175781, 68.44239044189453, 70.09258270263672, 71.74278259277344, 73.39297485351562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 4.0, 9.0, 10.0, 11.0, 15.0, 19.0, 19.0, 16.0, 26.0, 28.0, 29.0, 38.0, 29.0, 38.0, 42.0, 43.0, 36.0, 57.0, 50.0, 65.0, 53.0, 48.0, 38.0, 37.0, 37.0, 33.0, 29.0, 21.0, 19.0, 17.0, 27.0, 8.0, 10.0, 4.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-31.966903686523438, -31.10605812072754, -30.245210647583008, -29.38436508178711, -28.52351951599121, -27.662673950195312, -26.80182647705078, -25.940980911254883, -25.080135345458984, -24.219289779663086, -23.358442306518555, -22.497596740722656, -21.636751174926758, -20.77590560913086, -19.915058135986328, -19.05421257019043, -18.19336700439453, -17.332521438598633, -16.4716739654541, -15.610828399658203, -14.749982833862305, -13.88913631439209, -13.028289794921875, -12.167444229125977, -11.306596755981445, -10.44575023651123, -9.584904670715332, -8.724058151245117, -7.863212585449219, -7.002366065979004, -6.141520023345947, -5.280673980712891, -4.419828414916992, -3.5589823722839355, -2.698136329650879, -1.8372900485992432, -0.9764440059661865, -0.11559772491455078, 0.7452483177185059, 1.6060943603515625, 2.466940402984619, 3.327786445617676, 4.188632488250732, 5.049478530883789, 5.910325050354004, 6.7711710929870605, 7.632017135620117, 8.492862701416016, 9.35370922088623, 10.214555740356445, 11.075401306152344, 11.936247825622559, 12.797093391418457, 13.657939910888672, 14.51878547668457, 15.379631996154785, 16.240478515625, 17.1013240814209, 17.96217155456543, 18.823017120361328, 19.683862686157227, 20.544708251953125, 21.405555725097656, 22.266401290893555, 23.127246856689453]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 2.0, 9.0, 11.0, 12.0, 21.0, 35.0, 32.0, 47.0, 80.0, 87.0, 174.0, 246.0, 442.0, 711.0, 1556.0, 3586.0, 10875.0, 39895.0, 161917.0, 476233.0, 260279.0, 65422.0, 17127.0, 5375.0, 2068.0, 914.0, 481.0, 290.0, 180.0, 126.0, 83.0, 64.0, 38.0, 36.0, 24.0, 15.0, 7.0, 12.0, 12.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-27.578125, -26.80517578125, -26.0322265625, -25.25927734375, -24.486328125, -23.71337890625, -22.9404296875, -22.16748046875, -21.39453125, -20.62158203125, -19.8486328125, -19.07568359375, -18.302734375, -17.52978515625, -16.7568359375, -15.98388671875, -15.2109375, -14.43798828125, -13.6650390625, -12.89208984375, -12.119140625, -11.34619140625, -10.5732421875, -9.80029296875, -9.02734375, -8.25439453125, -7.4814453125, -6.70849609375, -5.935546875, -5.16259765625, -4.3896484375, -3.61669921875, -2.84375, -2.07080078125, -1.2978515625, -0.52490234375, 0.248046875, 1.02099609375, 1.7939453125, 2.56689453125, 3.33984375, 4.11279296875, 4.8857421875, 5.65869140625, 6.431640625, 7.20458984375, 7.9775390625, 8.75048828125, 9.5234375, 10.29638671875, 11.0693359375, 11.84228515625, 12.615234375, 13.38818359375, 14.1611328125, 14.93408203125, 15.70703125, 16.47998046875, 17.2529296875, 18.02587890625, 18.798828125, 19.57177734375, 20.3447265625, 21.11767578125, 21.890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 11.0, 27.0, 42.0, 60.0, 58.0, 105.0, 121.0, 109.0, 110.0, 94.0, 72.0, 62.0, 37.0, 40.0, 13.0, 13.0, 4.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.429168701171875, -3.30950927734375, -3.189849853515625, -3.0701904296875, -2.950531005859375, -2.83087158203125, -2.711212158203125, -2.591552734375, -2.471893310546875, -2.35223388671875, -2.232574462890625, -2.1129150390625, -1.993255615234375, -1.87359619140625, -1.753936767578125, -1.63427734375, -1.514617919921875, -1.39495849609375, -1.275299072265625, -1.1556396484375, -1.035980224609375, -0.91632080078125, -0.796661376953125, -0.677001953125, -0.557342529296875, -0.43768310546875, -0.318023681640625, -0.1983642578125, -0.078704833984375, 0.04095458984375, 0.160614013671875, 0.2802734375, 0.399932861328125, 0.51959228515625, 0.639251708984375, 0.7589111328125, 0.878570556640625, 0.99822998046875, 1.117889404296875, 1.237548828125, 1.357208251953125, 1.47686767578125, 1.596527099609375, 1.7161865234375, 1.835845947265625, 1.95550537109375, 2.075164794921875, 2.19482421875, 2.314483642578125, 2.43414306640625, 2.553802490234375, 2.6734619140625, 2.793121337890625, 2.91278076171875, 3.032440185546875, 3.152099609375, 3.271759033203125, 3.39141845703125, 3.511077880859375, 3.6307373046875, 3.750396728515625, 3.87005615234375, 3.989715576171875, 4.109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 19.0, 16.0, 24.0, 33.0, 46.0, 75.0, 118.0, 167.0, 245.0, 404.0, 721.0, 1397.0, 2684.0, 5500.0, 14358.0, 40619.0, 127652.0, 383418.0, 314377.0, 101647.0, 33104.0, 11827.0, 4702.0, 2365.0, 1187.0, 644.0, 410.0, 273.0, 156.0, 100.0, 75.0, 54.0, 37.0, 20.0, 17.0, 12.0, 17.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-20.484375, -19.880126953125, -19.27587890625, -18.671630859375, -18.0673828125, -17.463134765625, -16.85888671875, -16.254638671875, -15.650390625, -15.046142578125, -14.44189453125, -13.837646484375, -13.2333984375, -12.629150390625, -12.02490234375, -11.420654296875, -10.81640625, -10.212158203125, -9.60791015625, -9.003662109375, -8.3994140625, -7.795166015625, -7.19091796875, -6.586669921875, -5.982421875, -5.378173828125, -4.77392578125, -4.169677734375, -3.5654296875, -2.961181640625, -2.35693359375, -1.752685546875, -1.1484375, -0.544189453125, 0.06005859375, 0.664306640625, 1.2685546875, 1.872802734375, 2.47705078125, 3.081298828125, 3.685546875, 4.289794921875, 4.89404296875, 5.498291015625, 6.1025390625, 6.706787109375, 7.31103515625, 7.915283203125, 8.51953125, 9.123779296875, 9.72802734375, 10.332275390625, 10.9365234375, 11.540771484375, 12.14501953125, 12.749267578125, 13.353515625, 13.957763671875, 14.56201171875, 15.166259765625, 15.7705078125, 16.374755859375, 16.97900390625, 17.583251953125, 18.1875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 9.0, 9.0, 8.0, 7.0, 10.0, 23.0, 20.0, 15.0, 33.0, 28.0, 33.0, 43.0, 41.0, 36.0, 42.0, 46.0, 46.0, 53.0, 50.0, 44.0, 48.0, 44.0, 45.0, 41.0, 32.0, 28.0, 18.0, 22.0, 23.0, 20.0, 14.0, 18.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.3702392578125, -9.045166015625, -8.7200927734375, -8.39501953125, -8.0699462890625, -7.744873046875, -7.4197998046875, -7.0947265625, -6.7696533203125, -6.444580078125, -6.1195068359375, -5.79443359375, -5.4693603515625, -5.144287109375, -4.8192138671875, -4.494140625, -4.1690673828125, -3.843994140625, -3.5189208984375, -3.19384765625, -2.8687744140625, -2.543701171875, -2.2186279296875, -1.8935546875, -1.5684814453125, -1.243408203125, -0.9183349609375, -0.59326171875, -0.2681884765625, 0.056884765625, 0.3819580078125, 0.70703125, 1.0321044921875, 1.357177734375, 1.6822509765625, 2.00732421875, 2.3323974609375, 2.657470703125, 2.9825439453125, 3.3076171875, 3.6326904296875, 3.957763671875, 4.2828369140625, 4.60791015625, 4.9329833984375, 5.258056640625, 5.5831298828125, 5.908203125, 6.2332763671875, 6.558349609375, 6.8834228515625, 7.20849609375, 7.5335693359375, 7.858642578125, 8.1837158203125, 8.5087890625, 8.8338623046875, 9.158935546875, 9.4840087890625, 9.80908203125, 10.1341552734375, 10.459228515625, 10.7843017578125, 11.109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 7.0, 6.0, 8.0, 15.0, 8.0, 30.0, 46.0, 60.0, 161.0, 298.0, 755.0, 2100.0, 8755.0, 55960.0, 504636.0, 419797.0, 45333.0, 7437.0, 1956.0, 611.0, 270.0, 129.0, 63.0, 44.0, 19.0, 16.0, 17.0, 11.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.761474609375, -17.14794921875, -16.534423828125, -15.9208984375, -15.307373046875, -14.69384765625, -14.080322265625, -13.466796875, -12.853271484375, -12.23974609375, -11.626220703125, -11.0126953125, -10.399169921875, -9.78564453125, -9.172119140625, -8.55859375, -7.945068359375, -7.33154296875, -6.718017578125, -6.1044921875, -5.490966796875, -4.87744140625, -4.263916015625, -3.650390625, -3.036865234375, -2.42333984375, -1.809814453125, -1.1962890625, -0.582763671875, 0.03076171875, 0.644287109375, 1.2578125, 1.871337890625, 2.48486328125, 3.098388671875, 3.7119140625, 4.325439453125, 4.93896484375, 5.552490234375, 6.166015625, 6.779541015625, 7.39306640625, 8.006591796875, 8.6201171875, 9.233642578125, 9.84716796875, 10.460693359375, 11.07421875, 11.687744140625, 12.30126953125, 12.914794921875, 13.5283203125, 14.141845703125, 14.75537109375, 15.368896484375, 15.982421875, 16.595947265625, 17.20947265625, 17.822998046875, 18.4365234375, 19.050048828125, 19.66357421875, 20.277099609375, 20.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 4.0, 4.0, 7.0, 16.0, 13.0, 21.0, 17.0, 22.0, 34.0, 38.0, 39.0, 52.0, 70.0, 96.0, 83.0, 91.0, 74.0, 56.0, 49.0, 30.0, 40.0, 30.0, 23.0, 17.0, 13.0, 6.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0014314651489257812, -0.0013904869556427002, -0.0013495087623596191, -0.001308530569076538, -0.001267552375793457, -0.001226574182510376, -0.001185595989227295, -0.0011446177959442139, -0.0011036396026611328, -0.0010626614093780518, -0.0010216832160949707, -0.0009807050228118896, -0.0009397268295288086, -0.0008987486362457275, -0.0008577704429626465, -0.0008167922496795654, -0.0007758140563964844, -0.0007348358631134033, -0.0006938576698303223, -0.0006528794765472412, -0.0006119012832641602, -0.0005709230899810791, -0.000529944896697998, -0.000488966703414917, -0.00044798851013183594, -0.0004070103168487549, -0.00036603212356567383, -0.0003250539302825928, -0.0002840757369995117, -0.00024309754371643066, -0.0002021193504333496, -0.00016114115715026855, -0.0001201629638671875, -7.918477058410645e-05, -3.820657730102539e-05, 2.771615982055664e-06, 4.374980926513672e-05, 8.472800254821777e-05, 0.00012570619583129883, 0.00016668438911437988, 0.00020766258239746094, 0.000248640775680542, 0.00028961896896362305, 0.0003305971622467041, 0.00037157535552978516, 0.0004125535488128662, 0.00045353174209594727, 0.0004945099353790283, 0.0005354881286621094, 0.0005764663219451904, 0.0006174445152282715, 0.0006584227085113525, 0.0006994009017944336, 0.0007403790950775146, 0.0007813572883605957, 0.0008223354816436768, 0.0008633136749267578, 0.0009042918682098389, 0.0009452700614929199, 0.000986248254776001, 0.001027226448059082, 0.001068204641342163, 0.0011091828346252441, 0.0011501610279083252, 0.0011911392211914062]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 9.0, 17.0, 19.0, 43.0, 52.0, 87.0, 118.0, 221.0, 469.0, 1142.0, 3407.0, 13912.0, 98625.0, 694438.0, 204978.0, 23367.0, 4960.0, 1506.0, 554.0, 263.0, 125.0, 73.0, 63.0, 31.0, 20.0, 12.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.2177734375, -23.498046875, -22.7783203125, -22.05859375, -21.3388671875, -20.619140625, -19.8994140625, -19.1796875, -18.4599609375, -17.740234375, -17.0205078125, -16.30078125, -15.5810546875, -14.861328125, -14.1416015625, -13.421875, -12.7021484375, -11.982421875, -11.2626953125, -10.54296875, -9.8232421875, -9.103515625, -8.3837890625, -7.6640625, -6.9443359375, -6.224609375, -5.5048828125, -4.78515625, -4.0654296875, -3.345703125, -2.6259765625, -1.90625, -1.1865234375, -0.466796875, 0.2529296875, 0.97265625, 1.6923828125, 2.412109375, 3.1318359375, 3.8515625, 4.5712890625, 5.291015625, 6.0107421875, 6.73046875, 7.4501953125, 8.169921875, 8.8896484375, 9.609375, 10.3291015625, 11.048828125, 11.7685546875, 12.48828125, 13.2080078125, 13.927734375, 14.6474609375, 15.3671875, 16.0869140625, 16.806640625, 17.5263671875, 18.24609375, 18.9658203125, 19.685546875, 20.4052734375, 21.125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 26.0, 38.0, 66.0, 97.0, 126.0, 132.0, 131.0, 115.0, 74.0, 63.0, 41.0, 26.0, 13.0, 13.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.71875, -16.36932373046875, -16.0198974609375, -15.67047119140625, -15.321044921875, -14.97161865234375, -14.6221923828125, -14.27276611328125, -13.92333984375, -13.57391357421875, -13.2244873046875, -12.87506103515625, -12.525634765625, -12.17620849609375, -11.8267822265625, -11.47735595703125, -11.1279296875, -10.77850341796875, -10.4290771484375, -10.07965087890625, -9.730224609375, -9.38079833984375, -9.0313720703125, -8.68194580078125, -8.33251953125, -7.98309326171875, -7.6336669921875, -7.28424072265625, -6.934814453125, -6.58538818359375, -6.2359619140625, -5.88653564453125, -5.537109375, -5.18768310546875, -4.8382568359375, -4.48883056640625, -4.139404296875, -3.78997802734375, -3.4405517578125, -3.09112548828125, -2.74169921875, -2.39227294921875, -2.0428466796875, -1.69342041015625, -1.343994140625, -0.99456787109375, -0.6451416015625, -0.29571533203125, 0.0537109375, 0.40313720703125, 0.7525634765625, 1.10198974609375, 1.451416015625, 1.80084228515625, 2.1502685546875, 2.49969482421875, 2.84912109375, 3.19854736328125, 3.5479736328125, 3.89739990234375, 4.246826171875, 4.59625244140625, 4.9456787109375, 5.29510498046875, 5.64453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 16.0, 27.0, 77.0, 220.0, 328.0, 215.0, 86.0, 31.0, 6.0, 5.0, 2.0, 1.0, 1.0], "bins": [-496.0281982421875, -487.0992431640625, -478.1703186035156, -469.2413635253906, -460.31243896484375, -451.38348388671875, -442.45452880859375, -433.5256042480469, -424.5966491699219, -415.6676940917969, -406.73876953125, -397.809814453125, -388.880859375, -379.9519348144531, -371.0229797363281, -362.09405517578125, -353.16510009765625, -344.23614501953125, -335.3072204589844, -326.3782653808594, -317.4493408203125, -308.5203857421875, -299.5914306640625, -290.6625061035156, -281.7335510253906, -272.8045959472656, -263.87567138671875, -254.94671630859375, -246.0177764892578, -237.08883666992188, -228.15988159179688, -219.23094177246094, -210.30198669433594, -201.373046875, -192.444091796875, -183.51515197753906, -174.58621215820312, -165.6572723388672, -156.72833251953125, -147.79937744140625, -138.8704376220703, -129.94149780273438, -121.0125503540039, -112.08360290527344, -103.1546630859375, -94.22572326660156, -85.2967758178711, -76.36782836914062, -67.43888854980469, -58.509944915771484, -49.58100128173828, -40.65205764770508, -31.723114013671875, -22.794170379638672, -13.865226745605469, -4.936283111572266, 3.9926605224609375, 12.92160415649414, 21.850547790527344, 30.779491424560547, 39.70843505859375, 48.63737869262695, 57.566322326660156, 66.49526977539062, 75.42420959472656]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 10.0, 7.0, 10.0, 12.0, 19.0, 20.0, 18.0, 16.0, 26.0, 40.0, 44.0, 41.0, 52.0, 45.0, 49.0, 62.0, 51.0, 51.0, 51.0, 47.0, 36.0, 39.0, 37.0, 43.0, 28.0, 22.0, 22.0, 9.0, 14.0, 15.0, 14.0, 9.0, 4.0, 3.0, 9.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-84.17637634277344, -81.90940856933594, -79.64244842529297, -77.37548065185547, -75.10851287841797, -72.841552734375, -70.5745849609375, -68.3076171875, -66.0406494140625, -63.773685455322266, -61.506717681884766, -59.23975372314453, -56.97278594970703, -54.7058219909668, -52.43885803222656, -50.17189025878906, -47.904930114746094, -45.63796615600586, -43.37099838256836, -41.104034423828125, -38.837066650390625, -36.57010269165039, -34.303138732910156, -32.036170959472656, -29.769207000732422, -27.502241134643555, -25.235275268554688, -22.968311309814453, -20.701345443725586, -18.43437957763672, -16.167415618896484, -13.900449752807617, -11.633476257324219, -9.366510391235352, -7.099545478820801, -4.832580089569092, -2.565614700317383, -0.2986488342285156, 1.9683160781860352, 4.235280990600586, 6.502246856689453, 8.76921272277832, 11.036177635192871, 13.303142547607422, 15.570108413696289, 17.837074279785156, 20.10403823852539, 22.371004104614258, 24.637969970703125, 26.904935836791992, 29.17190170288086, 31.438865661621094, 33.705833435058594, 35.97279739379883, 38.23976135253906, 40.50672912597656, 42.7736930847168, 45.04065704345703, 47.30762481689453, 49.574588775634766, 51.841552734375, 54.1085205078125, 56.375484466552734, 58.64244842529297, 60.90941619873047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 0.0, 5.0, 4.0, 16.0, 22.0, 31.0, 49.0, 70.0, 130.0, 255.0, 560.0, 1527.0, 5085.0, 25281.0, 387373.0, 3708611.0, 52843.0, 8640.0, 2189.0, 779.0, 346.0, 173.0, 105.0, 60.0, 43.0, 36.0, 12.0, 15.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.0625, -58.072265625, -56.08203125, -54.091796875, -52.1015625, -50.111328125, -48.12109375, -46.130859375, -44.140625, -42.150390625, -40.16015625, -38.169921875, -36.1796875, -34.189453125, -32.19921875, -30.208984375, -28.21875, -26.228515625, -24.23828125, -22.248046875, -20.2578125, -18.267578125, -16.27734375, -14.287109375, -12.296875, -10.306640625, -8.31640625, -6.326171875, -4.3359375, -2.345703125, -0.35546875, 1.634765625, 3.625, 5.615234375, 7.60546875, 9.595703125, 11.5859375, 13.576171875, 15.56640625, 17.556640625, 19.546875, 21.537109375, 23.52734375, 25.517578125, 27.5078125, 29.498046875, 31.48828125, 33.478515625, 35.46875, 37.458984375, 39.44921875, 41.439453125, 43.4296875, 45.419921875, 47.41015625, 49.400390625, 51.390625, 53.380859375, 55.37109375, 57.361328125, 59.3515625, 61.341796875, 63.33203125, 65.322265625, 67.3125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 3.0, 2.0, 2.0, 7.0, 10.0, 11.0, 11.0, 26.0, 16.0, 49.0, 39.0, 48.0, 58.0, 66.0, 72.0, 67.0, 65.0, 84.0, 69.0, 69.0, 50.0, 51.0, 27.0, 19.0, 18.0, 11.0, 14.0, 16.0, 6.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.962890625, -2.875946044921875, -2.78900146484375, -2.702056884765625, -2.6151123046875, -2.528167724609375, -2.44122314453125, -2.354278564453125, -2.267333984375, -2.180389404296875, -2.09344482421875, -2.006500244140625, -1.9195556640625, -1.832611083984375, -1.74566650390625, -1.658721923828125, -1.57177734375, -1.484832763671875, -1.39788818359375, -1.310943603515625, -1.2239990234375, -1.137054443359375, -1.05010986328125, -0.963165283203125, -0.876220703125, -0.789276123046875, -0.70233154296875, -0.615386962890625, -0.5284423828125, -0.441497802734375, -0.35455322265625, -0.267608642578125, -0.1806640625, -0.093719482421875, -0.00677490234375, 0.080169677734375, 0.1671142578125, 0.254058837890625, 0.34100341796875, 0.427947998046875, 0.514892578125, 0.601837158203125, 0.68878173828125, 0.775726318359375, 0.8626708984375, 0.949615478515625, 1.03656005859375, 1.123504638671875, 1.21044921875, 1.297393798828125, 1.38433837890625, 1.471282958984375, 1.5582275390625, 1.645172119140625, 1.73211669921875, 1.819061279296875, 1.906005859375, 1.992950439453125, 2.07989501953125, 2.166839599609375, 2.2537841796875, 2.340728759765625, 2.42767333984375, 2.514617919921875, 2.6015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 14.0, 20.0, 37.0, 61.0, 94.0, 177.0, 366.0, 769.0, 1862.0, 4734.0, 16425.0, 83836.0, 1416119.0, 2548224.0, 94046.0, 18358.0, 5359.0, 2012.0, 861.0, 406.0, 204.0, 115.0, 85.0, 39.0, 25.0, 16.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -42.19140625, -40.9140625, -39.63671875, -38.359375, -37.08203125, -35.8046875, -34.52734375, -33.25, -31.97265625, -30.6953125, -29.41796875, -28.140625, -26.86328125, -25.5859375, -24.30859375, -23.03125, -21.75390625, -20.4765625, -19.19921875, -17.921875, -16.64453125, -15.3671875, -14.08984375, -12.8125, -11.53515625, -10.2578125, -8.98046875, -7.703125, -6.42578125, -5.1484375, -3.87109375, -2.59375, -1.31640625, -0.0390625, 1.23828125, 2.515625, 3.79296875, 5.0703125, 6.34765625, 7.625, 8.90234375, 10.1796875, 11.45703125, 12.734375, 14.01171875, 15.2890625, 16.56640625, 17.84375, 19.12109375, 20.3984375, 21.67578125, 22.953125, 24.23046875, 25.5078125, 26.78515625, 28.0625, 29.33984375, 30.6171875, 31.89453125, 33.171875, 34.44921875, 35.7265625, 37.00390625, 38.28125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 12.0, 12.0, 20.0, 25.0, 37.0, 81.0, 125.0, 293.0, 753.0, 1874.0, 412.0, 156.0, 100.0, 54.0, 45.0, 14.0, 17.0, 12.0, 8.0, 3.0, 8.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.4552001953125, -9.152587890625, -8.8499755859375, -8.54736328125, -8.2447509765625, -7.942138671875, -7.6395263671875, -7.3369140625, -7.0343017578125, -6.731689453125, -6.4290771484375, -6.12646484375, -5.8238525390625, -5.521240234375, -5.2186279296875, -4.916015625, -4.6134033203125, -4.310791015625, -4.0081787109375, -3.70556640625, -3.4029541015625, -3.100341796875, -2.7977294921875, -2.4951171875, -2.1925048828125, -1.889892578125, -1.5872802734375, -1.28466796875, -0.9820556640625, -0.679443359375, -0.3768310546875, -0.07421875, 0.2283935546875, 0.531005859375, 0.8336181640625, 1.13623046875, 1.4388427734375, 1.741455078125, 2.0440673828125, 2.3466796875, 2.6492919921875, 2.951904296875, 3.2545166015625, 3.55712890625, 3.8597412109375, 4.162353515625, 4.4649658203125, 4.767578125, 5.0701904296875, 5.372802734375, 5.6754150390625, 5.97802734375, 6.2806396484375, 6.583251953125, 6.8858642578125, 7.1884765625, 7.4910888671875, 7.793701171875, 8.0963134765625, 8.39892578125, 8.7015380859375, 9.004150390625, 9.3067626953125, 9.609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 14.0, 17.0, 28.0, 51.0, 70.0, 118.0, 163.0, 167.0, 132.0, 112.0, 53.0, 31.0, 23.0, 11.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.6428451538086, -69.5374755859375, -67.4321060180664, -65.32673645019531, -63.22136306762695, -61.11599349975586, -59.010623931884766, -56.90525436401367, -54.79988098144531, -52.69451141357422, -50.589141845703125, -48.48377227783203, -46.37839889526367, -44.27302932739258, -42.167659759521484, -40.06229019165039, -37.9569206237793, -35.8515510559082, -33.74618148803711, -31.640810012817383, -29.535438537597656, -27.430068969726562, -25.32469940185547, -23.219329833984375, -21.11395835876465, -19.008588790893555, -16.903217315673828, -14.797847747802734, -12.692477226257324, -10.587106704711914, -8.48173713684082, -6.37636661529541, -4.270992279052734, -2.1656219959259033, -0.060251712799072266, 2.0451183319091797, 4.15048885345459, 6.255859375, 8.361228942871094, 10.466599464416504, 12.571969985961914, 14.677340507507324, 16.782711029052734, 18.888080596923828, 20.993450164794922, 23.09882164001465, 25.204191207885742, 27.30956268310547, 29.414932250976562, 31.520301818847656, 33.62567138671875, 35.731040954589844, 37.8364143371582, 39.9417839050293, 42.04715347290039, 44.152523040771484, 46.257896423339844, 48.36326599121094, 50.46863555908203, 52.574005126953125, 54.679378509521484, 56.78474807739258, 58.89011764526367, 60.995487213134766, 63.10085678100586]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 4.0, 14.0, 6.0, 18.0, 37.0, 30.0, 43.0, 73.0, 71.0, 98.0, 83.0, 94.0, 98.0, 74.0, 59.0, 57.0, 39.0, 42.0, 27.0, 11.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.262306213378906, -30.87497329711914, -29.487640380859375, -28.100309371948242, -26.712976455688477, -25.32564353942871, -23.938312530517578, -22.550979614257812, -21.163646697998047, -19.77631378173828, -18.388980865478516, -17.001649856567383, -15.614316940307617, -14.226984024047852, -12.839652061462402, -11.452320098876953, -10.064987182617188, -8.677654266357422, -7.290322303771973, -5.902989864349365, -4.515657424926758, -3.1283249855041504, -1.740992546081543, -0.35366058349609375, 1.0336723327636719, 2.4210047721862793, 3.8083372116088867, 5.195669651031494, 6.583002090454102, 7.970334529876709, 9.357666969299316, 10.744998931884766, 12.132331848144531, 13.519664764404297, 14.906996726989746, 16.294328689575195, 17.68166160583496, 19.068994522094727, 20.45632553100586, 21.843658447265625, 23.23099136352539, 24.618324279785156, 26.005657196044922, 27.392988204956055, 28.78032112121582, 30.167654037475586, 31.55498504638672, 32.942317962646484, 34.32965087890625, 35.716983795166016, 37.10431671142578, 38.49164962768555, 39.87898254394531, 41.26631164550781, 42.65364456176758, 44.040977478027344, 45.42831039428711, 46.815643310546875, 48.20297622680664, 49.590309143066406, 50.977638244628906, 52.36497116088867, 53.75230407714844, 55.1396369934082, 56.52696990966797]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 16.0, 16.0, 21.0, 35.0, 29.0, 56.0, 71.0, 96.0, 163.0, 219.0, 364.0, 643.0, 1160.0, 2351.0, 5808.0, 19027.0, 71520.0, 265729.0, 447576.0, 169658.0, 43502.0, 12206.0, 4087.0, 1781.0, 966.0, 503.0, 335.0, 187.0, 126.0, 77.0, 51.0, 40.0, 32.0, 19.0, 16.0, 16.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.375, -20.713623046875, -20.05224609375, -19.390869140625, -18.7294921875, -18.068115234375, -17.40673828125, -16.745361328125, -16.083984375, -15.422607421875, -14.76123046875, -14.099853515625, -13.4384765625, -12.777099609375, -12.11572265625, -11.454345703125, -10.79296875, -10.131591796875, -9.47021484375, -8.808837890625, -8.1474609375, -7.486083984375, -6.82470703125, -6.163330078125, -5.501953125, -4.840576171875, -4.17919921875, -3.517822265625, -2.8564453125, -2.195068359375, -1.53369140625, -0.872314453125, -0.2109375, 0.450439453125, 1.11181640625, 1.773193359375, 2.4345703125, 3.095947265625, 3.75732421875, 4.418701171875, 5.080078125, 5.741455078125, 6.40283203125, 7.064208984375, 7.7255859375, 8.386962890625, 9.04833984375, 9.709716796875, 10.37109375, 11.032470703125, 11.69384765625, 12.355224609375, 13.0166015625, 13.677978515625, 14.33935546875, 15.000732421875, 15.662109375, 16.323486328125, 16.98486328125, 17.646240234375, 18.3076171875, 18.968994140625, 19.63037109375, 20.291748046875, 20.953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 1.0, 5.0, 7.0, 14.0, 18.0, 22.0, 53.0, 43.0, 70.0, 80.0, 100.0, 98.0, 102.0, 95.0, 77.0, 52.0, 47.0, 40.0, 23.0, 18.0, 12.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.703460693359375, -2.58465576171875, -2.465850830078125, -2.3470458984375, -2.228240966796875, -2.10943603515625, -1.990631103515625, -1.871826171875, -1.753021240234375, -1.63421630859375, -1.515411376953125, -1.3966064453125, -1.277801513671875, -1.15899658203125, -1.040191650390625, -0.92138671875, -0.802581787109375, -0.68377685546875, -0.564971923828125, -0.4461669921875, -0.327362060546875, -0.20855712890625, -0.089752197265625, 0.029052734375, 0.147857666015625, 0.26666259765625, 0.385467529296875, 0.5042724609375, 0.623077392578125, 0.74188232421875, 0.860687255859375, 0.9794921875, 1.098297119140625, 1.21710205078125, 1.335906982421875, 1.4547119140625, 1.573516845703125, 1.69232177734375, 1.811126708984375, 1.929931640625, 2.048736572265625, 2.16754150390625, 2.286346435546875, 2.4051513671875, 2.523956298828125, 2.64276123046875, 2.761566162109375, 2.88037109375, 2.999176025390625, 3.11798095703125, 3.236785888671875, 3.3555908203125, 3.474395751953125, 3.59320068359375, 3.712005615234375, 3.830810546875, 3.949615478515625, 4.06842041015625, 4.187225341796875, 4.3060302734375, 4.424835205078125, 4.54364013671875, 4.662445068359375, 4.78125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 10.0, 12.0, 4.0, 8.0, 21.0, 22.0, 28.0, 43.0, 63.0, 68.0, 117.0, 163.0, 238.0, 338.0, 482.0, 821.0, 1497.0, 2928.0, 6018.0, 13807.0, 32886.0, 80919.0, 184810.0, 298212.0, 233529.0, 111256.0, 45316.0, 18408.0, 7966.0, 3731.0, 1870.0, 1024.0, 621.0, 381.0, 256.0, 213.0, 125.0, 93.0, 57.0, 52.0, 33.0, 33.0, 20.0, 16.0, 16.0, 11.0, 4.0, 4.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.44091796875, -10.1005859375, -9.76025390625, -9.419921875, -9.07958984375, -8.7392578125, -8.39892578125, -8.05859375, -7.71826171875, -7.3779296875, -7.03759765625, -6.697265625, -6.35693359375, -6.0166015625, -5.67626953125, -5.3359375, -4.99560546875, -4.6552734375, -4.31494140625, -3.974609375, -3.63427734375, -3.2939453125, -2.95361328125, -2.61328125, -2.27294921875, -1.9326171875, -1.59228515625, -1.251953125, -0.91162109375, -0.5712890625, -0.23095703125, 0.109375, 0.44970703125, 0.7900390625, 1.13037109375, 1.470703125, 1.81103515625, 2.1513671875, 2.49169921875, 2.83203125, 3.17236328125, 3.5126953125, 3.85302734375, 4.193359375, 4.53369140625, 4.8740234375, 5.21435546875, 5.5546875, 5.89501953125, 6.2353515625, 6.57568359375, 6.916015625, 7.25634765625, 7.5966796875, 7.93701171875, 8.27734375, 8.61767578125, 8.9580078125, 9.29833984375, 9.638671875, 9.97900390625, 10.3193359375, 10.65966796875, 11.0]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 5.0, 7.0, 6.0, 14.0, 11.0, 11.0, 17.0, 16.0, 34.0, 30.0, 29.0, 42.0, 30.0, 37.0, 40.0, 42.0, 49.0, 47.0, 44.0, 38.0, 43.0, 36.0, 34.0, 33.0, 47.0, 49.0, 27.0, 30.0, 24.0, 27.0, 25.0, 9.0, 8.0, 8.0, 10.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-9.0703125, -8.8079833984375, -8.545654296875, -8.2833251953125, -8.02099609375, -7.7586669921875, -7.496337890625, -7.2340087890625, -6.9716796875, -6.7093505859375, -6.447021484375, -6.1846923828125, -5.92236328125, -5.6600341796875, -5.397705078125, -5.1353759765625, -4.873046875, -4.6107177734375, -4.348388671875, -4.0860595703125, -3.82373046875, -3.5614013671875, -3.299072265625, -3.0367431640625, -2.7744140625, -2.5120849609375, -2.249755859375, -1.9874267578125, -1.72509765625, -1.4627685546875, -1.200439453125, -0.9381103515625, -0.67578125, -0.4134521484375, -0.151123046875, 0.1112060546875, 0.37353515625, 0.6358642578125, 0.898193359375, 1.1605224609375, 1.4228515625, 1.6851806640625, 1.947509765625, 2.2098388671875, 2.47216796875, 2.7344970703125, 2.996826171875, 3.2591552734375, 3.521484375, 3.7838134765625, 4.046142578125, 4.3084716796875, 4.57080078125, 4.8331298828125, 5.095458984375, 5.3577880859375, 5.6201171875, 5.8824462890625, 6.144775390625, 6.4071044921875, 6.66943359375, 6.9317626953125, 7.194091796875, 7.4564208984375, 7.71875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 14.0, 15.0, 13.0, 19.0, 31.0, 72.0, 104.0, 155.0, 210.0, 351.0, 641.0, 1199.0, 2685.0, 6208.0, 16692.0, 46269.0, 126360.0, 277033.0, 312074.0, 161155.0, 60854.0, 21627.0, 8199.0, 3138.0, 1522.0, 756.0, 394.0, 242.0, 158.0, 103.0, 72.0, 42.0, 43.0, 31.0, 10.0, 13.0, 11.0, 6.0, 6.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.45306396484375, -4.2889404296875, -4.12481689453125, -3.960693359375, -3.79656982421875, -3.6324462890625, -3.46832275390625, -3.30419921875, -3.14007568359375, -2.9759521484375, -2.81182861328125, -2.647705078125, -2.48358154296875, -2.3194580078125, -2.15533447265625, -1.9912109375, -1.82708740234375, -1.6629638671875, -1.49884033203125, -1.334716796875, -1.17059326171875, -1.0064697265625, -0.84234619140625, -0.67822265625, -0.51409912109375, -0.3499755859375, -0.18585205078125, -0.021728515625, 0.14239501953125, 0.3065185546875, 0.47064208984375, 0.634765625, 0.79888916015625, 0.9630126953125, 1.12713623046875, 1.291259765625, 1.45538330078125, 1.6195068359375, 1.78363037109375, 1.94775390625, 2.11187744140625, 2.2760009765625, 2.44012451171875, 2.604248046875, 2.76837158203125, 2.9324951171875, 3.09661865234375, 3.2607421875, 3.42486572265625, 3.5889892578125, 3.75311279296875, 3.917236328125, 4.08135986328125, 4.2454833984375, 4.40960693359375, 4.57373046875, 4.73785400390625, 4.9019775390625, 5.06610107421875, 5.230224609375, 5.39434814453125, 5.5584716796875, 5.72259521484375, 5.88671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 5.0, 5.0, 9.0, 6.0, 7.0, 8.0, 15.0, 14.0, 21.0, 25.0, 29.0, 47.0, 56.0, 67.0, 67.0, 93.0, 105.0, 77.0, 71.0, 38.0, 54.0, 36.0, 24.0, 21.0, 21.0, 12.0, 10.0, 17.0, 8.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009593963623046875, -0.0009296610951423645, -0.0008999258279800415, -0.0008701905608177185, -0.0008404552936553955, -0.0008107200264930725, -0.0007809847593307495, -0.0007512494921684265, -0.0007215142250061035, -0.0006917789578437805, -0.0006620436906814575, -0.0006323084235191345, -0.0006025731563568115, -0.0005728378891944885, -0.0005431026220321655, -0.0005133673548698425, -0.00048363208770751953, -0.00045389682054519653, -0.00042416155338287354, -0.00039442628622055054, -0.00036469101905822754, -0.00033495575189590454, -0.00030522048473358154, -0.00027548521757125854, -0.00024574995040893555, -0.00021601468324661255, -0.00018627941608428955, -0.00015654414892196655, -0.00012680888175964355, -9.707361459732056e-05, -6.733834743499756e-05, -3.760308027267456e-05, -7.867813110351562e-06, 2.1867454051971436e-05, 5.1602721214294434e-05, 8.133798837661743e-05, 0.00011107325553894043, 0.00014080852270126343, 0.00017054378986358643, 0.00020027905702590942, 0.00023001432418823242, 0.0002597495913505554, 0.0002894848585128784, 0.0003192201256752014, 0.0003489553928375244, 0.0003786906599998474, 0.0004084259271621704, 0.0004381611943244934, 0.0004678964614868164, 0.0004976317286491394, 0.0005273669958114624, 0.0005571022629737854, 0.0005868375301361084, 0.0006165727972984314, 0.0006463080644607544, 0.0006760433316230774, 0.0007057785987854004, 0.0007355138659477234, 0.0007652491331100464, 0.0007949844002723694, 0.0008247196674346924, 0.0008544549345970154, 0.0008841902017593384, 0.0009139254689216614, 0.0009436607360839844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 8.0, 5.0, 13.0, 15.0, 19.0, 27.0, 30.0, 54.0, 67.0, 95.0, 153.0, 186.0, 309.0, 477.0, 812.0, 1501.0, 2830.0, 5980.0, 13732.0, 35468.0, 95553.0, 232597.0, 326363.0, 201221.0, 79209.0, 29236.0, 11534.0, 5031.0, 2453.0, 1363.0, 788.0, 469.0, 299.0, 173.0, 141.0, 123.0, 54.0, 48.0, 27.0, 21.0, 17.0, 14.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0], "bins": [-5.33203125, -5.16748046875, -5.0029296875, -4.83837890625, -4.673828125, -4.50927734375, -4.3447265625, -4.18017578125, -4.015625, -3.85107421875, -3.6865234375, -3.52197265625, -3.357421875, -3.19287109375, -3.0283203125, -2.86376953125, -2.69921875, -2.53466796875, -2.3701171875, -2.20556640625, -2.041015625, -1.87646484375, -1.7119140625, -1.54736328125, -1.3828125, -1.21826171875, -1.0537109375, -0.88916015625, -0.724609375, -0.56005859375, -0.3955078125, -0.23095703125, -0.06640625, 0.09814453125, 0.2626953125, 0.42724609375, 0.591796875, 0.75634765625, 0.9208984375, 1.08544921875, 1.25, 1.41455078125, 1.5791015625, 1.74365234375, 1.908203125, 2.07275390625, 2.2373046875, 2.40185546875, 2.56640625, 2.73095703125, 2.8955078125, 3.06005859375, 3.224609375, 3.38916015625, 3.5537109375, 3.71826171875, 3.8828125, 4.04736328125, 4.2119140625, 4.37646484375, 4.541015625, 4.70556640625, 4.8701171875, 5.03466796875, 5.19921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 13.0, 7.0, 17.0, 14.0, 21.0, 21.0, 35.0, 27.0, 34.0, 33.0, 35.0, 48.0, 50.0, 60.0, 76.0, 68.0, 57.0, 54.0, 55.0, 54.0, 48.0, 20.0, 26.0, 26.0, 13.0, 18.0, 17.0, 13.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.48046875, -3.374359130859375, -3.26824951171875, -3.162139892578125, -3.0560302734375, -2.949920654296875, -2.84381103515625, -2.737701416015625, -2.631591796875, -2.525482177734375, -2.41937255859375, -2.313262939453125, -2.2071533203125, -2.101043701171875, -1.99493408203125, -1.888824462890625, -1.78271484375, -1.676605224609375, -1.57049560546875, -1.464385986328125, -1.3582763671875, -1.252166748046875, -1.14605712890625, -1.039947509765625, -0.933837890625, -0.827728271484375, -0.72161865234375, -0.615509033203125, -0.5093994140625, -0.403289794921875, -0.29718017578125, -0.191070556640625, -0.0849609375, 0.021148681640625, 0.12725830078125, 0.233367919921875, 0.3394775390625, 0.445587158203125, 0.55169677734375, 0.657806396484375, 0.763916015625, 0.870025634765625, 0.97613525390625, 1.082244873046875, 1.1883544921875, 1.294464111328125, 1.40057373046875, 1.506683349609375, 1.61279296875, 1.718902587890625, 1.82501220703125, 1.931121826171875, 2.0372314453125, 2.143341064453125, 2.24945068359375, 2.355560302734375, 2.461669921875, 2.567779541015625, 2.67388916015625, 2.779998779296875, 2.8861083984375, 2.992218017578125, 3.09832763671875, 3.204437255859375, 3.310546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 16.0, 33.0, 50.0, 59.0, 130.0, 128.0, 143.0, 133.0, 98.0, 73.0, 47.0, 27.0, 21.0, 17.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.74972534179688, -70.46208190917969, -67.1744384765625, -63.88679885864258, -60.599159240722656, -57.31151580810547, -54.02387237548828, -50.736228942871094, -47.44858932495117, -44.160945892333984, -40.87330627441406, -37.585662841796875, -34.29801940917969, -31.010379791259766, -27.722736358642578, -24.435094833374023, -21.14745330810547, -17.859811782836914, -14.572169303894043, -11.284526824951172, -7.996885299682617, -4.7092437744140625, -1.421600341796875, 1.8660411834716797, 5.153682708740234, 8.441324234008789, 11.72896671295166, 15.016609191894531, 18.304250717163086, 21.59189224243164, 24.879535675048828, 28.167177200317383, 31.454818725585938, 34.742462158203125, 38.03010177612305, 41.317745208740234, 44.605384826660156, 47.893028259277344, 51.18067169189453, 54.46831512451172, 57.75595474243164, 61.04359817504883, 64.33123779296875, 67.61888122558594, 70.90652465820312, 74.19416809082031, 77.4818115234375, 80.76944732666016, 84.05709075927734, 87.34473419189453, 90.63237762451172, 93.92001342773438, 97.20765686035156, 100.49530029296875, 103.78294372558594, 107.07058715820312, 110.35823059082031, 113.6458740234375, 116.93351745605469, 120.22116088867188, 123.50879669189453, 126.79644012451172, 130.08407592773438, 133.37171936035156, 136.65936279296875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 7.0, 14.0, 21.0, 23.0, 22.0, 38.0, 23.0, 41.0, 40.0, 46.0, 63.0, 59.0, 66.0, 71.0, 70.0, 42.0, 51.0, 49.0, 54.0, 42.0, 29.0, 30.0, 22.0, 19.0, 13.0, 12.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.11974334716797, -67.11236572265625, -65.10498046875, -63.09760284423828, -61.0902214050293, -59.08283996582031, -57.075462341308594, -55.06808090209961, -53.060699462890625, -51.05331802368164, -49.04594039916992, -47.03855895996094, -45.03117752075195, -43.02379608154297, -41.01641845703125, -39.009037017822266, -37.00165939331055, -34.99427795410156, -32.986900329589844, -30.97951889038086, -28.972137451171875, -26.964757919311523, -24.957378387451172, -22.949996948242188, -20.942617416381836, -18.935237884521484, -16.9278564453125, -14.920476913452148, -12.91309642791748, -10.905715942382812, -8.898336410522461, -6.890955924987793, -4.883579254150391, -2.8761990070343018, -0.8688187599182129, 1.1385612487792969, 3.145941734313965, 5.153322219848633, 7.160701751708984, 9.168082237243652, 11.17546272277832, 13.182843208312988, 15.190223693847656, 17.197603225708008, 19.20498275756836, 21.212364196777344, 23.219743728637695, 25.227123260498047, 27.23450469970703, 29.241884231567383, 31.249265670776367, 33.25664520263672, 35.2640266418457, 37.27140808105469, 39.278785705566406, 41.28616714477539, 43.293548583984375, 45.30093002319336, 47.30830764770508, 49.31568908691406, 51.32307052612305, 53.33045196533203, 55.33782958984375, 57.345211029052734, 59.35258865356445]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 14.0, 21.0, 24.0, 42.0, 52.0, 90.0, 138.0, 182.0, 343.0, 653.0, 1317.0, 3203.0, 9775.0, 41473.0, 537638.0, 3511248.0, 67167.0, 13597.0, 3940.0, 1550.0, 692.0, 397.0, 248.0, 130.0, 87.0, 49.0, 61.0, 30.0, 13.0, 29.0, 13.0, 10.0, 8.0, 13.0, 4.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-32.0625, -30.9619140625, -29.861328125, -28.7607421875, -27.66015625, -26.5595703125, -25.458984375, -24.3583984375, -23.2578125, -22.1572265625, -21.056640625, -19.9560546875, -18.85546875, -17.7548828125, -16.654296875, -15.5537109375, -14.453125, -13.3525390625, -12.251953125, -11.1513671875, -10.05078125, -8.9501953125, -7.849609375, -6.7490234375, -5.6484375, -4.5478515625, -3.447265625, -2.3466796875, -1.24609375, -0.1455078125, 0.955078125, 2.0556640625, 3.15625, 4.2568359375, 5.357421875, 6.4580078125, 7.55859375, 8.6591796875, 9.759765625, 10.8603515625, 11.9609375, 13.0615234375, 14.162109375, 15.2626953125, 16.36328125, 17.4638671875, 18.564453125, 19.6650390625, 20.765625, 21.8662109375, 22.966796875, 24.0673828125, 25.16796875, 26.2685546875, 27.369140625, 28.4697265625, 29.5703125, 30.6708984375, 31.771484375, 32.8720703125, 33.97265625, 35.0732421875, 36.173828125, 37.2744140625, 38.375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 12.0, 15.0, 19.0, 19.0, 32.0, 47.0, 47.0, 53.0, 61.0, 72.0, 73.0, 76.0, 82.0, 66.0, 64.0, 58.0, 56.0, 35.0, 32.0, 16.0, 16.0, 12.0, 8.0, 5.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.50079345703125, -2.4019775390625, -2.30316162109375, -2.204345703125, -2.10552978515625, -2.0067138671875, -1.90789794921875, -1.80908203125, -1.71026611328125, -1.6114501953125, -1.51263427734375, -1.413818359375, -1.31500244140625, -1.2161865234375, -1.11737060546875, -1.0185546875, -0.91973876953125, -0.8209228515625, -0.72210693359375, -0.623291015625, -0.52447509765625, -0.4256591796875, -0.32684326171875, -0.22802734375, -0.12921142578125, -0.0303955078125, 0.06842041015625, 0.167236328125, 0.26605224609375, 0.3648681640625, 0.46368408203125, 0.5625, 0.66131591796875, 0.7601318359375, 0.85894775390625, 0.957763671875, 1.05657958984375, 1.1553955078125, 1.25421142578125, 1.35302734375, 1.45184326171875, 1.5506591796875, 1.64947509765625, 1.748291015625, 1.84710693359375, 1.9459228515625, 2.04473876953125, 2.1435546875, 2.24237060546875, 2.3411865234375, 2.44000244140625, 2.538818359375, 2.63763427734375, 2.7364501953125, 2.83526611328125, 2.93408203125, 3.03289794921875, 3.1317138671875, 3.23052978515625, 3.329345703125, 3.42816162109375, 3.5269775390625, 3.62579345703125, 3.724609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 6.0, 10.0, 11.0, 25.0, 21.0, 41.0, 42.0, 80.0, 88.0, 127.0, 177.0, 292.0, 532.0, 936.0, 1788.0, 3959.0, 10021.0, 32929.0, 144125.0, 2583833.0, 1250510.0, 120739.0, 28459.0, 8825.0, 3380.0, 1503.0, 709.0, 389.0, 223.0, 157.0, 107.0, 75.0, 38.0, 38.0, 20.0, 22.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.8564453125, -18.181640625, -17.5068359375, -16.83203125, -16.1572265625, -15.482421875, -14.8076171875, -14.1328125, -13.4580078125, -12.783203125, -12.1083984375, -11.43359375, -10.7587890625, -10.083984375, -9.4091796875, -8.734375, -8.0595703125, -7.384765625, -6.7099609375, -6.03515625, -5.3603515625, -4.685546875, -4.0107421875, -3.3359375, -2.6611328125, -1.986328125, -1.3115234375, -0.63671875, 0.0380859375, 0.712890625, 1.3876953125, 2.0625, 2.7373046875, 3.412109375, 4.0869140625, 4.76171875, 5.4365234375, 6.111328125, 6.7861328125, 7.4609375, 8.1357421875, 8.810546875, 9.4853515625, 10.16015625, 10.8349609375, 11.509765625, 12.1845703125, 12.859375, 13.5341796875, 14.208984375, 14.8837890625, 15.55859375, 16.2333984375, 16.908203125, 17.5830078125, 18.2578125, 18.9326171875, 19.607421875, 20.2822265625, 20.95703125, 21.6318359375, 22.306640625, 22.9814453125, 23.65625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 17.0, 20.0, 32.0, 50.0, 91.0, 175.0, 399.0, 1880.0, 791.0, 264.0, 139.0, 79.0, 54.0, 28.0, 22.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.21063232421875, -9.9603271484375, -9.71002197265625, -9.459716796875, -9.20941162109375, -8.9591064453125, -8.70880126953125, -8.45849609375, -8.20819091796875, -7.9578857421875, -7.70758056640625, -7.457275390625, -7.20697021484375, -6.9566650390625, -6.70635986328125, -6.4560546875, -6.20574951171875, -5.9554443359375, -5.70513916015625, -5.454833984375, -5.20452880859375, -4.9542236328125, -4.70391845703125, -4.45361328125, -4.20330810546875, -3.9530029296875, -3.70269775390625, -3.452392578125, -3.20208740234375, -2.9517822265625, -2.70147705078125, -2.451171875, -2.20086669921875, -1.9505615234375, -1.70025634765625, -1.449951171875, -1.19964599609375, -0.9493408203125, -0.69903564453125, -0.44873046875, -0.19842529296875, 0.0518798828125, 0.30218505859375, 0.552490234375, 0.80279541015625, 1.0531005859375, 1.30340576171875, 1.5537109375, 1.80401611328125, 2.0543212890625, 2.30462646484375, 2.554931640625, 2.80523681640625, 3.0555419921875, 3.30584716796875, 3.55615234375, 3.80645751953125, 4.0567626953125, 4.30706787109375, 4.557373046875, 4.80767822265625, 5.0579833984375, 5.30828857421875, 5.55859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 2.0, 7.0, 18.0, 11.0, 29.0, 25.0, 43.0, 46.0, 93.0, 100.0, 117.0, 105.0, 97.0, 100.0, 65.0, 47.0, 39.0, 21.0, 11.0, 11.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.752973556518555, -27.701313018798828, -26.649654388427734, -25.597993850708008, -24.54633331298828, -23.494674682617188, -22.44301414489746, -21.391353607177734, -20.33969497680664, -19.288034439086914, -18.23637580871582, -17.184715270996094, -16.133054733276367, -15.081395149230957, -14.029735565185547, -12.97807502746582, -11.926414489746094, -10.874754905700684, -9.823094367980957, -8.771434783935547, -7.7197747230529785, -6.66811466217041, -5.616455078125, -4.564795017242432, -3.5131349563598633, -2.461474895477295, -1.4098150730133057, -0.3581552505493164, 0.693504810333252, 1.7451648712158203, 2.7968244552612305, 3.848484516143799, 4.900142669677734, 5.951802730560303, 7.003462791442871, 8.055122375488281, 9.106782913208008, 10.158442497253418, 11.210102081298828, 12.261762619018555, 13.313422203063965, 14.365081787109375, 15.416742324829102, 16.468402862548828, 17.520061492919922, 18.57172203063965, 19.623382568359375, 20.67504119873047, 21.726701736450195, 22.778362274169922, 23.830020904541016, 24.881681442260742, 25.93334197998047, 26.985000610351562, 28.03666114807129, 29.088321685791016, 30.13998031616211, 31.191640853881836, 32.24330139160156, 33.294960021972656, 34.34661865234375, 35.39828109741211, 36.4499397277832, 37.5015983581543, 38.553260803222656]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 14.0, 5.0, 12.0, 8.0, 14.0, 11.0, 12.0, 13.0, 10.0, 12.0, 20.0, 22.0, 16.0, 34.0, 36.0, 23.0, 18.0, 33.0, 40.0, 26.0, 33.0, 54.0, 41.0, 37.0, 30.0, 42.0, 38.0, 30.0, 31.0, 29.0, 30.0, 23.0, 31.0, 41.0, 15.0, 16.0, 16.0, 16.0, 12.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.96296501159668, -15.47378921508789, -14.984614372253418, -14.495438575744629, -14.00626277923584, -13.517087936401367, -13.027912139892578, -12.538736343383789, -12.049560546875, -11.560384750366211, -11.071209907531738, -10.58203411102295, -10.09285831451416, -9.603683471679688, -9.114507675170898, -8.62533187866211, -8.136157035827637, -7.646981716156006, -7.157805919647217, -6.668630599975586, -6.179454803466797, -5.690279483795166, -5.201104164123535, -4.711928367614746, -4.222753047943115, -3.7335774898529053, -3.2444019317626953, -2.7552266120910645, -2.2660510540008545, -1.7768754959106445, -1.2877001762390137, -0.7985246181488037, -0.30934810638427734, 0.17982739210128784, 0.669002890586853, 1.1581783294677734, 1.6473538875579834, 2.1365294456481934, 2.625704765319824, 3.114880323410034, 3.604055881500244, 4.093231201171875, 4.582406997680664, 5.071582317352295, 5.560757637023926, 6.049933433532715, 6.539108753204346, 7.028284072875977, 7.517459869384766, 8.006635665893555, 8.495810508728027, 8.984986305236816, 9.474162101745605, 9.963336944580078, 10.452512741088867, 10.941688537597656, 11.430864334106445, 11.920040130615234, 12.409214973449707, 12.898390769958496, 13.387566566467285, 13.876741409301758, 14.365917205810547, 14.855093002319336, 15.344267845153809]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 13.0, 14.0, 24.0, 29.0, 29.0, 40.0, 48.0, 53.0, 97.0, 137.0, 221.0, 329.0, 596.0, 1049.0, 2310.0, 5913.0, 18109.0, 67582.0, 271669.0, 469183.0, 153685.0, 38502.0, 11209.0, 3882.0, 1663.0, 803.0, 439.0, 285.0, 205.0, 117.0, 83.0, 52.0, 41.0, 33.0, 33.0, 22.0, 14.0, 7.0, 7.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.056640625, -19.39453125, -18.732421875, -18.0703125, -17.408203125, -16.74609375, -16.083984375, -15.421875, -14.759765625, -14.09765625, -13.435546875, -12.7734375, -12.111328125, -11.44921875, -10.787109375, -10.125, -9.462890625, -8.80078125, -8.138671875, -7.4765625, -6.814453125, -6.15234375, -5.490234375, -4.828125, -4.166015625, -3.50390625, -2.841796875, -2.1796875, -1.517578125, -0.85546875, -0.193359375, 0.46875, 1.130859375, 1.79296875, 2.455078125, 3.1171875, 3.779296875, 4.44140625, 5.103515625, 5.765625, 6.427734375, 7.08984375, 7.751953125, 8.4140625, 9.076171875, 9.73828125, 10.400390625, 11.0625, 11.724609375, 12.38671875, 13.048828125, 13.7109375, 14.373046875, 15.03515625, 15.697265625, 16.359375, 17.021484375, 17.68359375, 18.345703125, 19.0078125, 19.669921875, 20.33203125, 20.994140625, 21.65625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 19.0, 19.0, 19.0, 41.0, 51.0, 51.0, 47.0, 71.0, 89.0, 83.0, 86.0, 79.0, 72.0, 78.0, 46.0, 35.0, 35.0, 24.0, 19.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.330078125, -3.21856689453125, -3.1070556640625, -2.99554443359375, -2.884033203125, -2.77252197265625, -2.6610107421875, -2.54949951171875, -2.43798828125, -2.32647705078125, -2.2149658203125, -2.10345458984375, -1.991943359375, -1.88043212890625, -1.7689208984375, -1.65740966796875, -1.5458984375, -1.43438720703125, -1.3228759765625, -1.21136474609375, -1.099853515625, -0.98834228515625, -0.8768310546875, -0.76531982421875, -0.65380859375, -0.54229736328125, -0.4307861328125, -0.31927490234375, -0.207763671875, -0.09625244140625, 0.0152587890625, 0.12677001953125, 0.23828125, 0.34979248046875, 0.4613037109375, 0.57281494140625, 0.684326171875, 0.79583740234375, 0.9073486328125, 1.01885986328125, 1.13037109375, 1.24188232421875, 1.3533935546875, 1.46490478515625, 1.576416015625, 1.68792724609375, 1.7994384765625, 1.91094970703125, 2.0224609375, 2.13397216796875, 2.2454833984375, 2.35699462890625, 2.468505859375, 2.58001708984375, 2.6915283203125, 2.80303955078125, 2.91455078125, 3.02606201171875, 3.1375732421875, 3.24908447265625, 3.360595703125, 3.47210693359375, 3.5836181640625, 3.69512939453125, 3.806640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 12.0, 11.0, 11.0, 19.0, 33.0, 42.0, 60.0, 68.0, 111.0, 167.0, 232.0, 338.0, 482.0, 760.0, 1352.0, 2387.0, 4731.0, 9774.0, 22522.0, 52419.0, 122348.0, 246607.0, 291300.0, 161688.0, 73082.0, 30936.0, 13238.0, 6180.0, 3110.0, 1647.0, 1010.0, 647.0, 399.0, 254.0, 153.0, 105.0, 81.0, 72.0, 42.0, 39.0, 23.0, 18.0, 9.0, 5.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-9.421875, -9.129150390625, -8.83642578125, -8.543701171875, -8.2509765625, -7.958251953125, -7.66552734375, -7.372802734375, -7.080078125, -6.787353515625, -6.49462890625, -6.201904296875, -5.9091796875, -5.616455078125, -5.32373046875, -5.031005859375, -4.73828125, -4.445556640625, -4.15283203125, -3.860107421875, -3.5673828125, -3.274658203125, -2.98193359375, -2.689208984375, -2.396484375, -2.103759765625, -1.81103515625, -1.518310546875, -1.2255859375, -0.932861328125, -0.64013671875, -0.347412109375, -0.0546875, 0.238037109375, 0.53076171875, 0.823486328125, 1.1162109375, 1.408935546875, 1.70166015625, 1.994384765625, 2.287109375, 2.579833984375, 2.87255859375, 3.165283203125, 3.4580078125, 3.750732421875, 4.04345703125, 4.336181640625, 4.62890625, 4.921630859375, 5.21435546875, 5.507080078125, 5.7998046875, 6.092529296875, 6.38525390625, 6.677978515625, 6.970703125, 7.263427734375, 7.55615234375, 7.848876953125, 8.1416015625, 8.434326171875, 8.72705078125, 9.019775390625, 9.3125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 10.0, 9.0, 9.0, 7.0, 10.0, 9.0, 12.0, 22.0, 21.0, 22.0, 25.0, 27.0, 41.0, 36.0, 38.0, 35.0, 46.0, 35.0, 40.0, 47.0, 39.0, 47.0, 39.0, 36.0, 33.0, 37.0, 38.0, 35.0, 26.0, 30.0, 20.0, 20.0, 15.0, 14.0, 13.0, 14.0, 12.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.4453125, -8.185791015625, -7.92626953125, -7.666748046875, -7.4072265625, -7.147705078125, -6.88818359375, -6.628662109375, -6.369140625, -6.109619140625, -5.85009765625, -5.590576171875, -5.3310546875, -5.071533203125, -4.81201171875, -4.552490234375, -4.29296875, -4.033447265625, -3.77392578125, -3.514404296875, -3.2548828125, -2.995361328125, -2.73583984375, -2.476318359375, -2.216796875, -1.957275390625, -1.69775390625, -1.438232421875, -1.1787109375, -0.919189453125, -0.65966796875, -0.400146484375, -0.140625, 0.118896484375, 0.37841796875, 0.637939453125, 0.8974609375, 1.156982421875, 1.41650390625, 1.676025390625, 1.935546875, 2.195068359375, 2.45458984375, 2.714111328125, 2.9736328125, 3.233154296875, 3.49267578125, 3.752197265625, 4.01171875, 4.271240234375, 4.53076171875, 4.790283203125, 5.0498046875, 5.309326171875, 5.56884765625, 5.828369140625, 6.087890625, 6.347412109375, 6.60693359375, 6.866455078125, 7.1259765625, 7.385498046875, 7.64501953125, 7.904541015625, 8.1640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 11.0, 9.0, 14.0, 16.0, 29.0, 45.0, 74.0, 67.0, 158.0, 216.0, 449.0, 874.0, 2170.0, 6025.0, 20871.0, 83151.0, 336391.0, 430040.0, 124660.0, 29780.0, 8454.0, 2808.0, 1081.0, 471.0, 282.0, 144.0, 89.0, 61.0, 32.0, 26.0, 25.0, 11.0, 9.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.6015625, -8.38177490234375, -8.1619873046875, -7.94219970703125, -7.722412109375, -7.50262451171875, -7.2828369140625, -7.06304931640625, -6.84326171875, -6.62347412109375, -6.4036865234375, -6.18389892578125, -5.964111328125, -5.74432373046875, -5.5245361328125, -5.30474853515625, -5.0849609375, -4.86517333984375, -4.6453857421875, -4.42559814453125, -4.205810546875, -3.98602294921875, -3.7662353515625, -3.54644775390625, -3.32666015625, -3.10687255859375, -2.8870849609375, -2.66729736328125, -2.447509765625, -2.22772216796875, -2.0079345703125, -1.78814697265625, -1.568359375, -1.34857177734375, -1.1287841796875, -0.90899658203125, -0.689208984375, -0.46942138671875, -0.2496337890625, -0.02984619140625, 0.18994140625, 0.40972900390625, 0.6295166015625, 0.84930419921875, 1.069091796875, 1.28887939453125, 1.5086669921875, 1.72845458984375, 1.9482421875, 2.16802978515625, 2.3878173828125, 2.60760498046875, 2.827392578125, 3.04718017578125, 3.2669677734375, 3.48675537109375, 3.70654296875, 3.92633056640625, 4.1461181640625, 4.36590576171875, 4.585693359375, 4.80548095703125, 5.0252685546875, 5.24505615234375, 5.46484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 8.0, 12.0, 8.0, 25.0, 29.0, 25.0, 33.0, 35.0, 42.0, 64.0, 68.0, 91.0, 88.0, 92.0, 66.0, 65.0, 51.0, 33.0, 25.0, 20.0, 17.0, 15.0, 7.0, 12.0, 7.0, 2.0, 12.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007719993591308594, -0.0007464438676834106, -0.0007208883762359619, -0.0006953328847885132, -0.0006697773933410645, -0.0006442219018936157, -0.000618666410446167, -0.0005931109189987183, -0.0005675554275512695, -0.0005419999361038208, -0.0005164444446563721, -0.0004908889532089233, -0.0004653334617614746, -0.0004397779703140259, -0.00041422247886657715, -0.0003886669874191284, -0.0003631114959716797, -0.00033755600452423096, -0.0003120005130767822, -0.0002864450216293335, -0.00026088953018188477, -0.00023533403873443604, -0.0002097785472869873, -0.00018422305583953857, -0.00015866756439208984, -0.0001331120729446411, -0.00010755658149719238, -8.200109004974365e-05, -5.644559860229492e-05, -3.089010715484619e-05, -5.334615707397461e-06, 2.022087574005127e-05, 4.57763671875e-05, 7.133185863494873e-05, 9.688735008239746e-05, 0.0001224428415298462, 0.00014799833297729492, 0.00017355382442474365, 0.00019910931587219238, 0.0002246648073196411, 0.00025022029876708984, 0.0002757757902145386, 0.0003013312816619873, 0.00032688677310943604, 0.00035244226455688477, 0.0003779977560043335, 0.0004035532474517822, 0.00042910873889923096, 0.0004546642303466797, 0.0004802197217941284, 0.0005057752132415771, 0.0005313307046890259, 0.0005568861961364746, 0.0005824416875839233, 0.0006079971790313721, 0.0006335526704788208, 0.0006591081619262695, 0.0006846636533737183, 0.000710219144821167, 0.0007357746362686157, 0.0007613301277160645, 0.0007868856191635132, 0.0008124411106109619, 0.0008379966020584106, 0.0008635520935058594]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 17.0, 28.0, 31.0, 58.0, 80.0, 119.0, 221.0, 439.0, 868.0, 1743.0, 3902.0, 10818.0, 36629.0, 139531.0, 434858.0, 304301.0, 80124.0, 22091.0, 7180.0, 2800.0, 1266.0, 635.0, 327.0, 167.0, 102.0, 65.0, 49.0, 27.0, 21.0, 15.0, 9.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.08856201171875, -6.8724365234375, -6.65631103515625, -6.440185546875, -6.22406005859375, -6.0079345703125, -5.79180908203125, -5.57568359375, -5.35955810546875, -5.1434326171875, -4.92730712890625, -4.711181640625, -4.49505615234375, -4.2789306640625, -4.06280517578125, -3.8466796875, -3.63055419921875, -3.4144287109375, -3.19830322265625, -2.982177734375, -2.76605224609375, -2.5499267578125, -2.33380126953125, -2.11767578125, -1.90155029296875, -1.6854248046875, -1.46929931640625, -1.253173828125, -1.03704833984375, -0.8209228515625, -0.60479736328125, -0.388671875, -0.17254638671875, 0.0435791015625, 0.25970458984375, 0.475830078125, 0.69195556640625, 0.9080810546875, 1.12420654296875, 1.34033203125, 1.55645751953125, 1.7725830078125, 1.98870849609375, 2.204833984375, 2.42095947265625, 2.6370849609375, 2.85321044921875, 3.0693359375, 3.28546142578125, 3.5015869140625, 3.71771240234375, 3.933837890625, 4.14996337890625, 4.3660888671875, 4.58221435546875, 4.79833984375, 5.01446533203125, 5.2305908203125, 5.44671630859375, 5.662841796875, 5.87896728515625, 6.0950927734375, 6.31121826171875, 6.52734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 8.0, 16.0, 11.0, 14.0, 14.0, 21.0, 33.0, 21.0, 31.0, 38.0, 48.0, 33.0, 52.0, 59.0, 35.0, 69.0, 61.0, 64.0, 48.0, 41.0, 32.0, 37.0, 40.0, 26.0, 23.0, 18.0, 22.0, 12.0, 8.0, 7.0, 8.0, 9.0, 2.0, 6.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.470703125, -3.369415283203125, -3.26812744140625, -3.166839599609375, -3.0655517578125, -2.964263916015625, -2.86297607421875, -2.761688232421875, -2.660400390625, -2.559112548828125, -2.45782470703125, -2.356536865234375, -2.2552490234375, -2.153961181640625, -2.05267333984375, -1.951385498046875, -1.85009765625, -1.748809814453125, -1.64752197265625, -1.546234130859375, -1.4449462890625, -1.343658447265625, -1.24237060546875, -1.141082763671875, -1.039794921875, -0.938507080078125, -0.83721923828125, -0.735931396484375, -0.6346435546875, -0.533355712890625, -0.43206787109375, -0.330780029296875, -0.2294921875, -0.128204345703125, -0.02691650390625, 0.074371337890625, 0.1756591796875, 0.276947021484375, 0.37823486328125, 0.479522705078125, 0.580810546875, 0.682098388671875, 0.78338623046875, 0.884674072265625, 0.9859619140625, 1.087249755859375, 1.18853759765625, 1.289825439453125, 1.39111328125, 1.492401123046875, 1.59368896484375, 1.694976806640625, 1.7962646484375, 1.897552490234375, 1.99884033203125, 2.100128173828125, 2.201416015625, 2.302703857421875, 2.40399169921875, 2.505279541015625, 2.6065673828125, 2.707855224609375, 2.80914306640625, 2.910430908203125, 3.01171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 31.0, 47.0, 56.0, 63.0, 106.0, 114.0, 109.0, 107.0, 93.0, 77.0, 51.0, 31.0, 17.0, 17.0, 13.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.70713806152344, -79.26144409179688, -76.81575012207031, -74.37005615234375, -71.92436218261719, -69.47866821289062, -67.03297424316406, -64.5872802734375, -62.14158248901367, -59.69588851928711, -57.25019454956055, -54.804500579833984, -52.358802795410156, -49.913108825683594, -47.46741485595703, -45.02172088623047, -42.576026916503906, -40.130332946777344, -37.68463897705078, -35.23894500732422, -32.793251037597656, -30.34755516052246, -27.901859283447266, -25.456165313720703, -23.01047134399414, -20.564777374267578, -18.119083404541016, -15.67338752746582, -13.227693557739258, -10.781999588012695, -8.336304664611816, -5.8906097412109375, -3.444915771484375, -0.9992213249206543, 1.4464731216430664, 3.892167568206787, 6.337862014770508, 8.78355598449707, 11.22925090789795, 13.674945831298828, 16.12063980102539, 18.566333770751953, 21.012027740478516, 23.45772361755371, 25.903417587280273, 28.349111557006836, 30.79480743408203, 33.240501403808594, 35.686195373535156, 38.13188934326172, 40.57758331298828, 43.023277282714844, 45.468971252441406, 47.91466522216797, 50.3603630065918, 52.80605697631836, 55.25175094604492, 57.697444915771484, 60.14313888549805, 62.58883285522461, 65.03453063964844, 67.480224609375, 69.92591857910156, 72.37161254882812, 74.81730651855469]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 3.0, 7.0, 10.0, 13.0, 15.0, 17.0, 17.0, 24.0, 29.0, 26.0, 39.0, 39.0, 46.0, 45.0, 42.0, 46.0, 46.0, 52.0, 49.0, 44.0, 41.0, 36.0, 41.0, 34.0, 47.0, 27.0, 22.0, 16.0, 16.0, 21.0, 18.0, 12.0, 18.0, 11.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-59.153602600097656, -57.57966613769531, -56.00572967529297, -54.431793212890625, -52.85785675048828, -51.2839241027832, -49.70998764038086, -48.136051177978516, -46.56211471557617, -44.98817825317383, -43.414241790771484, -41.84030532836914, -40.26637268066406, -38.69243621826172, -37.118499755859375, -35.54456329345703, -33.97062683105469, -32.396690368652344, -30.82275390625, -29.24881935119629, -27.674882888793945, -26.1009464263916, -24.52701187133789, -22.953075408935547, -21.379138946533203, -19.80520248413086, -18.231266021728516, -16.657331466674805, -15.083395004272461, -13.509458541870117, -11.93552303314209, -10.361587524414062, -8.787651062011719, -7.213715076446533, -5.639779090881348, -4.065843105316162, -2.4919071197509766, -0.917971134185791, 0.6559648513793945, 2.229900360107422, 3.8038368225097656, 5.377772808074951, 6.951708793640137, 8.525644302368164, 10.099580764770508, 11.673517227172852, 13.247452735900879, 14.821388244628906, 16.39532470703125, 17.969261169433594, 19.543197631835938, 21.11713218688965, 22.691068649291992, 24.265005111694336, 25.838939666748047, 27.41287612915039, 28.986812591552734, 30.560749053955078, 32.13468551635742, 33.708621978759766, 35.282554626464844, 36.85649108886719, 38.43042755126953, 40.004364013671875, 41.57830047607422]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 9.0, 20.0, 16.0, 31.0, 52.0, 72.0, 137.0, 256.0, 557.0, 1218.0, 2986.0, 10728.0, 63543.0, 3406484.0, 657788.0, 38821.0, 7337.0, 2242.0, 918.0, 379.0, 215.0, 164.0, 84.0, 57.0, 42.0, 28.0, 16.0, 24.0, 15.0, 11.0, 2.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.984375, -28.728759765625, -27.47314453125, -26.217529296875, -24.9619140625, -23.706298828125, -22.45068359375, -21.195068359375, -19.939453125, -18.683837890625, -17.42822265625, -16.172607421875, -14.9169921875, -13.661376953125, -12.40576171875, -11.150146484375, -9.89453125, -8.638916015625, -7.38330078125, -6.127685546875, -4.8720703125, -3.616455078125, -2.36083984375, -1.105224609375, 0.150390625, 1.406005859375, 2.66162109375, 3.917236328125, 5.1728515625, 6.428466796875, 7.68408203125, 8.939697265625, 10.1953125, 11.450927734375, 12.70654296875, 13.962158203125, 15.2177734375, 16.473388671875, 17.72900390625, 18.984619140625, 20.240234375, 21.495849609375, 22.75146484375, 24.007080078125, 25.2626953125, 26.518310546875, 27.77392578125, 29.029541015625, 30.28515625, 31.540771484375, 32.79638671875, 34.052001953125, 35.3076171875, 36.563232421875, 37.81884765625, 39.074462890625, 40.330078125, 41.585693359375, 42.84130859375, 44.096923828125, 45.3525390625, 46.608154296875, 47.86376953125, 49.119384765625, 50.375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 5.0, 17.0, 20.0, 31.0, 30.0, 37.0, 54.0, 60.0, 69.0, 78.0, 76.0, 86.0, 80.0, 75.0, 55.0, 56.0, 35.0, 33.0, 25.0, 26.0, 13.0, 8.0, 12.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.958984375, -2.857086181640625, -2.75518798828125, -2.653289794921875, -2.5513916015625, -2.449493408203125, -2.34759521484375, -2.245697021484375, -2.143798828125, -2.041900634765625, -1.94000244140625, -1.838104248046875, -1.7362060546875, -1.634307861328125, -1.53240966796875, -1.430511474609375, -1.32861328125, -1.226715087890625, -1.12481689453125, -1.022918701171875, -0.9210205078125, -0.819122314453125, -0.71722412109375, -0.615325927734375, -0.513427734375, -0.411529541015625, -0.30963134765625, -0.207733154296875, -0.1058349609375, -0.003936767578125, 0.09796142578125, 0.199859619140625, 0.3017578125, 0.403656005859375, 0.50555419921875, 0.607452392578125, 0.7093505859375, 0.811248779296875, 0.91314697265625, 1.015045166015625, 1.116943359375, 1.218841552734375, 1.32073974609375, 1.422637939453125, 1.5245361328125, 1.626434326171875, 1.72833251953125, 1.830230712890625, 1.93212890625, 2.034027099609375, 2.13592529296875, 2.237823486328125, 2.3397216796875, 2.441619873046875, 2.54351806640625, 2.645416259765625, 2.747314453125, 2.849212646484375, 2.95111083984375, 3.053009033203125, 3.1549072265625, 3.256805419921875, 3.35870361328125, 3.460601806640625, 3.5625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 12.0, 16.0, 24.0, 42.0, 50.0, 93.0, 127.0, 213.0, 327.0, 661.0, 1194.0, 2791.0, 8953.0, 58016.0, 3097091.0, 976754.0, 35987.0, 6850.0, 2478.0, 1124.0, 601.0, 343.0, 206.0, 120.0, 66.0, 44.0, 29.0, 19.0, 16.0, 11.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.90625, -36.71826171875, -35.5302734375, -34.34228515625, -33.154296875, -31.96630859375, -30.7783203125, -29.59033203125, -28.40234375, -27.21435546875, -26.0263671875, -24.83837890625, -23.650390625, -22.46240234375, -21.2744140625, -20.08642578125, -18.8984375, -17.71044921875, -16.5224609375, -15.33447265625, -14.146484375, -12.95849609375, -11.7705078125, -10.58251953125, -9.39453125, -8.20654296875, -7.0185546875, -5.83056640625, -4.642578125, -3.45458984375, -2.2666015625, -1.07861328125, 0.109375, 1.29736328125, 2.4853515625, 3.67333984375, 4.861328125, 6.04931640625, 7.2373046875, 8.42529296875, 9.61328125, 10.80126953125, 11.9892578125, 13.17724609375, 14.365234375, 15.55322265625, 16.7412109375, 17.92919921875, 19.1171875, 20.30517578125, 21.4931640625, 22.68115234375, 23.869140625, 25.05712890625, 26.2451171875, 27.43310546875, 28.62109375, 29.80908203125, 30.9970703125, 32.18505859375, 33.373046875, 34.56103515625, 35.7490234375, 36.93701171875, 38.125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 13.0, 23.0, 49.0, 81.0, 191.0, 508.0, 2026.0, 737.0, 242.0, 92.0, 47.0, 16.0, 15.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.3802490234375, -11.932373046875, -11.4844970703125, -11.03662109375, -10.5887451171875, -10.140869140625, -9.6929931640625, -9.2451171875, -8.7972412109375, -8.349365234375, -7.9014892578125, -7.45361328125, -7.0057373046875, -6.557861328125, -6.1099853515625, -5.662109375, -5.2142333984375, -4.766357421875, -4.3184814453125, -3.87060546875, -3.4227294921875, -2.974853515625, -2.5269775390625, -2.0791015625, -1.6312255859375, -1.183349609375, -0.7354736328125, -0.28759765625, 0.1602783203125, 0.608154296875, 1.0560302734375, 1.50390625, 1.9517822265625, 2.399658203125, 2.8475341796875, 3.29541015625, 3.7432861328125, 4.191162109375, 4.6390380859375, 5.0869140625, 5.5347900390625, 5.982666015625, 6.4305419921875, 6.87841796875, 7.3262939453125, 7.774169921875, 8.2220458984375, 8.669921875, 9.1177978515625, 9.565673828125, 10.0135498046875, 10.46142578125, 10.9093017578125, 11.357177734375, 11.8050537109375, 12.2529296875, 12.7008056640625, 13.148681640625, 13.5965576171875, 14.04443359375, 14.4923095703125, 14.940185546875, 15.3880615234375, 15.8359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 15.0, 37.0, 63.0, 97.0, 172.0, 220.0, 158.0, 117.0, 59.0, 28.0, 15.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.96316528320312, -104.12205505371094, -101.28095245361328, -98.43984985351562, -95.59873962402344, -92.75762939453125, -89.9165267944336, -87.07542419433594, -84.23431396484375, -81.39320373535156, -78.5521011352539, -75.71099853515625, -72.86988830566406, -70.02877807617188, -67.18767547607422, -64.34657287597656, -61.505462646484375, -58.66435623168945, -55.82324981689453, -52.98214340209961, -50.14103698730469, -47.299930572509766, -44.458824157714844, -41.61771774291992, -38.776611328125, -35.93550491333008, -33.094398498535156, -30.253292083740234, -27.412185668945312, -24.57107925415039, -21.72997283935547, -18.888866424560547, -16.047767639160156, -13.206661224365234, -10.365554809570312, -7.524448394775391, -4.683341979980469, -1.8422355651855469, 0.998870849609375, 3.839977264404297, 6.681083679199219, 9.52219009399414, 12.363296508789062, 15.204402923583984, 18.045509338378906, 20.886615753173828, 23.72772216796875, 26.568828582763672, 29.409934997558594, 32.251041412353516, 35.09214782714844, 37.93325424194336, 40.77436065673828, 43.6154670715332, 46.456573486328125, 49.29767990112305, 52.13878631591797, 54.97989273071289, 57.82099914550781, 60.662105560302734, 63.503211975097656, 66.34431457519531, 69.1854248046875, 72.02653503417969, 74.86763763427734]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 10.0, 18.0, 36.0, 31.0, 48.0, 73.0, 66.0, 69.0, 88.0, 97.0, 71.0, 86.0, 83.0, 67.0, 47.0, 30.0, 38.0, 15.0, 13.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.20011901855469, -30.490598678588867, -28.781078338623047, -27.07155990600586, -25.36203956604004, -23.65251922607422, -21.9429988861084, -20.233478546142578, -18.52396011352539, -16.81443977355957, -15.104920387268066, -13.395400047302246, -11.685880661010742, -9.976360321044922, -8.266839981079102, -6.557320594787598, -4.847799301147461, -3.138279438018799, -1.4287593364715576, 0.2807607650756836, 1.9902806282043457, 3.699800491333008, 5.409320831298828, 7.118840217590332, 8.828360557556152, 10.537880897521973, 12.247400283813477, 13.956920623779297, 15.666440963745117, 17.375961303710938, 19.085479736328125, 20.795000076293945, 22.504520416259766, 24.214040756225586, 25.923561096191406, 27.633079528808594, 29.342599868774414, 31.052120208740234, 32.76164245605469, 34.471160888671875, 36.18067932128906, 37.89019775390625, 39.5997200012207, 41.30923843383789, 43.018760681152344, 44.72827911376953, 46.43779754638672, 48.14731979370117, 49.856842041015625, 51.56636047363281, 53.275882720947266, 54.98540115356445, 56.694923400878906, 58.404441833496094, 60.11396026611328, 61.823482513427734, 63.53300094604492, 65.24252319335938, 66.95204162597656, 68.66156005859375, 70.37107849121094, 72.08059692382812, 73.79012298583984, 75.49964141845703, 77.20915985107422]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 15.0, 25.0, 21.0, 41.0, 59.0, 114.0, 212.0, 425.0, 973.0, 3205.0, 30011.0, 741554.0, 256363.0, 12023.0, 2043.0, 745.0, 311.0, 168.0, 87.0, 58.0, 34.0, 23.0, 13.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.6875, -65.01318359375, -63.3388671875, -61.66455078125, -59.990234375, -58.31591796875, -56.6416015625, -54.96728515625, -53.29296875, -51.61865234375, -49.9443359375, -48.27001953125, -46.595703125, -44.92138671875, -43.2470703125, -41.57275390625, -39.8984375, -38.22412109375, -36.5498046875, -34.87548828125, -33.201171875, -31.52685546875, -29.8525390625, -28.17822265625, -26.50390625, -24.82958984375, -23.1552734375, -21.48095703125, -19.806640625, -18.13232421875, -16.4580078125, -14.78369140625, -13.109375, -11.43505859375, -9.7607421875, -8.08642578125, -6.412109375, -4.73779296875, -3.0634765625, -1.38916015625, 0.28515625, 1.95947265625, 3.6337890625, 5.30810546875, 6.982421875, 8.65673828125, 10.3310546875, 12.00537109375, 13.6796875, 15.35400390625, 17.0283203125, 18.70263671875, 20.376953125, 22.05126953125, 23.7255859375, 25.39990234375, 27.07421875, 28.74853515625, 30.4228515625, 32.09716796875, 33.771484375, 35.44580078125, 37.1201171875, 38.79443359375, 40.46875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 13.0, 22.0, 30.0, 53.0, 67.0, 78.0, 114.0, 124.0, 134.0, 96.0, 75.0, 64.0, 46.0, 32.0, 22.0, 12.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.0904541015625, -2.934814453125, -2.7791748046875, -2.62353515625, -2.4678955078125, -2.312255859375, -2.1566162109375, -2.0009765625, -1.8453369140625, -1.689697265625, -1.5340576171875, -1.37841796875, -1.2227783203125, -1.067138671875, -0.9114990234375, -0.755859375, -0.6002197265625, -0.444580078125, -0.2889404296875, -0.13330078125, 0.0223388671875, 0.177978515625, 0.3336181640625, 0.4892578125, 0.6448974609375, 0.800537109375, 0.9561767578125, 1.11181640625, 1.2674560546875, 1.423095703125, 1.5787353515625, 1.734375, 1.8900146484375, 2.045654296875, 2.2012939453125, 2.35693359375, 2.5125732421875, 2.668212890625, 2.8238525390625, 2.9794921875, 3.1351318359375, 3.290771484375, 3.4464111328125, 3.60205078125, 3.7576904296875, 3.913330078125, 4.0689697265625, 4.224609375, 4.3802490234375, 4.535888671875, 4.6915283203125, 4.84716796875, 5.0028076171875, 5.158447265625, 5.3140869140625, 5.4697265625, 5.6253662109375, 5.781005859375, 5.9366455078125, 6.09228515625, 6.2479248046875, 6.403564453125, 6.5592041015625, 6.71484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 8.0, 4.0, 7.0, 12.0, 21.0, 14.0, 38.0, 52.0, 76.0, 125.0, 190.0, 302.0, 471.0, 879.0, 1545.0, 2941.0, 6225.0, 13440.0, 30479.0, 70720.0, 167880.0, 357604.0, 226558.0, 94085.0, 40650.0, 18049.0, 7946.0, 3707.0, 1914.0, 1022.0, 585.0, 326.0, 234.0, 171.0, 82.0, 55.0, 41.0, 35.0, 18.0, 13.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.8189697265625, -7.536376953125, -7.2537841796875, -6.97119140625, -6.6885986328125, -6.406005859375, -6.1234130859375, -5.8408203125, -5.5582275390625, -5.275634765625, -4.9930419921875, -4.71044921875, -4.4278564453125, -4.145263671875, -3.8626708984375, -3.580078125, -3.2974853515625, -3.014892578125, -2.7322998046875, -2.44970703125, -2.1671142578125, -1.884521484375, -1.6019287109375, -1.3193359375, -1.0367431640625, -0.754150390625, -0.4715576171875, -0.18896484375, 0.0936279296875, 0.376220703125, 0.6588134765625, 0.94140625, 1.2239990234375, 1.506591796875, 1.7891845703125, 2.07177734375, 2.3543701171875, 2.636962890625, 2.9195556640625, 3.2021484375, 3.4847412109375, 3.767333984375, 4.0499267578125, 4.33251953125, 4.6151123046875, 4.897705078125, 5.1802978515625, 5.462890625, 5.7454833984375, 6.028076171875, 6.3106689453125, 6.59326171875, 6.8758544921875, 7.158447265625, 7.4410400390625, 7.7236328125, 8.0062255859375, 8.288818359375, 8.5714111328125, 8.85400390625, 9.1365966796875, 9.419189453125, 9.7017822265625, 9.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 9.0, 10.0, 8.0, 12.0, 24.0, 26.0, 24.0, 22.0, 40.0, 44.0, 47.0, 48.0, 44.0, 45.0, 43.0, 55.0, 49.0, 48.0, 57.0, 49.0, 47.0, 45.0, 36.0, 35.0, 20.0, 26.0, 17.0, 17.0, 15.0, 7.0, 8.0, 4.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.34765625, -10.03125, -9.71484375, -9.3984375, -9.08203125, -8.765625, -8.44921875, -8.1328125, -7.81640625, -7.5, -7.18359375, -6.8671875, -6.55078125, -6.234375, -5.91796875, -5.6015625, -5.28515625, -4.96875, -4.65234375, -4.3359375, -4.01953125, -3.703125, -3.38671875, -3.0703125, -2.75390625, -2.4375, -2.12109375, -1.8046875, -1.48828125, -1.171875, -0.85546875, -0.5390625, -0.22265625, 0.09375, 0.41015625, 0.7265625, 1.04296875, 1.359375, 1.67578125, 1.9921875, 2.30859375, 2.625, 2.94140625, 3.2578125, 3.57421875, 3.890625, 4.20703125, 4.5234375, 4.83984375, 5.15625, 5.47265625, 5.7890625, 6.10546875, 6.421875, 6.73828125, 7.0546875, 7.37109375, 7.6875, 8.00390625, 8.3203125, 8.63671875, 8.953125, 9.26953125, 9.5859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 12.0, 9.0, 21.0, 24.0, 31.0, 48.0, 75.0, 111.0, 194.0, 326.0, 565.0, 945.0, 1996.0, 4202.0, 9942.0, 26958.0, 84111.0, 283441.0, 426617.0, 139135.0, 43043.0, 15067.0, 5907.0, 2652.0, 1343.0, 693.0, 395.0, 232.0, 152.0, 90.0, 62.0, 49.0, 25.0, 15.0, 10.0, 6.0, 10.0, 6.0, 7.0, 0.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.30126953125, -5.1064453125, -4.91162109375, -4.716796875, -4.52197265625, -4.3271484375, -4.13232421875, -3.9375, -3.74267578125, -3.5478515625, -3.35302734375, -3.158203125, -2.96337890625, -2.7685546875, -2.57373046875, -2.37890625, -2.18408203125, -1.9892578125, -1.79443359375, -1.599609375, -1.40478515625, -1.2099609375, -1.01513671875, -0.8203125, -0.62548828125, -0.4306640625, -0.23583984375, -0.041015625, 0.15380859375, 0.3486328125, 0.54345703125, 0.73828125, 0.93310546875, 1.1279296875, 1.32275390625, 1.517578125, 1.71240234375, 1.9072265625, 2.10205078125, 2.296875, 2.49169921875, 2.6865234375, 2.88134765625, 3.076171875, 3.27099609375, 3.4658203125, 3.66064453125, 3.85546875, 4.05029296875, 4.2451171875, 4.43994140625, 4.634765625, 4.82958984375, 5.0244140625, 5.21923828125, 5.4140625, 5.60888671875, 5.8037109375, 5.99853515625, 6.193359375, 6.38818359375, 6.5830078125, 6.77783203125, 6.97265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 9.0, 8.0, 23.0, 16.0, 26.0, 41.0, 52.0, 73.0, 108.0, 150.0, 144.0, 105.0, 67.0, 40.0, 38.0, 28.0, 18.0, 11.0, 12.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001331329345703125, -0.0012942701578140259, -0.0012572109699249268, -0.0012201517820358276, -0.0011830925941467285, -0.0011460334062576294, -0.0011089742183685303, -0.0010719150304794312, -0.001034855842590332, -0.000997796654701233, -0.0009607374668121338, -0.0009236782789230347, -0.0008866190910339355, -0.0008495599031448364, -0.0008125007152557373, -0.0007754415273666382, -0.0007383823394775391, -0.0007013231515884399, -0.0006642639636993408, -0.0006272047758102417, -0.0005901455879211426, -0.0005530864000320435, -0.0005160272121429443, -0.0004789680242538452, -0.0004419088363647461, -0.00040484964847564697, -0.00036779046058654785, -0.00033073127269744873, -0.0002936720848083496, -0.0002566128969192505, -0.00021955370903015137, -0.00018249452114105225, -0.00014543533325195312, -0.000108376145362854, -7.131695747375488e-05, -3.425776958465576e-05, 2.8014183044433594e-06, 3.986060619354248e-05, 7.69197940826416e-05, 0.00011397898197174072, 0.00015103816986083984, 0.00018809735774993896, 0.00022515654563903809, 0.0002622157335281372, 0.00029927492141723633, 0.00033633410930633545, 0.00037339329719543457, 0.0004104524850845337, 0.0004475116729736328, 0.00048457086086273193, 0.0005216300487518311, 0.0005586892366409302, 0.0005957484245300293, 0.0006328076124191284, 0.0006698668003082275, 0.0007069259881973267, 0.0007439851760864258, 0.0007810443639755249, 0.000818103551864624, 0.0008551627397537231, 0.0008922219276428223, 0.0009292811155319214, 0.0009663403034210205, 0.0010033994913101196, 0.0010404586791992188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 5.0, 12.0, 7.0, 19.0, 26.0, 40.0, 53.0, 73.0, 112.0, 167.0, 246.0, 373.0, 652.0, 1023.0, 1702.0, 2960.0, 5713.0, 11757.0, 27466.0, 72430.0, 210120.0, 408758.0, 190725.0, 65431.0, 25233.0, 10876.0, 5503.0, 2854.0, 1589.0, 952.0, 588.0, 350.0, 249.0, 157.0, 102.0, 64.0, 51.0, 36.0, 23.0, 12.0, 15.0, 9.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62109375, -5.4423828125, -5.263671875, -5.0849609375, -4.90625, -4.7275390625, -4.548828125, -4.3701171875, -4.19140625, -4.0126953125, -3.833984375, -3.6552734375, -3.4765625, -3.2978515625, -3.119140625, -2.9404296875, -2.76171875, -2.5830078125, -2.404296875, -2.2255859375, -2.046875, -1.8681640625, -1.689453125, -1.5107421875, -1.33203125, -1.1533203125, -0.974609375, -0.7958984375, -0.6171875, -0.4384765625, -0.259765625, -0.0810546875, 0.09765625, 0.2763671875, 0.455078125, 0.6337890625, 0.8125, 0.9912109375, 1.169921875, 1.3486328125, 1.52734375, 1.7060546875, 1.884765625, 2.0634765625, 2.2421875, 2.4208984375, 2.599609375, 2.7783203125, 2.95703125, 3.1357421875, 3.314453125, 3.4931640625, 3.671875, 3.8505859375, 4.029296875, 4.2080078125, 4.38671875, 4.5654296875, 4.744140625, 4.9228515625, 5.1015625, 5.2802734375, 5.458984375, 5.6376953125, 5.81640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 9.0, 9.0, 16.0, 16.0, 21.0, 32.0, 34.0, 47.0, 77.0, 91.0, 83.0, 77.0, 100.0, 62.0, 80.0, 59.0, 44.0, 24.0, 19.0, 17.0, 13.0, 14.0, 12.0, 8.0, 1.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.30517578125, -5.1416015625, -4.97802734375, -4.814453125, -4.65087890625, -4.4873046875, -4.32373046875, -4.16015625, -3.99658203125, -3.8330078125, -3.66943359375, -3.505859375, -3.34228515625, -3.1787109375, -3.01513671875, -2.8515625, -2.68798828125, -2.5244140625, -2.36083984375, -2.197265625, -2.03369140625, -1.8701171875, -1.70654296875, -1.54296875, -1.37939453125, -1.2158203125, -1.05224609375, -0.888671875, -0.72509765625, -0.5615234375, -0.39794921875, -0.234375, -0.07080078125, 0.0927734375, 0.25634765625, 0.419921875, 0.58349609375, 0.7470703125, 0.91064453125, 1.07421875, 1.23779296875, 1.4013671875, 1.56494140625, 1.728515625, 1.89208984375, 2.0556640625, 2.21923828125, 2.3828125, 2.54638671875, 2.7099609375, 2.87353515625, 3.037109375, 3.20068359375, 3.3642578125, 3.52783203125, 3.69140625, 3.85498046875, 4.0185546875, 4.18212890625, 4.345703125, 4.50927734375, 4.6728515625, 4.83642578125, 5.0]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 17.0, 37.0, 64.0, 163.0, 239.0, 226.0, 140.0, 66.0, 26.0, 13.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.753631591796875, -51.51547622680664, -46.27731704711914, -41.039161682128906, -35.801002502441406, -30.562847137451172, -25.324691772460938, -20.086532592773438, -14.848377227783203, -9.610219955444336, -4.372063636779785, 0.8660926818847656, 6.104249954223633, 11.3424072265625, 16.580562591552734, 21.818721771240234, 27.05687713623047, 32.2950325012207, 37.5331916809082, 42.77134704589844, 48.00950622558594, 53.24766159057617, 58.485816955566406, 63.723976135253906, 68.96212768554688, 74.20028686523438, 79.43843841552734, 84.67659759521484, 89.91475677490234, 95.15290832519531, 100.39106750488281, 105.62922668457031, 110.86738586425781, 116.10554504394531, 121.34369659423828, 126.58185577392578, 131.82000732421875, 137.05816650390625, 142.29632568359375, 147.53448486328125, 152.77264404296875, 158.01080322265625, 163.24896240234375, 168.48712158203125, 173.7252655029297, 178.9634246826172, 184.2015838623047, 189.4397430419922, 194.67788696289062, 199.91604614257812, 205.15420532226562, 210.39236450195312, 215.63050842285156, 220.86866760253906, 226.10682678222656, 231.34498596191406, 236.58314514160156, 241.82130432128906, 247.05946350097656, 252.297607421875, 257.5357666015625, 262.77392578125, 268.0120849609375, 273.250244140625, 278.4884033203125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 10.0, 7.0, 3.0, 11.0, 13.0, 9.0, 20.0, 16.0, 19.0, 14.0, 20.0, 35.0, 27.0, 26.0, 36.0, 39.0, 35.0, 43.0, 40.0, 26.0, 49.0, 49.0, 58.0, 41.0, 43.0, 29.0, 33.0, 33.0, 25.0, 26.0, 26.0, 27.0, 12.0, 17.0, 13.0, 19.0, 15.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.838951110839844, -43.33690643310547, -41.83486557006836, -40.332820892333984, -38.83077621459961, -37.3287353515625, -35.826690673828125, -34.32464599609375, -32.82260513305664, -31.3205623626709, -29.818517684936523, -28.31647491455078, -26.81443214416504, -25.312389373779297, -23.810344696044922, -22.30830192565918, -20.806257247924805, -19.304214477539062, -17.802169799804688, -16.300127029418945, -14.798084259033203, -13.296040534973145, -11.793996810913086, -10.291954040527344, -8.789910316467285, -7.287867069244385, -5.785823822021484, -4.283780097961426, -2.7817368507385254, -1.279693603515625, 0.2223501205444336, 1.7243928909301758, 3.2264366149902344, 4.728479862213135, 6.230523109436035, 7.732566833496094, 9.234609603881836, 10.736653327941895, 12.238697052001953, 13.740739822387695, 15.242783546447754, 16.744827270507812, 18.246870040893555, 19.748912811279297, 21.250957489013672, 22.753000259399414, 24.255043029785156, 25.75708770751953, 27.259130477905273, 28.761173248291016, 30.26321792602539, 31.765260696411133, 33.267303466796875, 34.76934814453125, 36.271392822265625, 37.773433685302734, 39.27547836303711, 40.777523040771484, 42.279563903808594, 43.78160858154297, 45.283653259277344, 46.78569412231445, 48.28773880004883, 49.78977966308594, 51.29182434082031]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 13.0, 13.0, 29.0, 49.0, 117.0, 237.0, 568.0, 1943.0, 12872.0, 3396902.0, 768697.0, 10079.0, 1632.0, 574.0, 240.0, 130.0, 57.0, 46.0, 28.0, 14.0, 7.0, 6.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.25, -56.005859375, -53.76171875, -51.517578125, -49.2734375, -47.029296875, -44.78515625, -42.541015625, -40.296875, -38.052734375, -35.80859375, -33.564453125, -31.3203125, -29.076171875, -26.83203125, -24.587890625, -22.34375, -20.099609375, -17.85546875, -15.611328125, -13.3671875, -11.123046875, -8.87890625, -6.634765625, -4.390625, -2.146484375, 0.09765625, 2.341796875, 4.5859375, 6.830078125, 9.07421875, 11.318359375, 13.5625, 15.806640625, 18.05078125, 20.294921875, 22.5390625, 24.783203125, 27.02734375, 29.271484375, 31.515625, 33.759765625, 36.00390625, 38.248046875, 40.4921875, 42.736328125, 44.98046875, 47.224609375, 49.46875, 51.712890625, 53.95703125, 56.201171875, 58.4453125, 60.689453125, 62.93359375, 65.177734375, 67.421875, 69.666015625, 71.91015625, 74.154296875, 76.3984375, 78.642578125, 80.88671875, 83.130859375, 85.375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 24.0, 41.0, 46.0, 47.0, 80.0, 110.0, 131.0, 124.0, 98.0, 79.0, 72.0, 44.0, 33.0, 28.0, 13.0, 6.0, 9.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.163330078125, -3.00634765625, -2.849365234375, -2.6923828125, -2.535400390625, -2.37841796875, -2.221435546875, -2.064453125, -1.907470703125, -1.75048828125, -1.593505859375, -1.4365234375, -1.279541015625, -1.12255859375, -0.965576171875, -0.80859375, -0.651611328125, -0.49462890625, -0.337646484375, -0.1806640625, -0.023681640625, 0.13330078125, 0.290283203125, 0.447265625, 0.604248046875, 0.76123046875, 0.918212890625, 1.0751953125, 1.232177734375, 1.38916015625, 1.546142578125, 1.703125, 1.860107421875, 2.01708984375, 2.174072265625, 2.3310546875, 2.488037109375, 2.64501953125, 2.802001953125, 2.958984375, 3.115966796875, 3.27294921875, 3.429931640625, 3.5869140625, 3.743896484375, 3.90087890625, 4.057861328125, 4.21484375, 4.371826171875, 4.52880859375, 4.685791015625, 4.8427734375, 4.999755859375, 5.15673828125, 5.313720703125, 5.470703125, 5.627685546875, 5.78466796875, 5.941650390625, 6.0986328125, 6.255615234375, 6.41259765625, 6.569580078125, 6.7265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 8.0, 10.0, 15.0, 14.0, 35.0, 38.0, 33.0, 70.0, 81.0, 128.0, 189.0, 337.0, 570.0, 1106.0, 2347.0, 5389.0, 13391.0, 38067.0, 125194.0, 625981.0, 2956726.0, 305452.0, 76445.0, 25501.0, 9269.0, 3926.0, 1832.0, 862.0, 487.0, 246.0, 164.0, 97.0, 71.0, 54.0, 31.0, 27.0, 21.0, 12.0, 16.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-13.5234375, -13.0772705078125, -12.631103515625, -12.1849365234375, -11.73876953125, -11.2926025390625, -10.846435546875, -10.4002685546875, -9.9541015625, -9.5079345703125, -9.061767578125, -8.6156005859375, -8.16943359375, -7.7232666015625, -7.277099609375, -6.8309326171875, -6.384765625, -5.9385986328125, -5.492431640625, -5.0462646484375, -4.60009765625, -4.1539306640625, -3.707763671875, -3.2615966796875, -2.8154296875, -2.3692626953125, -1.923095703125, -1.4769287109375, -1.03076171875, -0.5845947265625, -0.138427734375, 0.3077392578125, 0.75390625, 1.2000732421875, 1.646240234375, 2.0924072265625, 2.53857421875, 2.9847412109375, 3.430908203125, 3.8770751953125, 4.3232421875, 4.7694091796875, 5.215576171875, 5.6617431640625, 6.10791015625, 6.5540771484375, 7.000244140625, 7.4464111328125, 7.892578125, 8.3387451171875, 8.784912109375, 9.2310791015625, 9.67724609375, 10.1234130859375, 10.569580078125, 11.0157470703125, 11.4619140625, 11.9080810546875, 12.354248046875, 12.8004150390625, 13.24658203125, 13.6927490234375, 14.138916015625, 14.5850830078125, 15.03125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 5.0, 10.0, 22.0, 28.0, 37.0, 56.0, 93.0, 156.0, 272.0, 622.0, 1663.0, 528.0, 225.0, 129.0, 86.0, 47.0, 29.0, 21.0, 9.0, 10.0, 8.0, 6.0, 7.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.078125, -8.847900390625, -8.61767578125, -8.387451171875, -8.1572265625, -7.927001953125, -7.69677734375, -7.466552734375, -7.236328125, -7.006103515625, -6.77587890625, -6.545654296875, -6.3154296875, -6.085205078125, -5.85498046875, -5.624755859375, -5.39453125, -5.164306640625, -4.93408203125, -4.703857421875, -4.4736328125, -4.243408203125, -4.01318359375, -3.782958984375, -3.552734375, -3.322509765625, -3.09228515625, -2.862060546875, -2.6318359375, -2.401611328125, -2.17138671875, -1.941162109375, -1.7109375, -1.480712890625, -1.25048828125, -1.020263671875, -0.7900390625, -0.559814453125, -0.32958984375, -0.099365234375, 0.130859375, 0.361083984375, 0.59130859375, 0.821533203125, 1.0517578125, 1.281982421875, 1.51220703125, 1.742431640625, 1.97265625, 2.202880859375, 2.43310546875, 2.663330078125, 2.8935546875, 3.123779296875, 3.35400390625, 3.584228515625, 3.814453125, 4.044677734375, 4.27490234375, 4.505126953125, 4.7353515625, 4.965576171875, 5.19580078125, 5.426025390625, 5.65625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 14.0, 29.0, 45.0, 63.0, 85.0, 72.0, 96.0, 85.0, 104.0, 104.0, 76.0, 68.0, 43.0, 33.0, 32.0, 7.0, 5.0, 3.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.733978271484375, -38.596065521240234, -37.458152770996094, -36.32024002075195, -35.18232727050781, -34.04441452026367, -32.90650177001953, -31.76858901977539, -30.63067626953125, -29.49276351928711, -28.35485076904297, -27.216938018798828, -26.079025268554688, -24.941112518310547, -23.803199768066406, -22.665287017822266, -21.527372360229492, -20.38945960998535, -19.25154685974121, -18.11363410949707, -16.97572135925293, -15.837808609008789, -14.699894905090332, -13.561982154846191, -12.42406940460205, -11.28615665435791, -10.14824390411377, -9.010330200195312, -7.87241792678833, -6.7345051765441895, -5.596591949462891, -4.45867919921875, -3.3207664489746094, -2.1828536987304688, -1.044940710067749, 0.0929722785949707, 1.2308850288391113, 2.368797779083252, 3.506711006164551, 4.644623756408691, 5.782536506652832, 6.920449256896973, 8.058362007141113, 9.19627571105957, 10.334188461303711, 11.472101211547852, 12.610013961791992, 13.747926712036133, 14.885839462280273, 16.023752212524414, 17.161664962768555, 18.299577713012695, 19.437490463256836, 20.575403213500977, 21.71331787109375, 22.85123062133789, 23.98914337158203, 25.127056121826172, 26.264968872070312, 27.402881622314453, 28.540794372558594, 29.678707122802734, 30.816619873046875, 31.954532623291016, 33.092445373535156]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 10.0, 16.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 32.0, 29.0, 37.0, 37.0, 37.0, 42.0, 50.0, 49.0, 46.0, 51.0, 49.0, 43.0, 51.0, 43.0, 37.0, 38.0, 36.0, 30.0, 16.0, 20.0, 11.0, 16.0, 12.0, 20.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.554555892944336, -17.885683059692383, -17.21681022644043, -16.54793930053711, -15.879066467285156, -15.210193634033203, -14.54132080078125, -13.872447967529297, -13.20357608795166, -12.534703254699707, -11.86583137512207, -11.196958541870117, -10.528085708618164, -9.859213829040527, -9.190340995788574, -8.521469116210938, -7.852596282958984, -7.1837239265441895, -6.5148515701293945, -5.845978736877441, -5.1771063804626465, -4.508234024047852, -3.8393611907958984, -3.1704888343811035, -2.5016164779663086, -1.8327440023422241, -1.1638715267181396, -0.4949989318847656, 0.1738734245300293, 0.8427457809448242, 1.5116186141967773, 2.1804909706115723, 2.849363327026367, 3.518235683441162, 4.187108039855957, 4.85598087310791, 5.524853229522705, 6.1937255859375, 6.862598419189453, 7.531470775604248, 8.200343132019043, 8.869215965270996, 9.538087844848633, 10.206960678100586, 10.875833511352539, 11.544705390930176, 12.213578224182129, 12.882450103759766, 13.551322937011719, 14.220195770263672, 14.889067649841309, 15.557940483093262, 16.2268123626709, 16.89568519592285, 17.564558029174805, 18.233430862426758, 18.902301788330078, 19.57117462158203, 20.240047454833984, 20.908920288085938, 21.577791213989258, 22.24666404724121, 22.915536880493164, 23.584409713745117, 24.25328254699707]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 13.0, 4.0, 13.0, 18.0, 26.0, 52.0, 63.0, 93.0, 185.0, 338.0, 666.0, 1585.0, 5447.0, 37278.0, 441513.0, 509324.0, 42764.0, 5981.0, 1639.0, 704.0, 292.0, 194.0, 126.0, 70.0, 50.0, 30.0, 32.0, 13.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0], "bins": [-50.65625, -49.421630859375, -48.18701171875, -46.952392578125, -45.7177734375, -44.483154296875, -43.24853515625, -42.013916015625, -40.779296875, -39.544677734375, -38.31005859375, -37.075439453125, -35.8408203125, -34.606201171875, -33.37158203125, -32.136962890625, -30.90234375, -29.667724609375, -28.43310546875, -27.198486328125, -25.9638671875, -24.729248046875, -23.49462890625, -22.260009765625, -21.025390625, -19.790771484375, -18.55615234375, -17.321533203125, -16.0869140625, -14.852294921875, -13.61767578125, -12.383056640625, -11.1484375, -9.913818359375, -8.67919921875, -7.444580078125, -6.2099609375, -4.975341796875, -3.74072265625, -2.506103515625, -1.271484375, -0.036865234375, 1.19775390625, 2.432373046875, 3.6669921875, 4.901611328125, 6.13623046875, 7.370849609375, 8.60546875, 9.840087890625, 11.07470703125, 12.309326171875, 13.5439453125, 14.778564453125, 16.01318359375, 17.247802734375, 18.482421875, 19.717041015625, 20.95166015625, 22.186279296875, 23.4208984375, 24.655517578125, 25.89013671875, 27.124755859375, 28.359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 17.0, 20.0, 42.0, 37.0, 61.0, 91.0, 129.0, 111.0, 114.0, 87.0, 87.0, 59.0, 51.0, 35.0, 23.0, 11.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.186248779296875, -3.02679443359375, -2.867340087890625, -2.7078857421875, -2.548431396484375, -2.38897705078125, -2.229522705078125, -2.070068359375, -1.910614013671875, -1.75115966796875, -1.591705322265625, -1.4322509765625, -1.272796630859375, -1.11334228515625, -0.953887939453125, -0.79443359375, -0.634979248046875, -0.47552490234375, -0.316070556640625, -0.1566162109375, 0.002838134765625, 0.16229248046875, 0.321746826171875, 0.481201171875, 0.640655517578125, 0.80010986328125, 0.959564208984375, 1.1190185546875, 1.278472900390625, 1.43792724609375, 1.597381591796875, 1.7568359375, 1.916290283203125, 2.07574462890625, 2.235198974609375, 2.3946533203125, 2.554107666015625, 2.71356201171875, 2.873016357421875, 3.032470703125, 3.191925048828125, 3.35137939453125, 3.510833740234375, 3.6702880859375, 3.829742431640625, 3.98919677734375, 4.148651123046875, 4.30810546875, 4.467559814453125, 4.62701416015625, 4.786468505859375, 4.9459228515625, 5.105377197265625, 5.26483154296875, 5.424285888671875, 5.583740234375, 5.743194580078125, 5.90264892578125, 6.062103271484375, 6.2215576171875, 6.381011962890625, 6.54046630859375, 6.699920654296875, 6.859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 5.0, 7.0, 7.0, 14.0, 23.0, 38.0, 62.0, 84.0, 91.0, 167.0, 234.0, 343.0, 587.0, 1180.0, 2756.0, 7887.0, 26492.0, 96854.0, 328316.0, 402681.0, 128377.0, 35601.0, 10078.0, 3421.0, 1393.0, 669.0, 425.0, 241.0, 178.0, 119.0, 68.0, 43.0, 43.0, 24.0, 7.0, 13.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.66943359375, -11.2685546875, -10.86767578125, -10.466796875, -10.06591796875, -9.6650390625, -9.26416015625, -8.86328125, -8.46240234375, -8.0615234375, -7.66064453125, -7.259765625, -6.85888671875, -6.4580078125, -6.05712890625, -5.65625, -5.25537109375, -4.8544921875, -4.45361328125, -4.052734375, -3.65185546875, -3.2509765625, -2.85009765625, -2.44921875, -2.04833984375, -1.6474609375, -1.24658203125, -0.845703125, -0.44482421875, -0.0439453125, 0.35693359375, 0.7578125, 1.15869140625, 1.5595703125, 1.96044921875, 2.361328125, 2.76220703125, 3.1630859375, 3.56396484375, 3.96484375, 4.36572265625, 4.7666015625, 5.16748046875, 5.568359375, 5.96923828125, 6.3701171875, 6.77099609375, 7.171875, 7.57275390625, 7.9736328125, 8.37451171875, 8.775390625, 9.17626953125, 9.5771484375, 9.97802734375, 10.37890625, 10.77978515625, 11.1806640625, 11.58154296875, 11.982421875, 12.38330078125, 12.7841796875, 13.18505859375, 13.5859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 3.0, 9.0, 9.0, 11.0, 13.0, 10.0, 15.0, 20.0, 21.0, 29.0, 31.0, 25.0, 20.0, 30.0, 31.0, 37.0, 29.0, 44.0, 32.0, 31.0, 28.0, 38.0, 34.0, 53.0, 28.0, 31.0, 33.0, 30.0, 25.0, 41.0, 22.0, 22.0, 18.0, 17.0, 20.0, 19.0, 11.0, 19.0, 7.0, 14.0, 2.0, 4.0, 11.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.72265625, -6.495849609375, -6.26904296875, -6.042236328125, -5.8154296875, -5.588623046875, -5.36181640625, -5.135009765625, -4.908203125, -4.681396484375, -4.45458984375, -4.227783203125, -4.0009765625, -3.774169921875, -3.54736328125, -3.320556640625, -3.09375, -2.866943359375, -2.64013671875, -2.413330078125, -2.1865234375, -1.959716796875, -1.73291015625, -1.506103515625, -1.279296875, -1.052490234375, -0.82568359375, -0.598876953125, -0.3720703125, -0.145263671875, 0.08154296875, 0.308349609375, 0.53515625, 0.761962890625, 0.98876953125, 1.215576171875, 1.4423828125, 1.669189453125, 1.89599609375, 2.122802734375, 2.349609375, 2.576416015625, 2.80322265625, 3.030029296875, 3.2568359375, 3.483642578125, 3.71044921875, 3.937255859375, 4.1640625, 4.390869140625, 4.61767578125, 4.844482421875, 5.0712890625, 5.298095703125, 5.52490234375, 5.751708984375, 5.978515625, 6.205322265625, 6.43212890625, 6.658935546875, 6.8857421875, 7.112548828125, 7.33935546875, 7.566162109375, 7.79296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 12.0, 20.0, 14.0, 28.0, 45.0, 70.0, 113.0, 260.0, 557.0, 1748.0, 6195.0, 28932.0, 221458.0, 675841.0, 92545.0, 15163.0, 3688.0, 1066.0, 399.0, 173.0, 78.0, 54.0, 22.0, 23.0, 16.0, 17.0, 11.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.8270263671875, -13.411865234375, -12.9967041015625, -12.58154296875, -12.1663818359375, -11.751220703125, -11.3360595703125, -10.9208984375, -10.5057373046875, -10.090576171875, -9.6754150390625, -9.26025390625, -8.8450927734375, -8.429931640625, -8.0147705078125, -7.599609375, -7.1844482421875, -6.769287109375, -6.3541259765625, -5.93896484375, -5.5238037109375, -5.108642578125, -4.6934814453125, -4.2783203125, -3.8631591796875, -3.447998046875, -3.0328369140625, -2.61767578125, -2.2025146484375, -1.787353515625, -1.3721923828125, -0.95703125, -0.5418701171875, -0.126708984375, 0.2884521484375, 0.70361328125, 1.1187744140625, 1.533935546875, 1.9490966796875, 2.3642578125, 2.7794189453125, 3.194580078125, 3.6097412109375, 4.02490234375, 4.4400634765625, 4.855224609375, 5.2703857421875, 5.685546875, 6.1007080078125, 6.515869140625, 6.9310302734375, 7.34619140625, 7.7613525390625, 8.176513671875, 8.5916748046875, 9.0068359375, 9.4219970703125, 9.837158203125, 10.2523193359375, 10.66748046875, 11.0826416015625, 11.497802734375, 11.9129638671875, 12.328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 5.0, 11.0, 18.0, 20.0, 22.0, 29.0, 47.0, 61.0, 97.0, 156.0, 155.0, 108.0, 71.0, 41.0, 34.0, 29.0, 15.0, 20.0, 12.0, 6.0, 12.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016269683837890625, -0.0015861988067626953, -0.0015454292297363281, -0.001504659652709961, -0.0014638900756835938, -0.0014231204986572266, -0.0013823509216308594, -0.0013415813446044922, -0.001300811767578125, -0.0012600421905517578, -0.0012192726135253906, -0.0011785030364990234, -0.0011377334594726562, -0.001096963882446289, -0.0010561943054199219, -0.0010154247283935547, -0.0009746551513671875, -0.0009338855743408203, -0.0008931159973144531, -0.0008523464202880859, -0.0008115768432617188, -0.0007708072662353516, -0.0007300376892089844, -0.0006892681121826172, -0.00064849853515625, -0.0006077289581298828, -0.0005669593811035156, -0.0005261898040771484, -0.00048542022705078125, -0.00044465065002441406, -0.0004038810729980469, -0.0003631114959716797, -0.0003223419189453125, -0.0002815723419189453, -0.00024080276489257812, -0.00020003318786621094, -0.00015926361083984375, -0.00011849403381347656, -7.772445678710938e-05, -3.695487976074219e-05, 3.814697265625e-06, 4.458427429199219e-05, 8.535385131835938e-05, 0.00012612342834472656, 0.00016689300537109375, 0.00020766258239746094, 0.0002484321594238281, 0.0002892017364501953, 0.0003299713134765625, 0.0003707408905029297, 0.0004115104675292969, 0.00045228004455566406, 0.0004930496215820312, 0.0005338191986083984, 0.0005745887756347656, 0.0006153583526611328, 0.0006561279296875, 0.0006968975067138672, 0.0007376670837402344, 0.0007784366607666016, 0.0008192062377929688, 0.0008599758148193359, 0.0009007453918457031, 0.0009415149688720703, 0.0009822845458984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 18.0, 22.0, 23.0, 53.0, 75.0, 119.0, 232.0, 562.0, 1678.0, 6554.0, 35321.0, 407865.0, 540351.0, 44605.0, 7754.0, 1991.0, 670.0, 281.0, 154.0, 75.0, 59.0, 32.0, 16.0, 13.0, 5.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.6875, -17.1829833984375, -16.678466796875, -16.1739501953125, -15.66943359375, -15.1649169921875, -14.660400390625, -14.1558837890625, -13.6513671875, -13.1468505859375, -12.642333984375, -12.1378173828125, -11.63330078125, -11.1287841796875, -10.624267578125, -10.1197509765625, -9.615234375, -9.1107177734375, -8.606201171875, -8.1016845703125, -7.59716796875, -7.0926513671875, -6.588134765625, -6.0836181640625, -5.5791015625, -5.0745849609375, -4.570068359375, -4.0655517578125, -3.56103515625, -3.0565185546875, -2.552001953125, -2.0474853515625, -1.54296875, -1.0384521484375, -0.533935546875, -0.0294189453125, 0.47509765625, 0.9796142578125, 1.484130859375, 1.9886474609375, 2.4931640625, 2.9976806640625, 3.502197265625, 4.0067138671875, 4.51123046875, 5.0157470703125, 5.520263671875, 6.0247802734375, 6.529296875, 7.0338134765625, 7.538330078125, 8.0428466796875, 8.54736328125, 9.0518798828125, 9.556396484375, 10.0609130859375, 10.5654296875, 11.0699462890625, 11.574462890625, 12.0789794921875, 12.58349609375, 13.0880126953125, 13.592529296875, 14.0970458984375, 14.6015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 13.0, 6.0, 13.0, 12.0, 25.0, 31.0, 42.0, 51.0, 65.0, 86.0, 122.0, 126.0, 85.0, 89.0, 53.0, 43.0, 35.0, 18.0, 22.0, 9.0, 15.0, 7.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19921875, -4.98333740234375, -4.7674560546875, -4.55157470703125, -4.335693359375, -4.11981201171875, -3.9039306640625, -3.68804931640625, -3.47216796875, -3.25628662109375, -3.0404052734375, -2.82452392578125, -2.608642578125, -2.39276123046875, -2.1768798828125, -1.96099853515625, -1.7451171875, -1.52923583984375, -1.3133544921875, -1.09747314453125, -0.881591796875, -0.66571044921875, -0.4498291015625, -0.23394775390625, -0.01806640625, 0.19781494140625, 0.4136962890625, 0.62957763671875, 0.845458984375, 1.06134033203125, 1.2772216796875, 1.49310302734375, 1.708984375, 1.92486572265625, 2.1407470703125, 2.35662841796875, 2.572509765625, 2.78839111328125, 3.0042724609375, 3.22015380859375, 3.43603515625, 3.65191650390625, 3.8677978515625, 4.08367919921875, 4.299560546875, 4.51544189453125, 4.7313232421875, 4.94720458984375, 5.1630859375, 5.37896728515625, 5.5948486328125, 5.81072998046875, 6.026611328125, 6.24249267578125, 6.4583740234375, 6.67425537109375, 6.89013671875, 7.10601806640625, 7.3218994140625, 7.53778076171875, 7.753662109375, 7.96954345703125, 8.1854248046875, 8.40130615234375, 8.6171875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 8.0, 12.0, 27.0, 41.0, 66.0, 108.0, 129.0, 162.0, 157.0, 117.0, 71.0, 49.0, 22.0, 15.0, 6.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.517333984375, -57.0521354675293, -53.586936950683594, -50.121742248535156, -46.65654373168945, -43.19134521484375, -39.72614669799805, -36.260948181152344, -32.795753479003906, -29.330554962158203, -25.865358352661133, -22.40015983581543, -18.93496322631836, -15.469764709472656, -12.004566192626953, -8.539369583129883, -5.074169158935547, -1.608971357345581, 1.8562264442443848, 5.32142448425293, 8.786622047424316, 12.251819610595703, 15.717018127441406, 19.182214736938477, 22.64741325378418, 26.112611770629883, 29.577808380126953, 33.043006896972656, 36.50820541381836, 39.97340393066406, 43.4385986328125, 46.9037971496582, 50.368995666503906, 53.83419418334961, 57.29939270019531, 60.76458740234375, 64.22978973388672, 67.69498443603516, 71.16018676757812, 74.62538146972656, 78.090576171875, 81.55577087402344, 85.0209732055664, 88.48616790771484, 91.95137023925781, 95.41656494140625, 98.88175964355469, 102.34696197509766, 105.81216430664062, 109.27735900878906, 112.74256134033203, 116.20775604248047, 119.67295837402344, 123.13815307617188, 126.60334777832031, 130.06854248046875, 133.5337371826172, 136.99893188476562, 140.46412658691406, 143.92933654785156, 147.39453125, 150.85972595214844, 154.32492065429688, 157.7901153564453, 161.2553253173828]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 6.0, 7.0, 6.0, 10.0, 10.0, 21.0, 17.0, 24.0, 22.0, 22.0, 25.0, 31.0, 26.0, 32.0, 34.0, 33.0, 46.0, 33.0, 29.0, 38.0, 36.0, 43.0, 48.0, 37.0, 35.0, 27.0, 38.0, 36.0, 30.0, 17.0, 28.0, 12.0, 21.0, 15.0, 15.0, 14.0, 5.0, 10.0, 8.0, 5.0, 7.0, 4.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-41.34233093261719, -40.033485412597656, -38.72464370727539, -37.41579818725586, -36.106956481933594, -34.79811096191406, -33.48926544189453, -32.180423736572266, -30.871578216552734, -29.562734603881836, -28.253890991210938, -26.945045471191406, -25.636201858520508, -24.32735824584961, -23.01851463317871, -21.709671020507812, -20.400827407836914, -19.091983795166016, -17.783140182495117, -16.47429656982422, -15.165451049804688, -13.856607437133789, -12.54776382446289, -11.238919258117676, -9.930075645446777, -8.621232032775879, -7.312387466430664, -6.003543853759766, -4.694699764251709, -3.3858556747436523, -2.077012062072754, -0.7681674957275391, 0.5406761169433594, 1.8495200872421265, 3.1583640575408936, 4.467207908630371, 5.776051998138428, 7.084896087646484, 8.393739700317383, 9.702584266662598, 11.011427879333496, 12.320271492004395, 13.62911605834961, 14.937959671020508, 16.246803283691406, 17.555648803710938, 18.864490509033203, 20.173336029052734, 21.482179641723633, 22.79102325439453, 24.09986686706543, 25.408710479736328, 26.71755599975586, 28.026399612426758, 29.335243225097656, 30.644088745117188, 31.952930450439453, 33.261775970458984, 34.57061767578125, 35.87946319580078, 37.18830490112305, 38.49715042114258, 39.805992126464844, 41.114837646484375, 42.423683166503906]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 16.0, 11.0, 8.0, 41.0, 49.0, 73.0, 105.0, 204.0, 355.0, 751.0, 1644.0, 4582.0, 20646.0, 210670.0, 3787669.0, 144107.0, 16275.0, 3984.0, 1392.0, 651.0, 324.0, 216.0, 145.0, 92.0, 67.0, 58.0, 28.0, 17.0, 21.0, 16.0, 6.0, 7.0, 9.0, 3.0, 5.0, 6.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.8125, -30.455078125, -29.09765625, -27.740234375, -26.3828125, -25.025390625, -23.66796875, -22.310546875, -20.953125, -19.595703125, -18.23828125, -16.880859375, -15.5234375, -14.166015625, -12.80859375, -11.451171875, -10.09375, -8.736328125, -7.37890625, -6.021484375, -4.6640625, -3.306640625, -1.94921875, -0.591796875, 0.765625, 2.123046875, 3.48046875, 4.837890625, 6.1953125, 7.552734375, 8.91015625, 10.267578125, 11.625, 12.982421875, 14.33984375, 15.697265625, 17.0546875, 18.412109375, 19.76953125, 21.126953125, 22.484375, 23.841796875, 25.19921875, 26.556640625, 27.9140625, 29.271484375, 30.62890625, 31.986328125, 33.34375, 34.701171875, 36.05859375, 37.416015625, 38.7734375, 40.130859375, 41.48828125, 42.845703125, 44.203125, 45.560546875, 46.91796875, 48.275390625, 49.6328125, 50.990234375, 52.34765625, 53.705078125, 55.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 19.0, 23.0, 33.0, 41.0, 68.0, 79.0, 116.0, 125.0, 103.0, 90.0, 95.0, 65.0, 55.0, 32.0, 22.0, 8.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37890625, -3.21807861328125, -3.0572509765625, -2.89642333984375, -2.735595703125, -2.57476806640625, -2.4139404296875, -2.25311279296875, -2.09228515625, -1.93145751953125, -1.7706298828125, -1.60980224609375, -1.448974609375, -1.28814697265625, -1.1273193359375, -0.96649169921875, -0.8056640625, -0.64483642578125, -0.4840087890625, -0.32318115234375, -0.162353515625, -0.00152587890625, 0.1593017578125, 0.32012939453125, 0.48095703125, 0.64178466796875, 0.8026123046875, 0.96343994140625, 1.124267578125, 1.28509521484375, 1.4459228515625, 1.60675048828125, 1.767578125, 1.92840576171875, 2.0892333984375, 2.25006103515625, 2.410888671875, 2.57171630859375, 2.7325439453125, 2.89337158203125, 3.05419921875, 3.21502685546875, 3.3758544921875, 3.53668212890625, 3.697509765625, 3.85833740234375, 4.0191650390625, 4.17999267578125, 4.3408203125, 4.50164794921875, 4.6624755859375, 4.82330322265625, 4.984130859375, 5.14495849609375, 5.3057861328125, 5.46661376953125, 5.62744140625, 5.78826904296875, 5.9490966796875, 6.10992431640625, 6.270751953125, 6.43157958984375, 6.5924072265625, 6.75323486328125, 6.9140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 9.0, 6.0, 20.0, 18.0, 18.0, 19.0, 43.0, 63.0, 108.0, 131.0, 270.0, 519.0, 1108.0, 3176.0, 11418.0, 53983.0, 415936.0, 3319884.0, 327402.0, 45297.0, 9771.0, 2831.0, 1067.0, 446.0, 245.0, 146.0, 97.0, 73.0, 48.0, 36.0, 24.0, 18.0, 11.0, 10.0, 11.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.953125, -26.2333984375, -25.513671875, -24.7939453125, -24.07421875, -23.3544921875, -22.634765625, -21.9150390625, -21.1953125, -20.4755859375, -19.755859375, -19.0361328125, -18.31640625, -17.5966796875, -16.876953125, -16.1572265625, -15.4375, -14.7177734375, -13.998046875, -13.2783203125, -12.55859375, -11.8388671875, -11.119140625, -10.3994140625, -9.6796875, -8.9599609375, -8.240234375, -7.5205078125, -6.80078125, -6.0810546875, -5.361328125, -4.6416015625, -3.921875, -3.2021484375, -2.482421875, -1.7626953125, -1.04296875, -0.3232421875, 0.396484375, 1.1162109375, 1.8359375, 2.5556640625, 3.275390625, 3.9951171875, 4.71484375, 5.4345703125, 6.154296875, 6.8740234375, 7.59375, 8.3134765625, 9.033203125, 9.7529296875, 10.47265625, 11.1923828125, 11.912109375, 12.6318359375, 13.3515625, 14.0712890625, 14.791015625, 15.5107421875, 16.23046875, 16.9501953125, 17.669921875, 18.3896484375, 19.109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 17.0, 32.0, 35.0, 81.0, 115.0, 243.0, 466.0, 1363.0, 889.0, 358.0, 191.0, 123.0, 55.0, 36.0, 15.0, 19.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.42327880859375, -5.1004638671875, -4.77764892578125, -4.454833984375, -4.13201904296875, -3.8092041015625, -3.48638916015625, -3.16357421875, -2.84075927734375, -2.5179443359375, -2.19512939453125, -1.872314453125, -1.54949951171875, -1.2266845703125, -0.90386962890625, -0.5810546875, -0.25823974609375, 0.0645751953125, 0.38739013671875, 0.710205078125, 1.03302001953125, 1.3558349609375, 1.67864990234375, 2.00146484375, 2.32427978515625, 2.6470947265625, 2.96990966796875, 3.292724609375, 3.61553955078125, 3.9383544921875, 4.26116943359375, 4.583984375, 4.90679931640625, 5.2296142578125, 5.55242919921875, 5.875244140625, 6.19805908203125, 6.5208740234375, 6.84368896484375, 7.16650390625, 7.48931884765625, 7.8121337890625, 8.13494873046875, 8.457763671875, 8.78057861328125, 9.1033935546875, 9.42620849609375, 9.7490234375, 10.07183837890625, 10.3946533203125, 10.71746826171875, 11.040283203125, 11.36309814453125, 11.6859130859375, 12.00872802734375, 12.33154296875, 12.65435791015625, 12.9771728515625, 13.29998779296875, 13.622802734375, 13.94561767578125, 14.2684326171875, 14.59124755859375, 14.9140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 7.0, 2.0, 12.0, 10.0, 19.0, 19.0, 24.0, 38.0, 47.0, 59.0, 70.0, 84.0, 79.0, 94.0, 86.0, 89.0, 79.0, 61.0, 40.0, 22.0, 20.0, 15.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.11328887939453, -33.76093673706055, -32.40858840942383, -31.056236267089844, -29.70388412475586, -28.351533889770508, -26.999183654785156, -25.646831512451172, -24.29448127746582, -22.94213104248047, -21.589778900146484, -20.237428665161133, -18.88507843017578, -17.532726287841797, -16.180376052856445, -14.828024864196777, -13.47567367553711, -12.123322486877441, -10.770971298217773, -9.418621063232422, -8.066269874572754, -6.713918685913086, -5.361568450927734, -4.009217262268066, -2.6568660736083984, -1.3045151233673096, 0.0478358268737793, 1.400186538696289, 2.752537727355957, 4.104888916015625, 5.457239151000977, 6.8095903396606445, 8.161941528320312, 9.51429271697998, 10.866643905639648, 12.218994140625, 13.571345329284668, 14.923696517944336, 16.276046752929688, 17.628398895263672, 18.980749130249023, 20.333099365234375, 21.68545150756836, 23.03780174255371, 24.390151977539062, 25.742504119873047, 27.0948543548584, 28.44720458984375, 29.799556732177734, 31.151906967163086, 32.50425720214844, 33.85660934448242, 35.208961486816406, 36.561309814453125, 37.91366195678711, 39.266014099121094, 40.61836242675781, 41.9707145690918, 43.323062896728516, 44.6754150390625, 46.027767181396484, 47.38011932373047, 48.73246765136719, 50.08481979370117, 51.437171936035156]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 6.0, 9.0, 6.0, 14.0, 17.0, 14.0, 21.0, 22.0, 27.0, 29.0, 40.0, 47.0, 32.0, 45.0, 44.0, 40.0, 56.0, 37.0, 38.0, 48.0, 39.0, 37.0, 42.0, 38.0, 46.0, 32.0, 27.0, 22.0, 16.0, 21.0, 9.0, 15.0, 10.0, 9.0, 11.0, 10.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.292917251586914, -22.46396255493164, -21.635007858276367, -20.806053161621094, -19.977100372314453, -19.148143768310547, -18.319190979003906, -17.490236282348633, -16.66128158569336, -15.832326889038086, -15.003372192382812, -14.174418449401855, -13.345463752746582, -12.516509056091309, -11.687555313110352, -10.858600616455078, -10.029645919799805, -9.200691223144531, -8.371736526489258, -7.542782783508301, -6.713828086853027, -5.884873390197754, -5.055919170379639, -4.226964950561523, -3.39801025390625, -2.5690557956695557, -1.7401013374328613, -0.911146879196167, -0.08219242095947266, 0.7467622756958008, 1.575716495513916, 2.4046707153320312, 3.233623504638672, 4.062578201293945, 4.8915324211120605, 5.720486640930176, 6.549441337585449, 7.378396034240723, 8.20734977722168, 9.036304473876953, 9.865259170532227, 10.6942138671875, 11.523168563842773, 12.35212230682373, 13.181077003479004, 14.010031700134277, 14.838985443115234, 15.667940139770508, 16.49689483642578, 17.325849533081055, 18.154804229736328, 18.9837589263916, 19.812713623046875, 20.641666412353516, 21.47062110900879, 22.299575805664062, 23.128530502319336, 23.95748519897461, 24.786439895629883, 25.615394592285156, 26.444347381591797, 27.273303985595703, 28.102256774902344, 28.931211471557617, 29.76016616821289]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 9.0, 12.0, 18.0, 36.0, 52.0, 67.0, 105.0, 196.0, 377.0, 786.0, 2151.0, 10022.0, 88933.0, 831478.0, 99485.0, 10835.0, 2286.0, 797.0, 375.0, 215.0, 109.0, 66.0, 31.0, 34.0, 22.0, 8.0, 17.0, 3.0, 2.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.125, -39.73193359375, -38.3388671875, -36.94580078125, -35.552734375, -34.15966796875, -32.7666015625, -31.37353515625, -29.98046875, -28.58740234375, -27.1943359375, -25.80126953125, -24.408203125, -23.01513671875, -21.6220703125, -20.22900390625, -18.8359375, -17.44287109375, -16.0498046875, -14.65673828125, -13.263671875, -11.87060546875, -10.4775390625, -9.08447265625, -7.69140625, -6.29833984375, -4.9052734375, -3.51220703125, -2.119140625, -0.72607421875, 0.6669921875, 2.06005859375, 3.453125, 4.84619140625, 6.2392578125, 7.63232421875, 9.025390625, 10.41845703125, 11.8115234375, 13.20458984375, 14.59765625, 15.99072265625, 17.3837890625, 18.77685546875, 20.169921875, 21.56298828125, 22.9560546875, 24.34912109375, 25.7421875, 27.13525390625, 28.5283203125, 29.92138671875, 31.314453125, 32.70751953125, 34.1005859375, 35.49365234375, 36.88671875, 38.27978515625, 39.6728515625, 41.06591796875, 42.458984375, 43.85205078125, 45.2451171875, 46.63818359375, 48.03125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 18.0, 20.0, 38.0, 55.0, 62.0, 97.0, 107.0, 113.0, 123.0, 105.0, 76.0, 69.0, 43.0, 32.0, 6.0, 12.0, 11.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.710357666015625, -3.53985595703125, -3.369354248046875, -3.1988525390625, -3.028350830078125, -2.85784912109375, -2.687347412109375, -2.516845703125, -2.346343994140625, -2.17584228515625, -2.005340576171875, -1.8348388671875, -1.664337158203125, -1.49383544921875, -1.323333740234375, -1.15283203125, -0.982330322265625, -0.81182861328125, -0.641326904296875, -0.4708251953125, -0.300323486328125, -0.12982177734375, 0.040679931640625, 0.211181640625, 0.381683349609375, 0.55218505859375, 0.722686767578125, 0.8931884765625, 1.063690185546875, 1.23419189453125, 1.404693603515625, 1.5751953125, 1.745697021484375, 1.91619873046875, 2.086700439453125, 2.2572021484375, 2.427703857421875, 2.59820556640625, 2.768707275390625, 2.939208984375, 3.109710693359375, 3.28021240234375, 3.450714111328125, 3.6212158203125, 3.791717529296875, 3.96221923828125, 4.132720947265625, 4.30322265625, 4.473724365234375, 4.64422607421875, 4.814727783203125, 4.9852294921875, 5.155731201171875, 5.32623291015625, 5.496734619140625, 5.667236328125, 5.837738037109375, 6.00823974609375, 6.178741455078125, 6.3492431640625, 6.519744873046875, 6.69024658203125, 6.860748291015625, 7.03125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 10.0, 15.0, 19.0, 37.0, 42.0, 61.0, 80.0, 100.0, 148.0, 193.0, 326.0, 498.0, 855.0, 1573.0, 3618.0, 8902.0, 23910.0, 69676.0, 250168.0, 504110.0, 119490.0, 39920.0, 13931.0, 5548.0, 2350.0, 1063.0, 660.0, 337.0, 252.0, 160.0, 150.0, 87.0, 66.0, 50.0, 43.0, 25.0, 22.0, 8.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25, -11.8699951171875, -11.489990234375, -11.1099853515625, -10.72998046875, -10.3499755859375, -9.969970703125, -9.5899658203125, -9.2099609375, -8.8299560546875, -8.449951171875, -8.0699462890625, -7.68994140625, -7.3099365234375, -6.929931640625, -6.5499267578125, -6.169921875, -5.7899169921875, -5.409912109375, -5.0299072265625, -4.64990234375, -4.2698974609375, -3.889892578125, -3.5098876953125, -3.1298828125, -2.7498779296875, -2.369873046875, -1.9898681640625, -1.60986328125, -1.2298583984375, -0.849853515625, -0.4698486328125, -0.08984375, 0.2901611328125, 0.670166015625, 1.0501708984375, 1.43017578125, 1.8101806640625, 2.190185546875, 2.5701904296875, 2.9501953125, 3.3302001953125, 3.710205078125, 4.0902099609375, 4.47021484375, 4.8502197265625, 5.230224609375, 5.6102294921875, 5.990234375, 6.3702392578125, 6.750244140625, 7.1302490234375, 7.51025390625, 7.8902587890625, 8.270263671875, 8.6502685546875, 9.0302734375, 9.4102783203125, 9.790283203125, 10.1702880859375, 10.55029296875, 10.9302978515625, 11.310302734375, 11.6903076171875, 12.0703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 11.0, 12.0, 15.0, 19.0, 23.0, 39.0, 26.0, 39.0, 40.0, 44.0, 38.0, 55.0, 44.0, 50.0, 60.0, 49.0, 40.0, 53.0, 48.0, 34.0, 46.0, 36.0, 25.0, 33.0, 27.0, 15.0, 21.0, 10.0, 15.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.0714111328125, -7.752197265625, -7.4329833984375, -7.11376953125, -6.7945556640625, -6.475341796875, -6.1561279296875, -5.8369140625, -5.5177001953125, -5.198486328125, -4.8792724609375, -4.56005859375, -4.2408447265625, -3.921630859375, -3.6024169921875, -3.283203125, -2.9639892578125, -2.644775390625, -2.3255615234375, -2.00634765625, -1.6871337890625, -1.367919921875, -1.0487060546875, -0.7294921875, -0.4102783203125, -0.091064453125, 0.2281494140625, 0.54736328125, 0.8665771484375, 1.185791015625, 1.5050048828125, 1.82421875, 2.1434326171875, 2.462646484375, 2.7818603515625, 3.10107421875, 3.4202880859375, 3.739501953125, 4.0587158203125, 4.3779296875, 4.6971435546875, 5.016357421875, 5.3355712890625, 5.65478515625, 5.9739990234375, 6.293212890625, 6.6124267578125, 6.931640625, 7.2508544921875, 7.570068359375, 7.8892822265625, 8.20849609375, 8.5277099609375, 8.846923828125, 9.1661376953125, 9.4853515625, 9.8045654296875, 10.123779296875, 10.4429931640625, 10.76220703125, 11.0814208984375, 11.400634765625, 11.7198486328125, 12.0390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 9.0, 3.0, 5.0, 16.0, 13.0, 19.0, 27.0, 43.0, 55.0, 86.0, 160.0, 310.0, 682.0, 1611.0, 4617.0, 14834.0, 58425.0, 394976.0, 479008.0, 68387.0, 16743.0, 5250.0, 1777.0, 700.0, 329.0, 160.0, 68.0, 69.0, 41.0, 30.0, 29.0, 12.0, 12.0, 8.0, 10.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.7109375, -8.46240234375, -8.2138671875, -7.96533203125, -7.716796875, -7.46826171875, -7.2197265625, -6.97119140625, -6.72265625, -6.47412109375, -6.2255859375, -5.97705078125, -5.728515625, -5.47998046875, -5.2314453125, -4.98291015625, -4.734375, -4.48583984375, -4.2373046875, -3.98876953125, -3.740234375, -3.49169921875, -3.2431640625, -2.99462890625, -2.74609375, -2.49755859375, -2.2490234375, -2.00048828125, -1.751953125, -1.50341796875, -1.2548828125, -1.00634765625, -0.7578125, -0.50927734375, -0.2607421875, -0.01220703125, 0.236328125, 0.48486328125, 0.7333984375, 0.98193359375, 1.23046875, 1.47900390625, 1.7275390625, 1.97607421875, 2.224609375, 2.47314453125, 2.7216796875, 2.97021484375, 3.21875, 3.46728515625, 3.7158203125, 3.96435546875, 4.212890625, 4.46142578125, 4.7099609375, 4.95849609375, 5.20703125, 5.45556640625, 5.7041015625, 5.95263671875, 6.201171875, 6.44970703125, 6.6982421875, 6.94677734375, 7.1953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 4.0, 14.0, 9.0, 13.0, 11.0, 21.0, 16.0, 27.0, 35.0, 67.0, 115.0, 220.0, 189.0, 64.0, 39.0, 33.0, 21.0, 21.0, 6.0, 12.0, 12.0, 11.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0015316009521484375, -0.001493014395236969, -0.0014544278383255005, -0.001415841281414032, -0.0013772547245025635, -0.001338668167591095, -0.0013000816106796265, -0.001261495053768158, -0.0012229084968566895, -0.001184321939945221, -0.0011457353830337524, -0.001107148826122284, -0.0010685622692108154, -0.001029975712299347, -0.0009913891553878784, -0.0009528025984764099, -0.0009142160415649414, -0.0008756294846534729, -0.0008370429277420044, -0.0007984563708305359, -0.0007598698139190674, -0.0007212832570075989, -0.0006826967000961304, -0.0006441101431846619, -0.0006055235862731934, -0.0005669370293617249, -0.0005283504724502563, -0.0004897639155387878, -0.00045117735862731934, -0.00041259080171585083, -0.0003740042448043823, -0.0003354176878929138, -0.0002968311309814453, -0.0002582445740699768, -0.0002196580171585083, -0.0001810714602470398, -0.0001424849033355713, -0.00010389834642410278, -6.531178951263428e-05, -2.672523260116577e-05, 1.1861324310302734e-05, 5.044788122177124e-05, 8.903443813323975e-05, 0.00012762099504470825, 0.00016620755195617676, 0.00020479410886764526, 0.00024338066577911377, 0.0002819672226905823, 0.0003205537796020508, 0.0003591403365135193, 0.0003977268934249878, 0.0004363134503364563, 0.0004749000072479248, 0.0005134865641593933, 0.0005520731210708618, 0.0005906596779823303, 0.0006292462348937988, 0.0006678327918052673, 0.0007064193487167358, 0.0007450059056282043, 0.0007835924625396729, 0.0008221790194511414, 0.0008607655763626099, 0.0008993521332740784, 0.0009379386901855469]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 5.0, 23.0, 27.0, 36.0, 62.0, 104.0, 181.0, 302.0, 667.0, 1513.0, 4067.0, 14047.0, 66311.0, 563851.0, 336773.0, 44759.0, 10198.0, 3193.0, 1160.0, 551.0, 266.0, 161.0, 111.0, 56.0, 33.0, 26.0, 20.0, 18.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.6171875, -10.329345703125, -10.04150390625, -9.753662109375, -9.4658203125, -9.177978515625, -8.89013671875, -8.602294921875, -8.314453125, -8.026611328125, -7.73876953125, -7.450927734375, -7.1630859375, -6.875244140625, -6.58740234375, -6.299560546875, -6.01171875, -5.723876953125, -5.43603515625, -5.148193359375, -4.8603515625, -4.572509765625, -4.28466796875, -3.996826171875, -3.708984375, -3.421142578125, -3.13330078125, -2.845458984375, -2.5576171875, -2.269775390625, -1.98193359375, -1.694091796875, -1.40625, -1.118408203125, -0.83056640625, -0.542724609375, -0.2548828125, 0.032958984375, 0.32080078125, 0.608642578125, 0.896484375, 1.184326171875, 1.47216796875, 1.760009765625, 2.0478515625, 2.335693359375, 2.62353515625, 2.911376953125, 3.19921875, 3.487060546875, 3.77490234375, 4.062744140625, 4.3505859375, 4.638427734375, 4.92626953125, 5.214111328125, 5.501953125, 5.789794921875, 6.07763671875, 6.365478515625, 6.6533203125, 6.941162109375, 7.22900390625, 7.516845703125, 7.8046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 0.0, 7.0, 3.0, 2.0, 10.0, 13.0, 17.0, 24.0, 22.0, 48.0, 57.0, 80.0, 130.0, 171.0, 132.0, 76.0, 56.0, 32.0, 33.0, 26.0, 20.0, 12.0, 14.0, 3.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.76953125, -7.591217041015625, -7.41290283203125, -7.234588623046875, -7.0562744140625, -6.877960205078125, -6.69964599609375, -6.521331787109375, -6.343017578125, -6.164703369140625, -5.98638916015625, -5.808074951171875, -5.6297607421875, -5.451446533203125, -5.27313232421875, -5.094818115234375, -4.91650390625, -4.738189697265625, -4.55987548828125, -4.381561279296875, -4.2032470703125, -4.024932861328125, -3.84661865234375, -3.668304443359375, -3.489990234375, -3.311676025390625, -3.13336181640625, -2.955047607421875, -2.7767333984375, -2.598419189453125, -2.42010498046875, -2.241790771484375, -2.0634765625, -1.885162353515625, -1.70684814453125, -1.528533935546875, -1.3502197265625, -1.171905517578125, -0.99359130859375, -0.815277099609375, -0.636962890625, -0.458648681640625, -0.28033447265625, -0.102020263671875, 0.0762939453125, 0.254608154296875, 0.43292236328125, 0.611236572265625, 0.78955078125, 0.967864990234375, 1.14617919921875, 1.324493408203125, 1.5028076171875, 1.681121826171875, 1.85943603515625, 2.037750244140625, 2.216064453125, 2.394378662109375, 2.57269287109375, 2.751007080078125, 2.9293212890625, 3.107635498046875, 3.28594970703125, 3.464263916015625, 3.642578125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 18.0, 40.0, 98.0, 147.0, 208.0, 189.0, 132.0, 89.0, 41.0, 20.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.54129028320312, -113.21691131591797, -108.89253234863281, -104.56814575195312, -100.24376678466797, -95.91938781738281, -91.59500122070312, -87.27062225341797, -82.94624328613281, -78.62186431884766, -74.2974853515625, -69.97309875488281, -65.64871978759766, -61.3243408203125, -56.99995803833008, -52.675575256347656, -48.3511962890625, -44.026817321777344, -39.70243453979492, -35.3780517578125, -31.053672790527344, -26.729291915893555, -22.404911041259766, -18.080530166625977, -13.756149291992188, -9.431768417358398, -5.107387542724609, -0.7830066680908203, 3.5413742065429688, 7.865755081176758, 12.190135955810547, 16.514516830444336, 20.838882446289062, 25.16326332092285, 29.48764419555664, 33.81202697753906, 38.13640594482422, 42.460784912109375, 46.7851676940918, 51.10955047607422, 55.433929443359375, 59.75830841064453, 64.08268737792969, 68.40707397460938, 72.73145294189453, 77.05583190917969, 81.38021850585938, 85.70459747314453, 90.02897644042969, 94.35335540771484, 98.677734375, 103.00212097167969, 107.32649993896484, 111.65087890625, 115.97526550292969, 120.29964447021484, 124.6240234375, 128.9484100341797, 133.2727813720703, 137.59716796875, 141.92153930664062, 146.2459259033203, 150.5703125, 154.89468383789062, 159.2190704345703]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 10.0, 12.0, 17.0, 21.0, 22.0, 19.0, 16.0, 17.0, 31.0, 36.0, 42.0, 42.0, 29.0, 35.0, 45.0, 39.0, 42.0, 39.0, 53.0, 40.0, 36.0, 38.0, 32.0, 32.0, 24.0, 27.0, 22.0, 23.0, 24.0, 17.0, 24.0, 12.0, 12.0, 11.0, 6.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-43.39265441894531, -42.098670959472656, -40.8046875, -39.510704040527344, -38.21672058105469, -36.922733306884766, -35.62874984741211, -34.33476638793945, -33.0407829284668, -31.74679946899414, -30.452816009521484, -29.158830642700195, -27.86484718322754, -26.570863723754883, -25.276878356933594, -23.982894897460938, -22.68891143798828, -21.394927978515625, -20.10094451904297, -18.80695915222168, -17.512975692749023, -16.218992233276367, -14.925007820129395, -13.631023406982422, -12.337039947509766, -11.04305648803711, -9.749072074890137, -8.455087661743164, -7.161104202270508, -5.867120265960693, -4.573136329650879, -3.2791519165039062, -1.98516845703125, -0.6911845207214355, 0.6027994155883789, 1.8967833518981934, 3.190767288208008, 4.484751224517822, 5.778735160827637, 7.072719573974609, 8.366703033447266, 9.660686492919922, 10.954670906066895, 12.248655319213867, 13.542638778686523, 14.83662223815918, 16.13060760498047, 17.424591064453125, 18.71857452392578, 20.012557983398438, 21.306541442871094, 22.600526809692383, 23.89451026916504, 25.188493728637695, 26.482479095458984, 27.77646255493164, 29.070446014404297, 30.364429473876953, 31.65841293334961, 32.952396392822266, 34.24638366699219, 35.540367126464844, 36.8343505859375, 38.128334045410156, 39.42231750488281]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 12.0, 23.0, 30.0, 57.0, 111.0, 206.0, 438.0, 1015.0, 3434.0, 20672.0, 603760.0, 3525151.0, 32386.0, 4549.0, 1268.0, 527.0, 241.0, 124.0, 71.0, 63.0, 42.0, 25.0, 15.0, 14.0, 12.0, 7.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3125, -37.3564453125, -35.400390625, -33.4443359375, -31.48828125, -29.5322265625, -27.576171875, -25.6201171875, -23.6640625, -21.7080078125, -19.751953125, -17.7958984375, -15.83984375, -13.8837890625, -11.927734375, -9.9716796875, -8.015625, -6.0595703125, -4.103515625, -2.1474609375, -0.19140625, 1.7646484375, 3.720703125, 5.6767578125, 7.6328125, 9.5888671875, 11.544921875, 13.5009765625, 15.45703125, 17.4130859375, 19.369140625, 21.3251953125, 23.28125, 25.2373046875, 27.193359375, 29.1494140625, 31.10546875, 33.0615234375, 35.017578125, 36.9736328125, 38.9296875, 40.8857421875, 42.841796875, 44.7978515625, 46.75390625, 48.7099609375, 50.666015625, 52.6220703125, 54.578125, 56.5341796875, 58.490234375, 60.4462890625, 62.40234375, 64.3583984375, 66.314453125, 68.2705078125, 70.2265625, 72.1826171875, 74.138671875, 76.0947265625, 78.05078125, 80.0068359375, 81.962890625, 83.9189453125, 85.875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 15.0, 22.0, 23.0, 35.0, 47.0, 90.0, 86.0, 106.0, 111.0, 115.0, 94.0, 70.0, 55.0, 55.0, 24.0, 18.0, 9.0, 10.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.615631103515625, -3.44805908203125, -3.280487060546875, -3.1129150390625, -2.945343017578125, -2.77777099609375, -2.610198974609375, -2.442626953125, -2.275054931640625, -2.10748291015625, -1.939910888671875, -1.7723388671875, -1.604766845703125, -1.43719482421875, -1.269622802734375, -1.10205078125, -0.934478759765625, -0.76690673828125, -0.599334716796875, -0.4317626953125, -0.264190673828125, -0.09661865234375, 0.070953369140625, 0.238525390625, 0.406097412109375, 0.57366943359375, 0.741241455078125, 0.9088134765625, 1.076385498046875, 1.24395751953125, 1.411529541015625, 1.5791015625, 1.746673583984375, 1.91424560546875, 2.081817626953125, 2.2493896484375, 2.416961669921875, 2.58453369140625, 2.752105712890625, 2.919677734375, 3.087249755859375, 3.25482177734375, 3.422393798828125, 3.5899658203125, 3.757537841796875, 3.92510986328125, 4.092681884765625, 4.26025390625, 4.427825927734375, 4.59539794921875, 4.762969970703125, 4.9305419921875, 5.098114013671875, 5.26568603515625, 5.433258056640625, 5.600830078125, 5.768402099609375, 5.93597412109375, 6.103546142578125, 6.2711181640625, 6.438690185546875, 6.60626220703125, 6.773834228515625, 6.94140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 1.0, 6.0, 5.0, 6.0, 9.0, 20.0, 19.0, 20.0, 42.0, 61.0, 81.0, 118.0, 217.0, 407.0, 794.0, 1990.0, 5424.0, 17762.0, 71384.0, 479924.0, 3313200.0, 238441.0, 45280.0, 12128.0, 3925.0, 1572.0, 630.0, 322.0, 186.0, 104.0, 60.0, 34.0, 26.0, 22.0, 13.0, 11.0, 8.0, 9.0, 10.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.4150390625, -18.705078125, -17.9951171875, -17.28515625, -16.5751953125, -15.865234375, -15.1552734375, -14.4453125, -13.7353515625, -13.025390625, -12.3154296875, -11.60546875, -10.8955078125, -10.185546875, -9.4755859375, -8.765625, -8.0556640625, -7.345703125, -6.6357421875, -5.92578125, -5.2158203125, -4.505859375, -3.7958984375, -3.0859375, -2.3759765625, -1.666015625, -0.9560546875, -0.24609375, 0.4638671875, 1.173828125, 1.8837890625, 2.59375, 3.3037109375, 4.013671875, 4.7236328125, 5.43359375, 6.1435546875, 6.853515625, 7.5634765625, 8.2734375, 8.9833984375, 9.693359375, 10.4033203125, 11.11328125, 11.8232421875, 12.533203125, 13.2431640625, 13.953125, 14.6630859375, 15.373046875, 16.0830078125, 16.79296875, 17.5029296875, 18.212890625, 18.9228515625, 19.6328125, 20.3427734375, 21.052734375, 21.7626953125, 22.47265625, 23.1826171875, 23.892578125, 24.6025390625, 25.3125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 12.0, 18.0, 21.0, 40.0, 48.0, 76.0, 103.0, 188.0, 334.0, 1267.0, 1067.0, 401.0, 173.0, 110.0, 57.0, 48.0, 31.0, 18.0, 15.0, 11.0, 5.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.234375, -10.972900390625, -10.71142578125, -10.449951171875, -10.1884765625, -9.927001953125, -9.66552734375, -9.404052734375, -9.142578125, -8.881103515625, -8.61962890625, -8.358154296875, -8.0966796875, -7.835205078125, -7.57373046875, -7.312255859375, -7.05078125, -6.789306640625, -6.52783203125, -6.266357421875, -6.0048828125, -5.743408203125, -5.48193359375, -5.220458984375, -4.958984375, -4.697509765625, -4.43603515625, -4.174560546875, -3.9130859375, -3.651611328125, -3.39013671875, -3.128662109375, -2.8671875, -2.605712890625, -2.34423828125, -2.082763671875, -1.8212890625, -1.559814453125, -1.29833984375, -1.036865234375, -0.775390625, -0.513916015625, -0.25244140625, 0.009033203125, 0.2705078125, 0.531982421875, 0.79345703125, 1.054931640625, 1.31640625, 1.577880859375, 1.83935546875, 2.100830078125, 2.3623046875, 2.623779296875, 2.88525390625, 3.146728515625, 3.408203125, 3.669677734375, 3.93115234375, 4.192626953125, 4.4541015625, 4.715576171875, 4.97705078125, 5.238525390625, 5.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 24.0, 28.0, 41.0, 44.0, 66.0, 78.0, 78.0, 91.0, 100.0, 101.0, 81.0, 64.0, 54.0, 40.0, 16.0, 23.0, 16.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.32663917541504, -29.106979370117188, -27.887319564819336, -26.667659759521484, -25.447999954223633, -24.22834014892578, -23.008678436279297, -21.789020538330078, -20.569358825683594, -19.349699020385742, -18.13003921508789, -16.91037940979004, -15.690719604492188, -14.471059799194336, -13.251399040222168, -12.031739234924316, -10.812080383300781, -9.59242057800293, -8.372760772705078, -7.153100490570068, -5.933440685272217, -4.713780879974365, -3.4941205978393555, -2.274460792541504, -1.0548009872436523, 0.16485893726348877, 1.3845188617706299, 2.6041789054870605, 3.823838710784912, 5.043498516082764, 6.263158798217773, 7.482818603515625, 8.702476501464844, 9.922136306762695, 11.141796112060547, 12.361455917358398, 13.58111572265625, 14.800775527954102, 16.020435333251953, 17.240097045898438, 18.459754943847656, 19.679414749145508, 20.89907455444336, 22.11873435974121, 23.338394165039062, 24.558053970336914, 25.777713775634766, 26.99737548828125, 28.2170352935791, 29.436695098876953, 30.656354904174805, 31.876014709472656, 33.09567642211914, 34.31533432006836, 35.534996032714844, 36.75465393066406, 37.97431564331055, 39.19397735595703, 40.41363525390625, 41.633296966552734, 42.85295486450195, 44.07261657714844, 45.292274475097656, 46.51193618774414, 47.73159408569336]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 15.0, 11.0, 7.0, 18.0, 13.0, 16.0, 19.0, 24.0, 27.0, 19.0, 33.0, 34.0, 38.0, 56.0, 34.0, 29.0, 41.0, 51.0, 54.0, 39.0, 29.0, 41.0, 47.0, 35.0, 28.0, 40.0, 29.0, 20.0, 23.0, 18.0, 16.0, 20.0, 16.0, 12.0, 8.0, 10.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.020980834960938, -21.336862564086914, -20.65274429321289, -19.9686279296875, -19.284509658813477, -18.600391387939453, -17.91627311706543, -17.232154846191406, -16.548038482666016, -15.863920211791992, -15.179802894592285, -14.495684623718262, -13.811567306518555, -13.127449035644531, -12.443330764770508, -11.759212493896484, -11.075094223022461, -10.390975952148438, -9.70685863494873, -9.022740364074707, -8.338623046875, -7.654504776000977, -6.970386505126953, -6.286268711090088, -5.602150917053223, -4.918033123016357, -4.233915328979492, -3.5497970581054688, -2.8656792640686035, -2.1815614700317383, -1.4974431991577148, -0.8133254051208496, -0.1292095184326172, 0.5549083948135376, 1.2390263080596924, 1.9231443405151367, 2.607262134552002, 3.291379928588867, 3.9754981994628906, 4.659615993499756, 5.343733787536621, 6.027851581573486, 6.711969375610352, 7.396087646484375, 8.080205917358398, 8.764323234558105, 9.448441505432129, 10.132558822631836, 10.81667709350586, 11.500795364379883, 12.18491268157959, 12.869030952453613, 13.55314826965332, 14.237266540527344, 14.921384811401367, 15.60550308227539, 16.28961944580078, 16.973737716674805, 17.657855987548828, 18.34197235107422, 19.026090621948242, 19.710208892822266, 20.39432716369629, 21.078445434570312, 21.762563705444336]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 5.0, 10.0, 10.0, 18.0, 34.0, 60.0, 72.0, 179.0, 313.0, 844.0, 2841.0, 22822.0, 496092.0, 498119.0, 22621.0, 2875.0, 853.0, 353.0, 183.0, 90.0, 69.0, 29.0, 14.0, 17.0, 6.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.109375, -29.553955078125, -27.99853515625, -26.443115234375, -24.8876953125, -23.332275390625, -21.77685546875, -20.221435546875, -18.666015625, -17.110595703125, -15.55517578125, -13.999755859375, -12.4443359375, -10.888916015625, -9.33349609375, -7.778076171875, -6.22265625, -4.667236328125, -3.11181640625, -1.556396484375, -0.0009765625, 1.554443359375, 3.10986328125, 4.665283203125, 6.220703125, 7.776123046875, 9.33154296875, 10.886962890625, 12.4423828125, 13.997802734375, 15.55322265625, 17.108642578125, 18.6640625, 20.219482421875, 21.77490234375, 23.330322265625, 24.8857421875, 26.441162109375, 27.99658203125, 29.552001953125, 31.107421875, 32.662841796875, 34.21826171875, 35.773681640625, 37.3291015625, 38.884521484375, 40.43994140625, 41.995361328125, 43.55078125, 45.106201171875, 46.66162109375, 48.217041015625, 49.7724609375, 51.327880859375, 52.88330078125, 54.438720703125, 55.994140625, 57.549560546875, 59.10498046875, 60.660400390625, 62.2158203125, 63.771240234375, 65.32666015625, 66.882080078125, 68.4375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 17.0, 11.0, 16.0, 39.0, 41.0, 60.0, 89.0, 99.0, 96.0, 106.0, 95.0, 85.0, 80.0, 48.0, 43.0, 28.0, 13.0, 13.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.5552978515625, -3.387939453125, -3.2205810546875, -3.05322265625, -2.8858642578125, -2.718505859375, -2.5511474609375, -2.3837890625, -2.2164306640625, -2.049072265625, -1.8817138671875, -1.71435546875, -1.5469970703125, -1.379638671875, -1.2122802734375, -1.044921875, -0.8775634765625, -0.710205078125, -0.5428466796875, -0.37548828125, -0.2081298828125, -0.040771484375, 0.1265869140625, 0.2939453125, 0.4613037109375, 0.628662109375, 0.7960205078125, 0.96337890625, 1.1307373046875, 1.298095703125, 1.4654541015625, 1.6328125, 1.8001708984375, 1.967529296875, 2.1348876953125, 2.30224609375, 2.4696044921875, 2.636962890625, 2.8043212890625, 2.9716796875, 3.1390380859375, 3.306396484375, 3.4737548828125, 3.64111328125, 3.8084716796875, 3.975830078125, 4.1431884765625, 4.310546875, 4.4779052734375, 4.645263671875, 4.8126220703125, 4.97998046875, 5.1473388671875, 5.314697265625, 5.4820556640625, 5.6494140625, 5.8167724609375, 5.984130859375, 6.1514892578125, 6.31884765625, 6.4862060546875, 6.653564453125, 6.8209228515625, 6.98828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 13.0, 18.0, 12.0, 28.0, 34.0, 56.0, 127.0, 154.0, 332.0, 616.0, 1188.0, 2623.0, 5893.0, 13638.0, 31727.0, 82487.0, 397323.0, 377168.0, 79776.0, 31209.0, 13196.0, 5762.0, 2638.0, 1151.0, 600.0, 311.0, 161.0, 113.0, 61.0, 35.0, 29.0, 18.0, 12.0, 10.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5703125, -11.1844482421875, -10.798583984375, -10.4127197265625, -10.02685546875, -9.6409912109375, -9.255126953125, -8.8692626953125, -8.4833984375, -8.0975341796875, -7.711669921875, -7.3258056640625, -6.93994140625, -6.5540771484375, -6.168212890625, -5.7823486328125, -5.396484375, -5.0106201171875, -4.624755859375, -4.2388916015625, -3.85302734375, -3.4671630859375, -3.081298828125, -2.6954345703125, -2.3095703125, -1.9237060546875, -1.537841796875, -1.1519775390625, -0.76611328125, -0.3802490234375, 0.005615234375, 0.3914794921875, 0.77734375, 1.1632080078125, 1.549072265625, 1.9349365234375, 2.32080078125, 2.7066650390625, 3.092529296875, 3.4783935546875, 3.8642578125, 4.2501220703125, 4.635986328125, 5.0218505859375, 5.40771484375, 5.7935791015625, 6.179443359375, 6.5653076171875, 6.951171875, 7.3370361328125, 7.722900390625, 8.1087646484375, 8.49462890625, 8.8804931640625, 9.266357421875, 9.6522216796875, 10.0380859375, 10.4239501953125, 10.809814453125, 11.1956787109375, 11.58154296875, 11.9674072265625, 12.353271484375, 12.7391357421875, 13.125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 12.0, 13.0, 15.0, 19.0, 32.0, 22.0, 38.0, 34.0, 42.0, 46.0, 54.0, 47.0, 56.0, 46.0, 42.0, 40.0, 57.0, 57.0, 37.0, 43.0, 40.0, 24.0, 30.0, 25.0, 22.0, 25.0, 12.0, 16.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.9296875, -10.5806884765625, -10.231689453125, -9.8826904296875, -9.53369140625, -9.1846923828125, -8.835693359375, -8.4866943359375, -8.1376953125, -7.7886962890625, -7.439697265625, -7.0906982421875, -6.74169921875, -6.3927001953125, -6.043701171875, -5.6947021484375, -5.345703125, -4.9967041015625, -4.647705078125, -4.2987060546875, -3.94970703125, -3.6007080078125, -3.251708984375, -2.9027099609375, -2.5537109375, -2.2047119140625, -1.855712890625, -1.5067138671875, -1.15771484375, -0.8087158203125, -0.459716796875, -0.1107177734375, 0.23828125, 0.5872802734375, 0.936279296875, 1.2852783203125, 1.63427734375, 1.9832763671875, 2.332275390625, 2.6812744140625, 3.0302734375, 3.3792724609375, 3.728271484375, 4.0772705078125, 4.42626953125, 4.7752685546875, 5.124267578125, 5.4732666015625, 5.822265625, 6.1712646484375, 6.520263671875, 6.8692626953125, 7.21826171875, 7.5672607421875, 7.916259765625, 8.2652587890625, 8.6142578125, 8.9632568359375, 9.312255859375, 9.6612548828125, 10.01025390625, 10.3592529296875, 10.708251953125, 11.0572509765625, 11.40625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 13.0, 9.0, 19.0, 26.0, 24.0, 56.0, 61.0, 116.0, 159.0, 294.0, 562.0, 1191.0, 2672.0, 6231.0, 16236.0, 45079.0, 173982.0, 581058.0, 153034.0, 41694.0, 15239.0, 5774.0, 2545.0, 1172.0, 558.0, 267.0, 159.0, 83.0, 73.0, 56.0, 35.0, 15.0, 15.0, 10.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.2152099609375, -5.031982421875, -4.8487548828125, -4.66552734375, -4.4822998046875, -4.299072265625, -4.1158447265625, -3.9326171875, -3.7493896484375, -3.566162109375, -3.3829345703125, -3.19970703125, -3.0164794921875, -2.833251953125, -2.6500244140625, -2.466796875, -2.2835693359375, -2.100341796875, -1.9171142578125, -1.73388671875, -1.5506591796875, -1.367431640625, -1.1842041015625, -1.0009765625, -0.8177490234375, -0.634521484375, -0.4512939453125, -0.26806640625, -0.0848388671875, 0.098388671875, 0.2816162109375, 0.46484375, 0.6480712890625, 0.831298828125, 1.0145263671875, 1.19775390625, 1.3809814453125, 1.564208984375, 1.7474365234375, 1.9306640625, 2.1138916015625, 2.297119140625, 2.4803466796875, 2.66357421875, 2.8468017578125, 3.030029296875, 3.2132568359375, 3.396484375, 3.5797119140625, 3.762939453125, 3.9461669921875, 4.12939453125, 4.3126220703125, 4.495849609375, 4.6790771484375, 4.8623046875, 5.0455322265625, 5.228759765625, 5.4119873046875, 5.59521484375, 5.7784423828125, 5.961669921875, 6.1448974609375, 6.328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 11.0, 12.0, 16.0, 9.0, 17.0, 22.0, 56.0, 133.0, 298.0, 194.0, 80.0, 29.0, 21.0, 12.0, 14.0, 17.0, 7.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011692047119140625, -0.001123771071434021, -0.0010783374309539795, -0.001032903790473938, -0.0009874701499938965, -0.000942036509513855, -0.0008966028690338135, -0.000851169228553772, -0.0008057355880737305, -0.000760301947593689, -0.0007148683071136475, -0.000669434666633606, -0.0006240010261535645, -0.000578567385673523, -0.0005331337451934814, -0.00048770010471343994, -0.00044226646423339844, -0.00039683282375335693, -0.00035139918327331543, -0.0003059655427932739, -0.0002605319023132324, -0.00021509826183319092, -0.00016966462135314941, -0.0001242309808731079, -7.87973403930664e-05, -3.33636999130249e-05, 1.2069940567016602e-05, 5.7503581047058105e-05, 0.00010293722152709961, 0.0001483708620071411, 0.00019380450248718262, 0.00023923814296722412, 0.0002846717834472656, 0.00033010542392730713, 0.00037553906440734863, 0.00042097270488739014, 0.00046640634536743164, 0.0005118399858474731, 0.0005572736263275146, 0.0006027072668075562, 0.0006481409072875977, 0.0006935745477676392, 0.0007390081882476807, 0.0007844418287277222, 0.0008298754692077637, 0.0008753091096878052, 0.0009207427501678467, 0.0009661763906478882, 0.0010116100311279297, 0.0010570436716079712, 0.0011024773120880127, 0.0011479109525680542, 0.0011933445930480957, 0.0012387782335281372, 0.0012842118740081787, 0.0013296455144882202, 0.0013750791549682617, 0.0014205127954483032, 0.0014659464359283447, 0.0015113800764083862, 0.0015568137168884277, 0.0016022473573684692, 0.0016476809978485107, 0.0016931146383285522, 0.0017385482788085938]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 9.0, 22.0, 23.0, 56.0, 75.0, 130.0, 233.0, 394.0, 785.0, 1611.0, 4027.0, 11533.0, 38178.0, 152849.0, 617076.0, 162222.0, 39590.0, 12161.0, 4119.0, 1750.0, 772.0, 359.0, 217.0, 132.0, 70.0, 53.0, 28.0, 20.0, 17.0, 10.0, 8.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.39300537109375, -6.1688232421875, -5.94464111328125, -5.720458984375, -5.49627685546875, -5.2720947265625, -5.04791259765625, -4.82373046875, -4.59954833984375, -4.3753662109375, -4.15118408203125, -3.927001953125, -3.70281982421875, -3.4786376953125, -3.25445556640625, -3.0302734375, -2.80609130859375, -2.5819091796875, -2.35772705078125, -2.133544921875, -1.90936279296875, -1.6851806640625, -1.46099853515625, -1.23681640625, -1.01263427734375, -0.7884521484375, -0.56427001953125, -0.340087890625, -0.11590576171875, 0.1082763671875, 0.33245849609375, 0.556640625, 0.78082275390625, 1.0050048828125, 1.22918701171875, 1.453369140625, 1.67755126953125, 1.9017333984375, 2.12591552734375, 2.35009765625, 2.57427978515625, 2.7984619140625, 3.02264404296875, 3.246826171875, 3.47100830078125, 3.6951904296875, 3.91937255859375, 4.1435546875, 4.36773681640625, 4.5919189453125, 4.81610107421875, 5.040283203125, 5.26446533203125, 5.4886474609375, 5.71282958984375, 5.93701171875, 6.16119384765625, 6.3853759765625, 6.60955810546875, 6.833740234375, 7.05792236328125, 7.2821044921875, 7.50628662109375, 7.73046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 6.0, 7.0, 10.0, 12.0, 20.0, 18.0, 35.0, 38.0, 59.0, 90.0, 122.0, 139.0, 118.0, 96.0, 50.0, 40.0, 32.0, 27.0, 26.0, 10.0, 14.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9053955078125, -4.713134765625, -4.5208740234375, -4.32861328125, -4.1363525390625, -3.944091796875, -3.7518310546875, -3.5595703125, -3.3673095703125, -3.175048828125, -2.9827880859375, -2.79052734375, -2.5982666015625, -2.406005859375, -2.2137451171875, -2.021484375, -1.8292236328125, -1.636962890625, -1.4447021484375, -1.25244140625, -1.0601806640625, -0.867919921875, -0.6756591796875, -0.4833984375, -0.2911376953125, -0.098876953125, 0.0933837890625, 0.28564453125, 0.4779052734375, 0.670166015625, 0.8624267578125, 1.0546875, 1.2469482421875, 1.439208984375, 1.6314697265625, 1.82373046875, 2.0159912109375, 2.208251953125, 2.4005126953125, 2.5927734375, 2.7850341796875, 2.977294921875, 3.1695556640625, 3.36181640625, 3.5540771484375, 3.746337890625, 3.9385986328125, 4.130859375, 4.3231201171875, 4.515380859375, 4.7076416015625, 4.89990234375, 5.0921630859375, 5.284423828125, 5.4766845703125, 5.6689453125, 5.8612060546875, 6.053466796875, 6.2457275390625, 6.43798828125, 6.6302490234375, 6.822509765625, 7.0147705078125, 7.20703125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 3.0, 6.0, 8.0, 13.0, 19.0, 30.0, 31.0, 42.0, 58.0, 60.0, 56.0, 95.0, 75.0, 88.0, 90.0, 83.0, 47.0, 53.0, 40.0, 28.0, 24.0, 18.0, 10.0, 9.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.55586242675781, -73.69187927246094, -71.82788848876953, -69.96390533447266, -68.09991455078125, -66.23593139648438, -64.3719482421875, -62.507957458496094, -60.64397430419922, -58.77998733520508, -56.91600036621094, -55.05201721191406, -53.18803024291992, -51.32404327392578, -49.46005630493164, -47.5960693359375, -45.73208236694336, -43.86809539794922, -42.00410842895508, -40.14012145996094, -38.27613830566406, -36.41215133666992, -34.54816436767578, -32.68417739868164, -30.820192337036133, -28.956205368041992, -27.092220306396484, -25.228233337402344, -23.364246368408203, -21.500261306762695, -19.636274337768555, -17.772289276123047, -15.90829849243164, -14.044312477111816, -12.180326461791992, -10.316339492797852, -8.452353477478027, -6.588367462158203, -4.7243804931640625, -2.8603944778442383, -0.9964084625244141, 0.8675777912139893, 2.7315640449523926, 4.595550537109375, 6.459536552429199, 8.323522567749023, 10.187509536743164, 12.051495552062988, 13.915481567382812, 15.779467582702637, 17.64345359802246, 19.5074405670166, 21.37142562866211, 23.23541259765625, 25.09939956665039, 26.96338653564453, 28.82737159729004, 30.69135856628418, 32.55534362792969, 34.41933059692383, 36.28331756591797, 38.147300720214844, 40.01129150390625, 41.875274658203125, 43.739261627197266]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 9.0, 6.0, 6.0, 13.0, 14.0, 6.0, 23.0, 21.0, 26.0, 13.0, 28.0, 37.0, 25.0, 39.0, 28.0, 38.0, 36.0, 46.0, 27.0, 32.0, 32.0, 38.0, 36.0, 35.0, 40.0, 43.0, 37.0, 30.0, 35.0, 18.0, 24.0, 20.0, 19.0, 18.0, 20.0, 14.0, 13.0, 8.0, 11.0, 5.0, 3.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-40.06098937988281, -38.774513244628906, -37.488037109375, -36.201560974121094, -34.91508483886719, -33.62860870361328, -32.342132568359375, -31.0556583404541, -29.769182205200195, -28.48270606994629, -27.196229934692383, -25.909753799438477, -24.623279571533203, -23.336803436279297, -22.05032730102539, -20.763851165771484, -19.477375030517578, -18.190898895263672, -16.904422760009766, -15.617947578430176, -14.33147144317627, -13.044995307922363, -11.758520126342773, -10.472043991088867, -9.185567855834961, -7.899091720581055, -6.612616062164307, -5.326140403747559, -4.039664268493652, -2.753188133239746, -1.466712474822998, -0.18023681640625, 1.1062393188476562, 2.3927152156829834, 3.6791911125183105, 4.965666770935059, 6.252142906188965, 7.538619041442871, 8.825094223022461, 10.111570358276367, 11.398046493530273, 12.68452262878418, 13.970998764038086, 15.257473945617676, 16.543949127197266, 17.830425262451172, 19.116901397705078, 20.403377532958984, 21.68985366821289, 22.976329803466797, 24.262805938720703, 25.54928207397461, 26.835758209228516, 28.122234344482422, 29.408708572387695, 30.6951847076416, 31.981660842895508, 33.26813507080078, 34.55461120605469, 35.841087341308594, 37.1275634765625, 38.414039611816406, 39.70051574707031, 40.98699188232422, 42.273468017578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 19.0, 25.0, 34.0, 48.0, 85.0, 159.0, 280.0, 575.0, 1404.0, 4282.0, 18365.0, 163416.0, 3877149.0, 108302.0, 14212.0, 3529.0, 1183.0, 473.0, 233.0, 162.0, 90.0, 66.0, 41.0, 29.0, 24.0, 16.0, 9.0, 13.0, 11.0, 6.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.5, -47.81787109375, -46.1357421875, -44.45361328125, -42.771484375, -41.08935546875, -39.4072265625, -37.72509765625, -36.04296875, -34.36083984375, -32.6787109375, -30.99658203125, -29.314453125, -27.63232421875, -25.9501953125, -24.26806640625, -22.5859375, -20.90380859375, -19.2216796875, -17.53955078125, -15.857421875, -14.17529296875, -12.4931640625, -10.81103515625, -9.12890625, -7.44677734375, -5.7646484375, -4.08251953125, -2.400390625, -0.71826171875, 0.9638671875, 2.64599609375, 4.328125, 6.01025390625, 7.6923828125, 9.37451171875, 11.056640625, 12.73876953125, 14.4208984375, 16.10302734375, 17.78515625, 19.46728515625, 21.1494140625, 22.83154296875, 24.513671875, 26.19580078125, 27.8779296875, 29.56005859375, 31.2421875, 32.92431640625, 34.6064453125, 36.28857421875, 37.970703125, 39.65283203125, 41.3349609375, 43.01708984375, 44.69921875, 46.38134765625, 48.0634765625, 49.74560546875, 51.427734375, 53.10986328125, 54.7919921875, 56.47412109375, 58.15625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 16.0, 26.0, 26.0, 37.0, 64.0, 75.0, 101.0, 94.0, 103.0, 101.0, 80.0, 72.0, 68.0, 52.0, 28.0, 13.0, 14.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.544921875, -3.379730224609375, -3.21453857421875, -3.049346923828125, -2.8841552734375, -2.718963623046875, -2.55377197265625, -2.388580322265625, -2.223388671875, -2.058197021484375, -1.89300537109375, -1.727813720703125, -1.5626220703125, -1.397430419921875, -1.23223876953125, -1.067047119140625, -0.90185546875, -0.736663818359375, -0.57147216796875, -0.406280517578125, -0.2410888671875, -0.075897216796875, 0.08929443359375, 0.254486083984375, 0.419677734375, 0.584869384765625, 0.75006103515625, 0.915252685546875, 1.0804443359375, 1.245635986328125, 1.41082763671875, 1.576019287109375, 1.7412109375, 1.906402587890625, 2.07159423828125, 2.236785888671875, 2.4019775390625, 2.567169189453125, 2.73236083984375, 2.897552490234375, 3.062744140625, 3.227935791015625, 3.39312744140625, 3.558319091796875, 3.7235107421875, 3.888702392578125, 4.05389404296875, 4.219085693359375, 4.38427734375, 4.549468994140625, 4.71466064453125, 4.879852294921875, 5.0450439453125, 5.210235595703125, 5.37542724609375, 5.540618896484375, 5.705810546875, 5.871002197265625, 6.03619384765625, 6.201385498046875, 6.3665771484375, 6.531768798828125, 6.69696044921875, 6.862152099609375, 7.02734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 11.0, 9.0, 12.0, 23.0, 35.0, 53.0, 73.0, 115.0, 161.0, 230.0, 302.0, 517.0, 739.0, 1130.0, 1781.0, 2714.0, 4397.0, 7429.0, 12962.0, 23705.0, 45350.0, 95566.0, 244408.0, 2143720.0, 1204827.0, 219820.0, 88275.0, 42509.0, 22425.0, 12329.0, 7050.0, 4198.0, 2611.0, 1676.0, 1066.0, 644.0, 427.0, 295.0, 202.0, 132.0, 102.0, 63.0, 56.0, 35.0, 26.0, 17.0, 10.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-10.71875, -10.3724365234375, -10.026123046875, -9.6798095703125, -9.33349609375, -8.9871826171875, -8.640869140625, -8.2945556640625, -7.9482421875, -7.6019287109375, -7.255615234375, -6.9093017578125, -6.56298828125, -6.2166748046875, -5.870361328125, -5.5240478515625, -5.177734375, -4.8314208984375, -4.485107421875, -4.1387939453125, -3.79248046875, -3.4461669921875, -3.099853515625, -2.7535400390625, -2.4072265625, -2.0609130859375, -1.714599609375, -1.3682861328125, -1.02197265625, -0.6756591796875, -0.329345703125, 0.0169677734375, 0.36328125, 0.7095947265625, 1.055908203125, 1.4022216796875, 1.74853515625, 2.0948486328125, 2.441162109375, 2.7874755859375, 3.1337890625, 3.4801025390625, 3.826416015625, 4.1727294921875, 4.51904296875, 4.8653564453125, 5.211669921875, 5.5579833984375, 5.904296875, 6.2506103515625, 6.596923828125, 6.9432373046875, 7.28955078125, 7.6358642578125, 7.982177734375, 8.3284912109375, 8.6748046875, 9.0211181640625, 9.367431640625, 9.7137451171875, 10.06005859375, 10.4063720703125, 10.752685546875, 11.0989990234375, 11.4453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 7.0, 13.0, 24.0, 33.0, 60.0, 70.0, 103.0, 133.0, 221.0, 497.0, 1690.0, 475.0, 240.0, 139.0, 91.0, 55.0, 48.0, 30.0, 21.0, 17.0, 22.0, 11.0, 10.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.14990234375, -6.9365234375, -6.72314453125, -6.509765625, -6.29638671875, -6.0830078125, -5.86962890625, -5.65625, -5.44287109375, -5.2294921875, -5.01611328125, -4.802734375, -4.58935546875, -4.3759765625, -4.16259765625, -3.94921875, -3.73583984375, -3.5224609375, -3.30908203125, -3.095703125, -2.88232421875, -2.6689453125, -2.45556640625, -2.2421875, -2.02880859375, -1.8154296875, -1.60205078125, -1.388671875, -1.17529296875, -0.9619140625, -0.74853515625, -0.53515625, -0.32177734375, -0.1083984375, 0.10498046875, 0.318359375, 0.53173828125, 0.7451171875, 0.95849609375, 1.171875, 1.38525390625, 1.5986328125, 1.81201171875, 2.025390625, 2.23876953125, 2.4521484375, 2.66552734375, 2.87890625, 3.09228515625, 3.3056640625, 3.51904296875, 3.732421875, 3.94580078125, 4.1591796875, 4.37255859375, 4.5859375, 4.79931640625, 5.0126953125, 5.22607421875, 5.439453125, 5.65283203125, 5.8662109375, 6.07958984375, 6.29296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 15.0, 24.0, 47.0, 63.0, 89.0, 144.0, 124.0, 128.0, 114.0, 79.0, 63.0, 50.0, 24.0, 14.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.917701721191406, -60.19791793823242, -58.47813415527344, -56.75835418701172, -55.038570404052734, -53.31878662109375, -51.599002838134766, -49.87921905517578, -48.15943908691406, -46.43965530395508, -44.719871520996094, -43.000091552734375, -41.28030776977539, -39.560523986816406, -37.84074020385742, -36.12095642089844, -34.40117263793945, -32.68138885498047, -30.961606979370117, -29.241823196411133, -27.52204132080078, -25.802257537841797, -24.082473754882812, -22.362689971923828, -20.642908096313477, -18.923124313354492, -17.20334243774414, -15.483558654785156, -13.763775825500488, -12.04399299621582, -10.324209213256836, -8.604426383972168, -6.8846435546875, -5.164860725402832, -3.445077419281006, -1.7252941131591797, -0.005511283874511719, 1.7142715454101562, 3.4340553283691406, 5.153838157653809, 6.873620986938477, 8.593403816223145, 10.313186645507812, 12.032970428466797, 13.752753257751465, 15.472536087036133, 17.192319869995117, 18.91210174560547, 20.631885528564453, 22.351669311523438, 24.07145118713379, 25.791234970092773, 27.511016845703125, 29.23080062866211, 30.950584411621094, 32.67036819458008, 34.39015197753906, 36.10993576049805, 37.82971954345703, 39.54949951171875, 41.269283294677734, 42.98906707763672, 44.7088508605957, 46.42863464355469, 48.148414611816406]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 4.0, 9.0, 13.0, 12.0, 16.0, 13.0, 10.0, 26.0, 14.0, 46.0, 32.0, 34.0, 35.0, 29.0, 41.0, 52.0, 38.0, 45.0, 38.0, 51.0, 47.0, 39.0, 34.0, 31.0, 38.0, 25.0, 18.0, 26.0, 22.0, 12.0, 23.0, 23.0, 14.0, 12.0, 12.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.265933990478516, -19.642507553100586, -19.019081115722656, -18.39565658569336, -17.77223014831543, -17.1488037109375, -16.52537727355957, -15.90195083618164, -15.278525352478027, -14.655098915100098, -14.031673431396484, -13.408246994018555, -12.784820556640625, -12.161395072937012, -11.537968635559082, -10.914543151855469, -10.291116714477539, -9.66769027709961, -9.044264793395996, -8.420838356018066, -7.797412395477295, -7.173986434936523, -6.550559997558594, -5.927134037017822, -5.303708076477051, -4.680282115936279, -4.056856155395508, -3.433429718017578, -2.8100037574768066, -2.186577796936035, -1.5631515979766846, -0.939725399017334, -0.3162994384765625, 0.30712664127349854, 0.9305527210235596, 1.5539788007736206, 2.1774048805236816, 2.800830841064453, 3.4242570400238037, 4.047683238983154, 4.671109199523926, 5.294535160064697, 5.917961120605469, 6.541387557983398, 7.16481351852417, 7.788239479064941, 8.411665916442871, 9.035091400146484, 9.658517837524414, 10.281944274902344, 10.905369758605957, 11.528796195983887, 12.1522216796875, 12.77564811706543, 13.39907455444336, 14.022500991821289, 14.645926475524902, 15.269352912902832, 15.892778396606445, 16.516204833984375, 17.139631271362305, 17.763057708740234, 18.38648223876953, 19.00990867614746, 19.63333511352539]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 7.0, 6.0, 5.0, 17.0, 25.0, 42.0, 58.0, 119.0, 195.0, 357.0, 800.0, 2062.0, 8520.0, 57400.0, 445965.0, 460972.0, 59515.0, 8687.0, 2108.0, 802.0, 373.0, 189.0, 122.0, 75.0, 44.0, 23.0, 22.0, 17.0, 8.0, 6.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.21875, -44.142333984375, -43.06591796875, -41.989501953125, -40.9130859375, -39.836669921875, -38.76025390625, -37.683837890625, -36.607421875, -35.531005859375, -34.45458984375, -33.378173828125, -32.3017578125, -31.225341796875, -30.14892578125, -29.072509765625, -27.99609375, -26.919677734375, -25.84326171875, -24.766845703125, -23.6904296875, -22.614013671875, -21.53759765625, -20.461181640625, -19.384765625, -18.308349609375, -17.23193359375, -16.155517578125, -15.0791015625, -14.002685546875, -12.92626953125, -11.849853515625, -10.7734375, -9.697021484375, -8.62060546875, -7.544189453125, -6.4677734375, -5.391357421875, -4.31494140625, -3.238525390625, -2.162109375, -1.085693359375, -0.00927734375, 1.067138671875, 2.1435546875, 3.219970703125, 4.29638671875, 5.372802734375, 6.44921875, 7.525634765625, 8.60205078125, 9.678466796875, 10.7548828125, 11.831298828125, 12.90771484375, 13.984130859375, 15.060546875, 16.136962890625, 17.21337890625, 18.289794921875, 19.3662109375, 20.442626953125, 21.51904296875, 22.595458984375, 23.671875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 10.0, 15.0, 21.0, 26.0, 42.0, 51.0, 72.0, 82.0, 90.0, 94.0, 93.0, 92.0, 73.0, 62.0, 48.0, 39.0, 33.0, 20.0, 10.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.510162353515625, -3.34259033203125, -3.175018310546875, -3.0074462890625, -2.839874267578125, -2.67230224609375, -2.504730224609375, -2.337158203125, -2.169586181640625, -2.00201416015625, -1.834442138671875, -1.6668701171875, -1.499298095703125, -1.33172607421875, -1.164154052734375, -0.99658203125, -0.829010009765625, -0.66143798828125, -0.493865966796875, -0.3262939453125, -0.158721923828125, 0.00885009765625, 0.176422119140625, 0.343994140625, 0.511566162109375, 0.67913818359375, 0.846710205078125, 1.0142822265625, 1.181854248046875, 1.34942626953125, 1.516998291015625, 1.6845703125, 1.852142333984375, 2.01971435546875, 2.187286376953125, 2.3548583984375, 2.522430419921875, 2.69000244140625, 2.857574462890625, 3.025146484375, 3.192718505859375, 3.36029052734375, 3.527862548828125, 3.6954345703125, 3.863006591796875, 4.03057861328125, 4.198150634765625, 4.36572265625, 4.533294677734375, 4.70086669921875, 4.868438720703125, 5.0360107421875, 5.203582763671875, 5.37115478515625, 5.538726806640625, 5.706298828125, 5.873870849609375, 6.04144287109375, 6.209014892578125, 6.3765869140625, 6.544158935546875, 6.71173095703125, 6.879302978515625, 7.046875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 11.0, 12.0, 12.0, 15.0, 19.0, 36.0, 34.0, 47.0, 73.0, 95.0, 111.0, 158.0, 179.0, 240.0, 325.0, 526.0, 911.0, 2027.0, 4997.0, 14657.0, 46029.0, 147491.0, 472937.0, 247112.0, 73207.0, 23250.0, 7683.0, 2733.0, 1334.0, 675.0, 436.0, 289.0, 203.0, 139.0, 135.0, 119.0, 79.0, 48.0, 36.0, 40.0, 20.0, 18.0, 19.0, 11.0, 8.0, 7.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.8203125, -13.3843994140625, -12.948486328125, -12.5125732421875, -12.07666015625, -11.6407470703125, -11.204833984375, -10.7689208984375, -10.3330078125, -9.8970947265625, -9.461181640625, -9.0252685546875, -8.58935546875, -8.1534423828125, -7.717529296875, -7.2816162109375, -6.845703125, -6.4097900390625, -5.973876953125, -5.5379638671875, -5.10205078125, -4.6661376953125, -4.230224609375, -3.7943115234375, -3.3583984375, -2.9224853515625, -2.486572265625, -2.0506591796875, -1.61474609375, -1.1788330078125, -0.742919921875, -0.3070068359375, 0.12890625, 0.5648193359375, 1.000732421875, 1.4366455078125, 1.87255859375, 2.3084716796875, 2.744384765625, 3.1802978515625, 3.6162109375, 4.0521240234375, 4.488037109375, 4.9239501953125, 5.35986328125, 5.7957763671875, 6.231689453125, 6.6676025390625, 7.103515625, 7.5394287109375, 7.975341796875, 8.4112548828125, 8.84716796875, 9.2830810546875, 9.718994140625, 10.1549072265625, 10.5908203125, 11.0267333984375, 11.462646484375, 11.8985595703125, 12.33447265625, 12.7703857421875, 13.206298828125, 13.6422119140625, 14.078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 4.0, 6.0, 6.0, 8.0, 9.0, 22.0, 16.0, 19.0, 28.0, 31.0, 35.0, 39.0, 38.0, 45.0, 42.0, 39.0, 56.0, 35.0, 47.0, 41.0, 44.0, 39.0, 41.0, 39.0, 37.0, 24.0, 25.0, 18.0, 30.0, 21.0, 16.0, 16.0, 15.0, 14.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.2867431640625, -9.948486328125, -9.6102294921875, -9.27197265625, -8.9337158203125, -8.595458984375, -8.2572021484375, -7.9189453125, -7.5806884765625, -7.242431640625, -6.9041748046875, -6.56591796875, -6.2276611328125, -5.889404296875, -5.5511474609375, -5.212890625, -4.8746337890625, -4.536376953125, -4.1981201171875, -3.85986328125, -3.5216064453125, -3.183349609375, -2.8450927734375, -2.5068359375, -2.1685791015625, -1.830322265625, -1.4920654296875, -1.15380859375, -0.8155517578125, -0.477294921875, -0.1390380859375, 0.19921875, 0.5374755859375, 0.875732421875, 1.2139892578125, 1.55224609375, 1.8905029296875, 2.228759765625, 2.5670166015625, 2.9052734375, 3.2435302734375, 3.581787109375, 3.9200439453125, 4.25830078125, 4.5965576171875, 4.934814453125, 5.2730712890625, 5.611328125, 5.9495849609375, 6.287841796875, 6.6260986328125, 6.96435546875, 7.3026123046875, 7.640869140625, 7.9791259765625, 8.3173828125, 8.6556396484375, 8.993896484375, 9.3321533203125, 9.67041015625, 10.0086669921875, 10.346923828125, 10.6851806640625, 11.0234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 12.0, 7.0, 9.0, 11.0, 31.0, 48.0, 70.0, 129.0, 229.0, 400.0, 834.0, 1822.0, 4290.0, 11481.0, 33740.0, 111732.0, 450250.0, 311371.0, 81622.0, 25122.0, 8852.0, 3396.0, 1532.0, 731.0, 371.0, 177.0, 98.0, 77.0, 39.0, 35.0, 17.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.3798828125, -9.150390625, -8.9208984375, -8.69140625, -8.4619140625, -8.232421875, -8.0029296875, -7.7734375, -7.5439453125, -7.314453125, -7.0849609375, -6.85546875, -6.6259765625, -6.396484375, -6.1669921875, -5.9375, -5.7080078125, -5.478515625, -5.2490234375, -5.01953125, -4.7900390625, -4.560546875, -4.3310546875, -4.1015625, -3.8720703125, -3.642578125, -3.4130859375, -3.18359375, -2.9541015625, -2.724609375, -2.4951171875, -2.265625, -2.0361328125, -1.806640625, -1.5771484375, -1.34765625, -1.1181640625, -0.888671875, -0.6591796875, -0.4296875, -0.2001953125, 0.029296875, 0.2587890625, 0.48828125, 0.7177734375, 0.947265625, 1.1767578125, 1.40625, 1.6357421875, 1.865234375, 2.0947265625, 2.32421875, 2.5537109375, 2.783203125, 3.0126953125, 3.2421875, 3.4716796875, 3.701171875, 3.9306640625, 4.16015625, 4.3896484375, 4.619140625, 4.8486328125, 5.078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 7.0, 9.0, 25.0, 33.0, 52.0, 59.0, 100.0, 303.0, 162.0, 75.0, 59.0, 47.0, 20.0, 16.0, 16.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002582550048828125, -0.0025057196617126465, -0.002428889274597168, -0.0023520588874816895, -0.002275228500366211, -0.0021983981132507324, -0.002121567726135254, -0.0020447373390197754, -0.001967906951904297, -0.0018910765647888184, -0.0018142461776733398, -0.0017374157905578613, -0.0016605854034423828, -0.0015837550163269043, -0.0015069246292114258, -0.0014300942420959473, -0.0013532638549804688, -0.0012764334678649902, -0.0011996030807495117, -0.0011227726936340332, -0.0010459423065185547, -0.0009691119194030762, -0.0008922815322875977, -0.0008154511451721191, -0.0007386207580566406, -0.0006617903709411621, -0.0005849599838256836, -0.0005081295967102051, -0.00043129920959472656, -0.00035446882247924805, -0.00027763843536376953, -0.00020080804824829102, -0.0001239776611328125, -4.7147274017333984e-05, 2.968311309814453e-05, 0.00010651350021362305, 0.00018334388732910156, 0.0002601742744445801, 0.0003370046615600586, 0.0004138350486755371, 0.0004906654357910156, 0.0005674958229064941, 0.0006443262100219727, 0.0007211565971374512, 0.0007979869842529297, 0.0008748173713684082, 0.0009516477584838867, 0.0010284781455993652, 0.0011053085327148438, 0.0011821389198303223, 0.0012589693069458008, 0.0013357996940612793, 0.0014126300811767578, 0.0014894604682922363, 0.0015662908554077148, 0.0016431212425231934, 0.0017199516296386719, 0.0017967820167541504, 0.001873612403869629, 0.0019504427909851074, 0.002027273178100586, 0.0021041035652160645, 0.002180933952331543, 0.0022577643394470215, 0.0023345947265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 8.0, 8.0, 11.0, 23.0, 26.0, 33.0, 46.0, 70.0, 120.0, 220.0, 422.0, 833.0, 1995.0, 6026.0, 21965.0, 118002.0, 623556.0, 224908.0, 36421.0, 8762.0, 2776.0, 1093.0, 528.0, 278.0, 156.0, 98.0, 57.0, 34.0, 26.0, 18.0, 9.0, 8.0, 3.0, 2.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.859375, -12.5179443359375, -12.176513671875, -11.8350830078125, -11.49365234375, -11.1522216796875, -10.810791015625, -10.4693603515625, -10.1279296875, -9.7864990234375, -9.445068359375, -9.1036376953125, -8.76220703125, -8.4207763671875, -8.079345703125, -7.7379150390625, -7.396484375, -7.0550537109375, -6.713623046875, -6.3721923828125, -6.03076171875, -5.6893310546875, -5.347900390625, -5.0064697265625, -4.6650390625, -4.3236083984375, -3.982177734375, -3.6407470703125, -3.29931640625, -2.9578857421875, -2.616455078125, -2.2750244140625, -1.93359375, -1.5921630859375, -1.250732421875, -0.9093017578125, -0.56787109375, -0.2264404296875, 0.114990234375, 0.4564208984375, 0.7978515625, 1.1392822265625, 1.480712890625, 1.8221435546875, 2.16357421875, 2.5050048828125, 2.846435546875, 3.1878662109375, 3.529296875, 3.8707275390625, 4.212158203125, 4.5535888671875, 4.89501953125, 5.2364501953125, 5.577880859375, 5.9193115234375, 6.2607421875, 6.6021728515625, 6.943603515625, 7.2850341796875, 7.62646484375, 7.9678955078125, 8.309326171875, 8.6507568359375, 8.9921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 12.0, 15.0, 11.0, 21.0, 24.0, 27.0, 45.0, 48.0, 74.0, 96.0, 118.0, 108.0, 91.0, 67.0, 46.0, 35.0, 44.0, 28.0, 17.0, 13.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.79248046875, -6.5654296875, -6.33837890625, -6.111328125, -5.88427734375, -5.6572265625, -5.43017578125, -5.203125, -4.97607421875, -4.7490234375, -4.52197265625, -4.294921875, -4.06787109375, -3.8408203125, -3.61376953125, -3.38671875, -3.15966796875, -2.9326171875, -2.70556640625, -2.478515625, -2.25146484375, -2.0244140625, -1.79736328125, -1.5703125, -1.34326171875, -1.1162109375, -0.88916015625, -0.662109375, -0.43505859375, -0.2080078125, 0.01904296875, 0.24609375, 0.47314453125, 0.7001953125, 0.92724609375, 1.154296875, 1.38134765625, 1.6083984375, 1.83544921875, 2.0625, 2.28955078125, 2.5166015625, 2.74365234375, 2.970703125, 3.19775390625, 3.4248046875, 3.65185546875, 3.87890625, 4.10595703125, 4.3330078125, 4.56005859375, 4.787109375, 5.01416015625, 5.2412109375, 5.46826171875, 5.6953125, 5.92236328125, 6.1494140625, 6.37646484375, 6.603515625, 6.83056640625, 7.0576171875, 7.28466796875, 7.51171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 22.0, 60.0, 195.0, 274.0, 272.0, 123.0, 37.0, 15.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.87677001953125, -114.7883071899414, -105.69984436035156, -96.61138916015625, -87.5229263305664, -78.43446350097656, -69.34600830078125, -60.257545471191406, -51.16908264160156, -42.08061981201172, -32.99216079711914, -23.90369987487793, -14.815238952636719, -5.726776123046875, 3.361682891845703, 12.450141906738281, 21.538604736328125, 30.627065658569336, 39.71552658081055, 48.803985595703125, 57.89244842529297, 66.98091125488281, 76.06936645507812, 85.15782928466797, 94.24629211425781, 103.33475494384766, 112.4232177734375, 121.51167297363281, 130.60012817382812, 139.6885986328125, 148.7770538330078, 157.86550903320312, 166.95394897460938, 176.0424041748047, 185.13087463378906, 194.21932983398438, 203.30780029296875, 212.39625549316406, 221.48471069335938, 230.57318115234375, 239.66163635253906, 248.75009155273438, 257.83856201171875, 266.9270324707031, 276.0154724121094, 285.10394287109375, 294.1924133300781, 303.2808532714844, 312.36932373046875, 321.4577941894531, 330.5462341308594, 339.63470458984375, 348.7231750488281, 357.8116455078125, 366.90008544921875, 375.9885559082031, 385.0770263671875, 394.1654968261719, 403.2539367675781, 412.3424072265625, 421.4308776855469, 430.51934814453125, 439.6077880859375, 448.6962585449219, 457.7846984863281]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 12.0, 9.0, 12.0, 14.0, 20.0, 21.0, 21.0, 22.0, 27.0, 34.0, 29.0, 46.0, 31.0, 26.0, 42.0, 51.0, 53.0, 48.0, 35.0, 44.0, 53.0, 47.0, 27.0, 34.0, 31.0, 24.0, 14.0, 20.0, 27.0, 20.0, 19.0, 16.0, 14.0, 10.0, 8.0, 1.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-59.82958984375, -58.04922103881836, -56.268856048583984, -54.488487243652344, -52.7081184387207, -50.92774963378906, -49.14738464355469, -47.36701583862305, -45.586647033691406, -43.806278228759766, -42.02591323852539, -40.24554443359375, -38.46517562866211, -36.68480682373047, -34.904441833496094, -33.12407302856445, -31.343708038330078, -29.56334114074707, -27.78297233581543, -26.002605438232422, -24.22223663330078, -22.441869735717773, -20.661502838134766, -18.881134033203125, -17.100767135620117, -15.320399284362793, -13.540031433105469, -11.759664535522461, -9.979296684265137, -8.198928833007812, -6.418561935424805, -4.6381940841674805, -2.8578262329101562, -1.0774586200714111, 0.702908992767334, 2.4832763671875, 4.263644218444824, 6.044012069702148, 7.824378967285156, 9.60474681854248, 11.385114669799805, 13.165482521057129, 14.945850372314453, 16.72621726989746, 18.50658416748047, 20.28695297241211, 22.067319869995117, 23.847686767578125, 25.628055572509766, 27.408422470092773, 29.188791275024414, 30.969158172607422, 32.74952697753906, 34.52989196777344, 36.31026077270508, 38.09062957763672, 39.870994567871094, 41.651363372802734, 43.43172836303711, 45.21209716796875, 46.99246597290039, 48.77283477783203, 50.553199768066406, 52.33356857299805, 54.11393737792969]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 8.0, 6.0, 18.0, 17.0, 32.0, 38.0, 60.0, 119.0, 196.0, 330.0, 572.0, 1057.0, 2466.0, 6733.0, 25503.0, 164980.0, 3620998.0, 317776.0, 38054.0, 9079.0, 3056.0, 1378.0, 652.0, 373.0, 267.0, 138.0, 106.0, 69.0, 51.0, 33.0, 15.0, 28.0, 15.0, 11.0, 12.0, 7.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.59375, -28.56005859375, -27.5263671875, -26.49267578125, -25.458984375, -24.42529296875, -23.3916015625, -22.35791015625, -21.32421875, -20.29052734375, -19.2568359375, -18.22314453125, -17.189453125, -16.15576171875, -15.1220703125, -14.08837890625, -13.0546875, -12.02099609375, -10.9873046875, -9.95361328125, -8.919921875, -7.88623046875, -6.8525390625, -5.81884765625, -4.78515625, -3.75146484375, -2.7177734375, -1.68408203125, -0.650390625, 0.38330078125, 1.4169921875, 2.45068359375, 3.484375, 4.51806640625, 5.5517578125, 6.58544921875, 7.619140625, 8.65283203125, 9.6865234375, 10.72021484375, 11.75390625, 12.78759765625, 13.8212890625, 14.85498046875, 15.888671875, 16.92236328125, 17.9560546875, 18.98974609375, 20.0234375, 21.05712890625, 22.0908203125, 23.12451171875, 24.158203125, 25.19189453125, 26.2255859375, 27.25927734375, 28.29296875, 29.32666015625, 30.3603515625, 31.39404296875, 32.427734375, 33.46142578125, 34.4951171875, 35.52880859375, 36.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 4.0, 10.0, 22.0, 21.0, 37.0, 56.0, 62.0, 77.0, 86.0, 95.0, 92.0, 91.0, 97.0, 64.0, 54.0, 40.0, 27.0, 19.0, 19.0, 12.0, 7.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74609375, -3.57818603515625, -3.4102783203125, -3.24237060546875, -3.074462890625, -2.90655517578125, -2.7386474609375, -2.57073974609375, -2.40283203125, -2.23492431640625, -2.0670166015625, -1.89910888671875, -1.731201171875, -1.56329345703125, -1.3953857421875, -1.22747802734375, -1.0595703125, -0.89166259765625, -0.7237548828125, -0.55584716796875, -0.387939453125, -0.22003173828125, -0.0521240234375, 0.11578369140625, 0.28369140625, 0.45159912109375, 0.6195068359375, 0.78741455078125, 0.955322265625, 1.12322998046875, 1.2911376953125, 1.45904541015625, 1.626953125, 1.79486083984375, 1.9627685546875, 2.13067626953125, 2.298583984375, 2.46649169921875, 2.6343994140625, 2.80230712890625, 2.97021484375, 3.13812255859375, 3.3060302734375, 3.47393798828125, 3.641845703125, 3.80975341796875, 3.9776611328125, 4.14556884765625, 4.3134765625, 4.48138427734375, 4.6492919921875, 4.81719970703125, 4.985107421875, 5.15301513671875, 5.3209228515625, 5.48883056640625, 5.65673828125, 5.82464599609375, 5.9925537109375, 6.16046142578125, 6.328369140625, 6.49627685546875, 6.6641845703125, 6.83209228515625, 7.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 4.0, 5.0, 13.0, 23.0, 31.0, 38.0, 45.0, 58.0, 76.0, 104.0, 168.0, 193.0, 299.0, 457.0, 842.0, 1828.0, 4117.0, 11583.0, 38098.0, 160341.0, 1364056.0, 2359362.0, 186924.0, 43808.0, 12901.0, 4559.0, 1838.0, 918.0, 475.0, 313.0, 219.0, 147.0, 126.0, 75.0, 63.0, 50.0, 37.0, 26.0, 8.0, 13.0, 12.0, 12.0, 6.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.6220703125, -18.041015625, -17.4599609375, -16.87890625, -16.2978515625, -15.716796875, -15.1357421875, -14.5546875, -13.9736328125, -13.392578125, -12.8115234375, -12.23046875, -11.6494140625, -11.068359375, -10.4873046875, -9.90625, -9.3251953125, -8.744140625, -8.1630859375, -7.58203125, -7.0009765625, -6.419921875, -5.8388671875, -5.2578125, -4.6767578125, -4.095703125, -3.5146484375, -2.93359375, -2.3525390625, -1.771484375, -1.1904296875, -0.609375, -0.0283203125, 0.552734375, 1.1337890625, 1.71484375, 2.2958984375, 2.876953125, 3.4580078125, 4.0390625, 4.6201171875, 5.201171875, 5.7822265625, 6.36328125, 6.9443359375, 7.525390625, 8.1064453125, 8.6875, 9.2685546875, 9.849609375, 10.4306640625, 11.01171875, 11.5927734375, 12.173828125, 12.7548828125, 13.3359375, 13.9169921875, 14.498046875, 15.0791015625, 15.66015625, 16.2412109375, 16.822265625, 17.4033203125, 17.984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 6.0, 8.0, 11.0, 19.0, 20.0, 28.0, 47.0, 68.0, 100.0, 142.0, 193.0, 331.0, 707.0, 1245.0, 399.0, 237.0, 168.0, 107.0, 68.0, 52.0, 29.0, 17.0, 15.0, 16.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -5.987060546875, -5.73974609375, -5.492431640625, -5.2451171875, -4.997802734375, -4.75048828125, -4.503173828125, -4.255859375, -4.008544921875, -3.76123046875, -3.513916015625, -3.2666015625, -3.019287109375, -2.77197265625, -2.524658203125, -2.27734375, -2.030029296875, -1.78271484375, -1.535400390625, -1.2880859375, -1.040771484375, -0.79345703125, -0.546142578125, -0.298828125, -0.051513671875, 0.19580078125, 0.443115234375, 0.6904296875, 0.937744140625, 1.18505859375, 1.432373046875, 1.6796875, 1.927001953125, 2.17431640625, 2.421630859375, 2.6689453125, 2.916259765625, 3.16357421875, 3.410888671875, 3.658203125, 3.905517578125, 4.15283203125, 4.400146484375, 4.6474609375, 4.894775390625, 5.14208984375, 5.389404296875, 5.63671875, 5.884033203125, 6.13134765625, 6.378662109375, 6.6259765625, 6.873291015625, 7.12060546875, 7.367919921875, 7.615234375, 7.862548828125, 8.10986328125, 8.357177734375, 8.6044921875, 8.851806640625, 9.09912109375, 9.346435546875, 9.59375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 12.0, 18.0, 34.0, 58.0, 85.0, 106.0, 138.0, 129.0, 126.0, 111.0, 69.0, 51.0, 24.0, 12.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.6125602722168, -58.34540939331055, -56.07825469970703, -53.81110382080078, -51.543949127197266, -49.276798248291016, -47.0096435546875, -44.74249267578125, -42.475341796875, -40.20819091796875, -37.941036224365234, -35.673885345458984, -33.40673065185547, -31.13957977294922, -28.872426986694336, -26.605274200439453, -24.338119506835938, -22.070966720581055, -19.803813934326172, -17.536663055419922, -15.269509315490723, -13.00235652923584, -10.735204696655273, -8.46805191040039, -6.200899124145508, -3.933746576309204, -1.6665940284729004, 0.6005582809448242, 2.867711067199707, 5.13486385345459, 7.402015686035156, 9.669168472290039, 11.936317443847656, 14.203470230102539, 16.470623016357422, 18.737773895263672, 21.004928588867188, 23.272079467773438, 25.53923225402832, 27.806385040283203, 30.073537826538086, 32.34069061279297, 34.60784149169922, 36.874996185302734, 39.142147064208984, 41.4093017578125, 43.67645263671875, 45.943603515625, 48.210758209228516, 50.477909088134766, 52.74506378173828, 55.01221466064453, 57.27936935424805, 59.5465202331543, 61.81367492675781, 64.08082580566406, 66.34797668457031, 68.61512756347656, 70.88227844238281, 73.1494369506836, 75.41658782958984, 77.6837387084961, 79.95088958740234, 82.21804809570312, 84.48519897460938]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 13.0, 7.0, 9.0, 17.0, 25.0, 19.0, 24.0, 34.0, 30.0, 28.0, 34.0, 31.0, 46.0, 36.0, 42.0, 50.0, 37.0, 38.0, 39.0, 47.0, 51.0, 37.0, 43.0, 30.0, 35.0, 24.0, 32.0, 25.0, 18.0, 9.0, 10.0, 11.0, 7.0, 14.0, 13.0, 1.0, 5.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.631668090820312, -25.734140396118164, -24.836612701416016, -23.939083099365234, -23.041555404663086, -22.144027709960938, -21.24650001525879, -20.34897232055664, -19.45144271850586, -18.55391502380371, -17.656387329101562, -16.75885772705078, -15.861330032348633, -14.963802337646484, -14.066274642944336, -13.168746948242188, -12.271219253540039, -11.37369155883789, -10.476162910461426, -9.578635215759277, -8.681106567382812, -7.783578872680664, -6.886051177978516, -5.988523006439209, -5.090994834899902, -4.193466663360596, -3.295938730239868, -2.3984107971191406, -1.500882625579834, -0.6033544540405273, 0.2941732406616211, 1.1917014122009277, 2.0892295837402344, 2.986757755279541, 3.8842856884002686, 4.781813621520996, 5.679341793060303, 6.576869964599609, 7.474397659301758, 8.371925354003906, 9.269454002380371, 10.16698169708252, 11.064510345458984, 11.962038040161133, 12.859565734863281, 13.757094383239746, 14.654622077941895, 15.55215072631836, 16.449678421020508, 17.347206115722656, 18.244733810424805, 19.142261505126953, 20.039791107177734, 20.937318801879883, 21.83484649658203, 22.73237419128418, 23.629901885986328, 24.527429580688477, 25.424957275390625, 26.322486877441406, 27.220014572143555, 28.117542266845703, 29.01506996154785, 29.91259765625, 30.81012725830078]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 7.0, 8.0, 25.0, 24.0, 51.0, 112.0, 244.0, 533.0, 1711.0, 8902.0, 93079.0, 741358.0, 184277.0, 14511.0, 2447.0, 712.0, 278.0, 136.0, 73.0, 27.0, 16.0, 13.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.5009765625, -33.251953125, -32.0029296875, -30.75390625, -29.5048828125, -28.255859375, -27.0068359375, -25.7578125, -24.5087890625, -23.259765625, -22.0107421875, -20.76171875, -19.5126953125, -18.263671875, -17.0146484375, -15.765625, -14.5166015625, -13.267578125, -12.0185546875, -10.76953125, -9.5205078125, -8.271484375, -7.0224609375, -5.7734375, -4.5244140625, -3.275390625, -2.0263671875, -0.77734375, 0.4716796875, 1.720703125, 2.9697265625, 4.21875, 5.4677734375, 6.716796875, 7.9658203125, 9.21484375, 10.4638671875, 11.712890625, 12.9619140625, 14.2109375, 15.4599609375, 16.708984375, 17.9580078125, 19.20703125, 20.4560546875, 21.705078125, 22.9541015625, 24.203125, 25.4521484375, 26.701171875, 27.9501953125, 29.19921875, 30.4482421875, 31.697265625, 32.9462890625, 34.1953125, 35.4443359375, 36.693359375, 37.9423828125, 39.19140625, 40.4404296875, 41.689453125, 42.9384765625, 44.1875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 9.0, 12.0, 25.0, 28.0, 44.0, 45.0, 69.0, 80.0, 72.0, 82.0, 76.0, 85.0, 88.0, 67.0, 63.0, 34.0, 31.0, 39.0, 15.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.869140625, -3.696014404296875, -3.52288818359375, -3.349761962890625, -3.1766357421875, -3.003509521484375, -2.83038330078125, -2.657257080078125, -2.484130859375, -2.311004638671875, -2.13787841796875, -1.964752197265625, -1.7916259765625, -1.618499755859375, -1.44537353515625, -1.272247314453125, -1.09912109375, -0.925994873046875, -0.75286865234375, -0.579742431640625, -0.4066162109375, -0.233489990234375, -0.06036376953125, 0.112762451171875, 0.285888671875, 0.459014892578125, 0.63214111328125, 0.805267333984375, 0.9783935546875, 1.151519775390625, 1.32464599609375, 1.497772216796875, 1.6708984375, 1.844024658203125, 2.01715087890625, 2.190277099609375, 2.3634033203125, 2.536529541015625, 2.70965576171875, 2.882781982421875, 3.055908203125, 3.229034423828125, 3.40216064453125, 3.575286865234375, 3.7484130859375, 3.921539306640625, 4.09466552734375, 4.267791748046875, 4.44091796875, 4.614044189453125, 4.78717041015625, 4.960296630859375, 5.1334228515625, 5.306549072265625, 5.47967529296875, 5.652801513671875, 5.825927734375, 5.999053955078125, 6.17218017578125, 6.345306396484375, 6.5184326171875, 6.691558837890625, 6.86468505859375, 7.037811279296875, 7.2109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 2.0, 7.0, 7.0, 5.0, 15.0, 12.0, 27.0, 37.0, 53.0, 66.0, 105.0, 146.0, 174.0, 274.0, 369.0, 581.0, 927.0, 2007.0, 4952.0, 15885.0, 58169.0, 253198.0, 507997.0, 149640.0, 36077.0, 10459.0, 3540.0, 1474.0, 723.0, 488.0, 314.0, 228.0, 175.0, 129.0, 79.0, 61.0, 37.0, 35.0, 25.0, 17.0, 11.0, 7.0, 6.0, 4.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.109375, -16.580078125, -16.05078125, -15.521484375, -14.9921875, -14.462890625, -13.93359375, -13.404296875, -12.875, -12.345703125, -11.81640625, -11.287109375, -10.7578125, -10.228515625, -9.69921875, -9.169921875, -8.640625, -8.111328125, -7.58203125, -7.052734375, -6.5234375, -5.994140625, -5.46484375, -4.935546875, -4.40625, -3.876953125, -3.34765625, -2.818359375, -2.2890625, -1.759765625, -1.23046875, -0.701171875, -0.171875, 0.357421875, 0.88671875, 1.416015625, 1.9453125, 2.474609375, 3.00390625, 3.533203125, 4.0625, 4.591796875, 5.12109375, 5.650390625, 6.1796875, 6.708984375, 7.23828125, 7.767578125, 8.296875, 8.826171875, 9.35546875, 9.884765625, 10.4140625, 10.943359375, 11.47265625, 12.001953125, 12.53125, 13.060546875, 13.58984375, 14.119140625, 14.6484375, 15.177734375, 15.70703125, 16.236328125, 16.765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 11.0, 14.0, 13.0, 10.0, 17.0, 21.0, 21.0, 23.0, 40.0, 31.0, 38.0, 38.0, 44.0, 53.0, 45.0, 43.0, 47.0, 51.0, 50.0, 45.0, 43.0, 45.0, 35.0, 30.0, 24.0, 26.0, 24.0, 16.0, 20.0, 10.0, 9.0, 11.0, 7.0, 10.0, 2.0, 3.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.5, -12.02392578125, -11.5478515625, -11.07177734375, -10.595703125, -10.11962890625, -9.6435546875, -9.16748046875, -8.69140625, -8.21533203125, -7.7392578125, -7.26318359375, -6.787109375, -6.31103515625, -5.8349609375, -5.35888671875, -4.8828125, -4.40673828125, -3.9306640625, -3.45458984375, -2.978515625, -2.50244140625, -2.0263671875, -1.55029296875, -1.07421875, -0.59814453125, -0.1220703125, 0.35400390625, 0.830078125, 1.30615234375, 1.7822265625, 2.25830078125, 2.734375, 3.21044921875, 3.6865234375, 4.16259765625, 4.638671875, 5.11474609375, 5.5908203125, 6.06689453125, 6.54296875, 7.01904296875, 7.4951171875, 7.97119140625, 8.447265625, 8.92333984375, 9.3994140625, 9.87548828125, 10.3515625, 10.82763671875, 11.3037109375, 11.77978515625, 12.255859375, 12.73193359375, 13.2080078125, 13.68408203125, 14.16015625, 14.63623046875, 15.1123046875, 15.58837890625, 16.064453125, 16.54052734375, 17.0166015625, 17.49267578125, 17.96875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 9.0, 10.0, 10.0, 20.0, 32.0, 32.0, 75.0, 91.0, 164.0, 262.0, 471.0, 716.0, 1480.0, 3219.0, 8442.0, 26174.0, 92159.0, 302682.0, 402587.0, 147520.0, 40919.0, 12703.0, 4541.0, 1887.0, 955.0, 533.0, 309.0, 187.0, 97.0, 90.0, 56.0, 34.0, 26.0, 16.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.7265625, -6.52978515625, -6.3330078125, -6.13623046875, -5.939453125, -5.74267578125, -5.5458984375, -5.34912109375, -5.15234375, -4.95556640625, -4.7587890625, -4.56201171875, -4.365234375, -4.16845703125, -3.9716796875, -3.77490234375, -3.578125, -3.38134765625, -3.1845703125, -2.98779296875, -2.791015625, -2.59423828125, -2.3974609375, -2.20068359375, -2.00390625, -1.80712890625, -1.6103515625, -1.41357421875, -1.216796875, -1.02001953125, -0.8232421875, -0.62646484375, -0.4296875, -0.23291015625, -0.0361328125, 0.16064453125, 0.357421875, 0.55419921875, 0.7509765625, 0.94775390625, 1.14453125, 1.34130859375, 1.5380859375, 1.73486328125, 1.931640625, 2.12841796875, 2.3251953125, 2.52197265625, 2.71875, 2.91552734375, 3.1123046875, 3.30908203125, 3.505859375, 3.70263671875, 3.8994140625, 4.09619140625, 4.29296875, 4.48974609375, 4.6865234375, 4.88330078125, 5.080078125, 5.27685546875, 5.4736328125, 5.67041015625, 5.8671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 2.0, 3.0, 6.0, 6.0, 5.0, 3.0, 15.0, 14.0, 24.0, 16.0, 30.0, 38.0, 49.0, 58.0, 57.0, 75.0, 76.0, 78.0, 80.0, 62.0, 59.0, 52.0, 34.0, 33.0, 24.0, 21.0, 15.0, 16.0, 9.0, 7.0, 3.0, 3.0, 6.0, 2.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010242462158203125, -0.000990167260169983, -0.0009560883045196533, -0.0009220093488693237, -0.0008879303932189941, -0.0008538514375686646, -0.000819772481918335, -0.0007856935262680054, -0.0007516145706176758, -0.0007175356149673462, -0.0006834566593170166, -0.000649377703666687, -0.0006152987480163574, -0.0005812197923660278, -0.0005471408367156982, -0.0005130618810653687, -0.00047898292541503906, -0.00044490396976470947, -0.0004108250141143799, -0.0003767460584640503, -0.0003426671028137207, -0.0003085881471633911, -0.0002745091915130615, -0.00024043023586273193, -0.00020635128021240234, -0.00017227232456207275, -0.00013819336891174316, -0.00010411441326141357, -7.003545761108398e-05, -3.5956501960754395e-05, -1.8775463104248047e-06, 3.2201409339904785e-05, 6.628036499023438e-05, 0.00010035932064056396, 0.00013443827629089355, 0.00016851723194122314, 0.00020259618759155273, 0.00023667514324188232, 0.0002707540988922119, 0.0003048330545425415, 0.0003389120101928711, 0.0003729909658432007, 0.0004070699214935303, 0.00044114887714385986, 0.00047522783279418945, 0.000509306788444519, 0.0005433857440948486, 0.0005774646997451782, 0.0006115436553955078, 0.0006456226110458374, 0.000679701566696167, 0.0007137805223464966, 0.0007478594779968262, 0.0007819384336471558, 0.0008160173892974854, 0.0008500963449478149, 0.0008841753005981445, 0.0009182542562484741, 0.0009523332118988037, 0.0009864121675491333, 0.0010204911231994629, 0.0010545700788497925, 0.001088649034500122, 0.0011227279901504517, 0.0011568069458007812]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 16.0, 14.0, 37.0, 36.0, 53.0, 84.0, 151.0, 261.0, 540.0, 1024.0, 2664.0, 8394.0, 46387.0, 356135.0, 530507.0, 83280.0, 12713.0, 3457.0, 1295.0, 649.0, 341.0, 181.0, 104.0, 75.0, 46.0, 26.0, 23.0, 9.0, 11.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.53125, -12.19384765625, -11.8564453125, -11.51904296875, -11.181640625, -10.84423828125, -10.5068359375, -10.16943359375, -9.83203125, -9.49462890625, -9.1572265625, -8.81982421875, -8.482421875, -8.14501953125, -7.8076171875, -7.47021484375, -7.1328125, -6.79541015625, -6.4580078125, -6.12060546875, -5.783203125, -5.44580078125, -5.1083984375, -4.77099609375, -4.43359375, -4.09619140625, -3.7587890625, -3.42138671875, -3.083984375, -2.74658203125, -2.4091796875, -2.07177734375, -1.734375, -1.39697265625, -1.0595703125, -0.72216796875, -0.384765625, -0.04736328125, 0.2900390625, 0.62744140625, 0.96484375, 1.30224609375, 1.6396484375, 1.97705078125, 2.314453125, 2.65185546875, 2.9892578125, 3.32666015625, 3.6640625, 4.00146484375, 4.3388671875, 4.67626953125, 5.013671875, 5.35107421875, 5.6884765625, 6.02587890625, 6.36328125, 6.70068359375, 7.0380859375, 7.37548828125, 7.712890625, 8.05029296875, 8.3876953125, 8.72509765625, 9.0625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 15.0, 13.0, 17.0, 25.0, 38.0, 42.0, 53.0, 66.0, 80.0, 95.0, 93.0, 89.0, 88.0, 59.0, 68.0, 32.0, 20.0, 32.0, 18.0, 15.0, 7.0, 8.0, 2.0, 5.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.98681640625, -7.7548828125, -7.52294921875, -7.291015625, -7.05908203125, -6.8271484375, -6.59521484375, -6.36328125, -6.13134765625, -5.8994140625, -5.66748046875, -5.435546875, -5.20361328125, -4.9716796875, -4.73974609375, -4.5078125, -4.27587890625, -4.0439453125, -3.81201171875, -3.580078125, -3.34814453125, -3.1162109375, -2.88427734375, -2.65234375, -2.42041015625, -2.1884765625, -1.95654296875, -1.724609375, -1.49267578125, -1.2607421875, -1.02880859375, -0.796875, -0.56494140625, -0.3330078125, -0.10107421875, 0.130859375, 0.36279296875, 0.5947265625, 0.82666015625, 1.05859375, 1.29052734375, 1.5224609375, 1.75439453125, 1.986328125, 2.21826171875, 2.4501953125, 2.68212890625, 2.9140625, 3.14599609375, 3.3779296875, 3.60986328125, 3.841796875, 4.07373046875, 4.3056640625, 4.53759765625, 4.76953125, 5.00146484375, 5.2333984375, 5.46533203125, 5.697265625, 5.92919921875, 6.1611328125, 6.39306640625, 6.625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 13.0, 22.0, 50.0, 94.0, 163.0, 178.0, 186.0, 139.0, 83.0, 40.0, 22.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-277.1130065917969, -271.21820068359375, -265.3233642578125, -259.4285583496094, -253.53372192382812, -247.638916015625, -241.7440948486328, -235.84927368164062, -229.95445251464844, -224.05963134765625, -218.16481018066406, -212.26998901367188, -206.37518310546875, -200.48036193847656, -194.58554077148438, -188.6907196044922, -182.7958984375, -176.9010772705078, -171.00625610351562, -165.11143493652344, -159.21661376953125, -153.32180786132812, -147.42698669433594, -141.53216552734375, -135.63734436035156, -129.74252319335938, -123.84770202636719, -117.95288848876953, -112.05806732177734, -106.16324615478516, -100.2684326171875, -94.37361145019531, -88.47879028320312, -82.58396911621094, -76.68914794921875, -70.7943344116211, -64.8995132446289, -59.00469207763672, -53.1098747253418, -47.215057373046875, -41.32023620605469, -35.4254150390625, -29.530597686767578, -23.635778427124023, -17.74095916748047, -11.846139907836914, -5.951320648193359, -0.0565032958984375, 5.83831787109375, 11.733137130737305, 17.62795639038086, 23.522775650024414, 29.41759490966797, 35.312416076660156, 41.20723342895508, 47.10205078125, 52.99687194824219, 58.891693115234375, 64.78651428222656, 70.68132781982422, 76.5761489868164, 82.4709701538086, 88.36578369140625, 94.26060485839844, 100.15542602539062]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 0.0, 6.0, 4.0, 3.0, 8.0, 15.0, 9.0, 19.0, 14.0, 17.0, 15.0, 30.0, 30.0, 42.0, 42.0, 43.0, 37.0, 47.0, 53.0, 55.0, 61.0, 61.0, 49.0, 41.0, 38.0, 45.0, 32.0, 28.0, 38.0, 25.0, 19.0, 23.0, 6.0, 13.0, 6.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.02273559570312, -84.3149185180664, -81.60710906982422, -78.8992919921875, -76.19147491455078, -73.48365783691406, -70.77584838867188, -68.06803131103516, -65.36021423339844, -62.652400970458984, -59.944583892822266, -57.23677062988281, -54.528953552246094, -51.82114028930664, -49.11332702636719, -46.40550994873047, -43.69770050048828, -40.98988723754883, -38.28207015991211, -35.574256896972656, -32.86643981933594, -30.158626556396484, -27.45081329345703, -24.742998123168945, -22.03518295288086, -19.327367782592773, -16.619552612304688, -13.911739349365234, -11.203924179077148, -8.496109008789062, -5.788295745849609, -3.0804805755615234, -0.3726654052734375, 2.3351492881774902, 5.042963981628418, 7.7507781982421875, 10.458593368530273, 13.16640853881836, 15.874221801757812, 18.5820369720459, 21.289852142333984, 23.99766731262207, 26.705482482910156, 29.41329574584961, 32.12110900878906, 34.82892608642578, 37.536739349365234, 40.24455261230469, 42.952369689941406, 45.66018295288086, 48.36800003051758, 51.07581329345703, 53.78363037109375, 56.4914436340332, 59.199256896972656, 61.907073974609375, 64.61488342285156, 67.32270050048828, 70.03050994873047, 72.73832702636719, 75.4461441040039, 78.15396118164062, 80.86177062988281, 83.56958770751953, 86.27740478515625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 16.0, 37.0, 81.0, 129.0, 275.0, 667.0, 1962.0, 8350.0, 133038.0, 4029866.0, 15189.0, 3018.0, 907.0, 361.0, 147.0, 76.0, 40.0, 34.0, 19.0, 11.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.4609375, -61.546875, -59.6328125, -57.71875, -55.8046875, -53.890625, -51.9765625, -50.0625, -48.1484375, -46.234375, -44.3203125, -42.40625, -40.4921875, -38.578125, -36.6640625, -34.75, -32.8359375, -30.921875, -29.0078125, -27.09375, -25.1796875, -23.265625, -21.3515625, -19.4375, -17.5234375, -15.609375, -13.6953125, -11.78125, -9.8671875, -7.953125, -6.0390625, -4.125, -2.2109375, -0.296875, 1.6171875, 3.53125, 5.4453125, 7.359375, 9.2734375, 11.1875, 13.1015625, 15.015625, 16.9296875, 18.84375, 20.7578125, 22.671875, 24.5859375, 26.5, 28.4140625, 30.328125, 32.2421875, 34.15625, 36.0703125, 37.984375, 39.8984375, 41.8125, 43.7265625, 45.640625, 47.5546875, 49.46875, 51.3828125, 53.296875, 55.2109375, 57.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 9.0, 20.0, 22.0, 31.0, 34.0, 52.0, 63.0, 55.0, 59.0, 68.0, 69.0, 78.0, 71.0, 66.0, 62.0, 53.0, 41.0, 40.0, 25.0, 18.0, 20.0, 13.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.791015625, -3.6171875, -3.443359375, -3.26953125, -3.095703125, -2.921875, -2.748046875, -2.57421875, -2.400390625, -2.2265625, -2.052734375, -1.87890625, -1.705078125, -1.53125, -1.357421875, -1.18359375, -1.009765625, -0.8359375, -0.662109375, -0.48828125, -0.314453125, -0.140625, 0.033203125, 0.20703125, 0.380859375, 0.5546875, 0.728515625, 0.90234375, 1.076171875, 1.25, 1.423828125, 1.59765625, 1.771484375, 1.9453125, 2.119140625, 2.29296875, 2.466796875, 2.640625, 2.814453125, 2.98828125, 3.162109375, 3.3359375, 3.509765625, 3.68359375, 3.857421875, 4.03125, 4.205078125, 4.37890625, 4.552734375, 4.7265625, 4.900390625, 5.07421875, 5.248046875, 5.421875, 5.595703125, 5.76953125, 5.943359375, 6.1171875, 6.291015625, 6.46484375, 6.638671875, 6.8125, 6.986328125, 7.16015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 20.0, 25.0, 33.0, 63.0, 132.0, 197.0, 384.0, 670.0, 1308.0, 2635.0, 6319.0, 21173.0, 144911.0, 3936707.0, 58273.0, 12800.0, 4502.0, 1951.0, 986.0, 502.0, 275.0, 176.0, 89.0, 56.0, 40.0, 22.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.84375, -33.004150390625, -32.16455078125, -31.324951171875, -30.4853515625, -29.645751953125, -28.80615234375, -27.966552734375, -27.126953125, -26.287353515625, -25.44775390625, -24.608154296875, -23.7685546875, -22.928955078125, -22.08935546875, -21.249755859375, -20.41015625, -19.570556640625, -18.73095703125, -17.891357421875, -17.0517578125, -16.212158203125, -15.37255859375, -14.532958984375, -13.693359375, -12.853759765625, -12.01416015625, -11.174560546875, -10.3349609375, -9.495361328125, -8.65576171875, -7.816162109375, -6.9765625, -6.136962890625, -5.29736328125, -4.457763671875, -3.6181640625, -2.778564453125, -1.93896484375, -1.099365234375, -0.259765625, 0.579833984375, 1.41943359375, 2.259033203125, 3.0986328125, 3.938232421875, 4.77783203125, 5.617431640625, 6.45703125, 7.296630859375, 8.13623046875, 8.975830078125, 9.8154296875, 10.655029296875, 11.49462890625, 12.334228515625, 13.173828125, 14.013427734375, 14.85302734375, 15.692626953125, 16.5322265625, 17.371826171875, 18.21142578125, 19.051025390625, 19.890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 14.0, 7.0, 22.0, 33.0, 34.0, 79.0, 167.0, 3099.0, 320.0, 110.0, 52.0, 36.0, 21.0, 20.0, 12.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.074310302734375, -3.95330810546875, -3.832305908203125, -3.7113037109375, -3.590301513671875, -3.46929931640625, -3.348297119140625, -3.227294921875, -3.106292724609375, -2.98529052734375, -2.864288330078125, -2.7432861328125, -2.622283935546875, -2.50128173828125, -2.380279541015625, -2.25927734375, -2.138275146484375, -2.01727294921875, -1.896270751953125, -1.7752685546875, -1.654266357421875, -1.53326416015625, -1.412261962890625, -1.291259765625, -1.170257568359375, -1.04925537109375, -0.928253173828125, -0.8072509765625, -0.686248779296875, -0.56524658203125, -0.444244384765625, -0.3232421875, -0.202239990234375, -0.08123779296875, 0.039764404296875, 0.1607666015625, 0.281768798828125, 0.40277099609375, 0.523773193359375, 0.644775390625, 0.765777587890625, 0.88677978515625, 1.007781982421875, 1.1287841796875, 1.249786376953125, 1.37078857421875, 1.491790771484375, 1.61279296875, 1.733795166015625, 1.85479736328125, 1.975799560546875, 2.0968017578125, 2.217803955078125, 2.33880615234375, 2.459808349609375, 2.580810546875, 2.701812744140625, 2.82281494140625, 2.943817138671875, 3.0648193359375, 3.185821533203125, 3.30682373046875, 3.427825927734375, 3.548828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 10.0, 8.0, 12.0, 17.0, 33.0, 41.0, 62.0, 60.0, 76.0, 99.0, 91.0, 89.0, 96.0, 80.0, 67.0, 43.0, 37.0, 23.0, 11.0, 15.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.29732894897461, -18.775888442993164, -18.25444793701172, -17.733007431030273, -17.211566925048828, -16.690128326416016, -16.16868782043457, -15.647247314453125, -15.12580680847168, -14.604366302490234, -14.082925796508789, -13.56148624420166, -13.040045738220215, -12.51860523223877, -11.99716567993164, -11.475725173950195, -10.95428466796875, -10.432844161987305, -9.91140365600586, -9.38996410369873, -8.868523597717285, -8.34708309173584, -7.825643062591553, -7.304203033447266, -6.78276252746582, -6.261322021484375, -5.739881992340088, -5.218441963195801, -4.6970014572143555, -4.17556095123291, -3.654120922088623, -3.132680654525757, -2.6112422943115234, -2.0898020267486572, -1.568361759185791, -1.0469214916229248, -0.5254812240600586, -0.004040956497192383, 0.5173993110656738, 1.03883957862854, 1.5602798461914062, 2.0817201137542725, 2.6031603813171387, 3.124600648880005, 3.646040916442871, 4.167481422424316, 4.6889214515686035, 5.210361480712891, 5.731801986694336, 6.253242492675781, 6.774682521820068, 7.2961225509643555, 7.817563056945801, 8.339003562927246, 8.860443115234375, 9.38188362121582, 9.903324127197266, 10.424764633178711, 10.946205139160156, 11.467644691467285, 11.98908519744873, 12.510525703430176, 13.031965255737305, 13.55340576171875, 14.074846267700195]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 5.0, 12.0, 12.0, 13.0, 16.0, 16.0, 17.0, 27.0, 18.0, 32.0, 31.0, 44.0, 35.0, 41.0, 44.0, 45.0, 35.0, 44.0, 33.0, 48.0, 29.0, 36.0, 42.0, 29.0, 30.0, 35.0, 30.0, 24.0, 27.0, 25.0, 22.0, 14.0, 9.0, 14.0, 9.0, 11.0, 5.0, 6.0, 7.0, 3.0, 7.0, 1.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.998217582702637, -7.764782428741455, -7.531347274780273, -7.297912120819092, -7.06447696685791, -6.8310418128967285, -6.597606658935547, -6.364171504974365, -6.130736351013184, -5.897301197052002, -5.66386604309082, -5.430430889129639, -5.196995735168457, -4.963560581207275, -4.730125427246094, -4.496690273284912, -4.2632551193237305, -4.029819965362549, -3.796384811401367, -3.5629496574401855, -3.329514503479004, -3.0960793495178223, -2.8626441955566406, -2.629209041595459, -2.3957738876342773, -2.1623387336730957, -1.928903579711914, -1.6954684257507324, -1.4620332717895508, -1.2285981178283691, -0.9951629638671875, -0.7617278099060059, -0.5282926559448242, -0.2948575019836426, -0.06142234802246094, 0.1720128059387207, 0.40544795989990234, 0.638883113861084, 0.8723182678222656, 1.1057534217834473, 1.339188575744629, 1.5726237297058105, 1.8060588836669922, 2.039494037628174, 2.2729291915893555, 2.506364345550537, 2.7397994995117188, 2.9732346534729004, 3.206669807434082, 3.4401049613952637, 3.6735401153564453, 3.906975269317627, 4.140410423278809, 4.37384557723999, 4.607280731201172, 4.8407158851623535, 5.074151039123535, 5.307586193084717, 5.541021347045898, 5.77445650100708, 6.007891654968262, 6.241326808929443, 6.474761962890625, 6.708197116851807, 6.941632270812988]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 13.0, 33.0, 36.0, 68.0, 120.0, 245.0, 540.0, 1358.0, 4731.0, 22283.0, 121462.0, 574537.0, 265471.0, 45099.0, 8768.0, 2299.0, 779.0, 319.0, 159.0, 92.0, 39.0, 33.0, 26.0, 15.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.078125, -25.347900390625, -24.61767578125, -23.887451171875, -23.1572265625, -22.427001953125, -21.69677734375, -20.966552734375, -20.236328125, -19.506103515625, -18.77587890625, -18.045654296875, -17.3154296875, -16.585205078125, -15.85498046875, -15.124755859375, -14.39453125, -13.664306640625, -12.93408203125, -12.203857421875, -11.4736328125, -10.743408203125, -10.01318359375, -9.282958984375, -8.552734375, -7.822509765625, -7.09228515625, -6.362060546875, -5.6318359375, -4.901611328125, -4.17138671875, -3.441162109375, -2.7109375, -1.980712890625, -1.25048828125, -0.520263671875, 0.2099609375, 0.940185546875, 1.67041015625, 2.400634765625, 3.130859375, 3.861083984375, 4.59130859375, 5.321533203125, 6.0517578125, 6.781982421875, 7.51220703125, 8.242431640625, 8.97265625, 9.702880859375, 10.43310546875, 11.163330078125, 11.8935546875, 12.623779296875, 13.35400390625, 14.084228515625, 14.814453125, 15.544677734375, 16.27490234375, 17.005126953125, 17.7353515625, 18.465576171875, 19.19580078125, 19.926025390625, 20.65625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 3.0, 1.0, 4.0, 8.0, 16.0, 15.0, 20.0, 20.0, 28.0, 35.0, 48.0, 49.0, 47.0, 69.0, 52.0, 74.0, 75.0, 78.0, 55.0, 48.0, 53.0, 42.0, 45.0, 26.0, 23.0, 24.0, 18.0, 6.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.8719482421875, -3.697021484375, -3.5220947265625, -3.34716796875, -3.1722412109375, -2.997314453125, -2.8223876953125, -2.6474609375, -2.4725341796875, -2.297607421875, -2.1226806640625, -1.94775390625, -1.7728271484375, -1.597900390625, -1.4229736328125, -1.248046875, -1.0731201171875, -0.898193359375, -0.7232666015625, -0.54833984375, -0.3734130859375, -0.198486328125, -0.0235595703125, 0.1513671875, 0.3262939453125, 0.501220703125, 0.6761474609375, 0.85107421875, 1.0260009765625, 1.200927734375, 1.3758544921875, 1.55078125, 1.7257080078125, 1.900634765625, 2.0755615234375, 2.25048828125, 2.4254150390625, 2.600341796875, 2.7752685546875, 2.9501953125, 3.1251220703125, 3.300048828125, 3.4749755859375, 3.64990234375, 3.8248291015625, 3.999755859375, 4.1746826171875, 4.349609375, 4.5245361328125, 4.699462890625, 4.8743896484375, 5.04931640625, 5.2242431640625, 5.399169921875, 5.5740966796875, 5.7490234375, 5.9239501953125, 6.098876953125, 6.2738037109375, 6.44873046875, 6.6236572265625, 6.798583984375, 6.9735107421875, 7.1484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 15.0, 12.0, 16.0, 27.0, 38.0, 40.0, 67.0, 77.0, 126.0, 131.0, 199.0, 268.0, 433.0, 517.0, 883.0, 1542.0, 3660.0, 12252.0, 50825.0, 278105.0, 557140.0, 106926.0, 23340.0, 6212.0, 2208.0, 1081.0, 679.0, 486.0, 349.0, 233.0, 181.0, 138.0, 92.0, 66.0, 55.0, 41.0, 28.0, 16.0, 8.0, 13.0, 6.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.546875, -16.01708984375, -15.4873046875, -14.95751953125, -14.427734375, -13.89794921875, -13.3681640625, -12.83837890625, -12.30859375, -11.77880859375, -11.2490234375, -10.71923828125, -10.189453125, -9.65966796875, -9.1298828125, -8.60009765625, -8.0703125, -7.54052734375, -7.0107421875, -6.48095703125, -5.951171875, -5.42138671875, -4.8916015625, -4.36181640625, -3.83203125, -3.30224609375, -2.7724609375, -2.24267578125, -1.712890625, -1.18310546875, -0.6533203125, -0.12353515625, 0.40625, 0.93603515625, 1.4658203125, 1.99560546875, 2.525390625, 3.05517578125, 3.5849609375, 4.11474609375, 4.64453125, 5.17431640625, 5.7041015625, 6.23388671875, 6.763671875, 7.29345703125, 7.8232421875, 8.35302734375, 8.8828125, 9.41259765625, 9.9423828125, 10.47216796875, 11.001953125, 11.53173828125, 12.0615234375, 12.59130859375, 13.12109375, 13.65087890625, 14.1806640625, 14.71044921875, 15.240234375, 15.77001953125, 16.2998046875, 16.82958984375, 17.359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 4.0, 8.0, 18.0, 17.0, 21.0, 30.0, 27.0, 34.0, 38.0, 36.0, 44.0, 55.0, 44.0, 51.0, 56.0, 50.0, 58.0, 47.0, 50.0, 59.0, 39.0, 32.0, 33.0, 24.0, 20.0, 26.0, 16.0, 9.0, 11.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.171875, -20.55078125, -19.9296875, -19.30859375, -18.6875, -18.06640625, -17.4453125, -16.82421875, -16.203125, -15.58203125, -14.9609375, -14.33984375, -13.71875, -13.09765625, -12.4765625, -11.85546875, -11.234375, -10.61328125, -9.9921875, -9.37109375, -8.75, -8.12890625, -7.5078125, -6.88671875, -6.265625, -5.64453125, -5.0234375, -4.40234375, -3.78125, -3.16015625, -2.5390625, -1.91796875, -1.296875, -0.67578125, -0.0546875, 0.56640625, 1.1875, 1.80859375, 2.4296875, 3.05078125, 3.671875, 4.29296875, 4.9140625, 5.53515625, 6.15625, 6.77734375, 7.3984375, 8.01953125, 8.640625, 9.26171875, 9.8828125, 10.50390625, 11.125, 11.74609375, 12.3671875, 12.98828125, 13.609375, 14.23046875, 14.8515625, 15.47265625, 16.09375, 16.71484375, 17.3359375, 17.95703125, 18.578125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 16.0, 34.0, 40.0, 74.0, 107.0, 152.0, 228.0, 459.0, 854.0, 1898.0, 4350.0, 12983.0, 49121.0, 253997.0, 560317.0, 123151.0, 26998.0, 7969.0, 2928.0, 1268.0, 677.0, 339.0, 218.0, 123.0, 87.0, 45.0, 36.0, 20.0, 11.0, 7.0, 12.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.15716552734375, -6.9041748046875, -6.65118408203125, -6.398193359375, -6.14520263671875, -5.8922119140625, -5.63922119140625, -5.38623046875, -5.13323974609375, -4.8802490234375, -4.62725830078125, -4.374267578125, -4.12127685546875, -3.8682861328125, -3.61529541015625, -3.3623046875, -3.10931396484375, -2.8563232421875, -2.60333251953125, -2.350341796875, -2.09735107421875, -1.8443603515625, -1.59136962890625, -1.33837890625, -1.08538818359375, -0.8323974609375, -0.57940673828125, -0.326416015625, -0.07342529296875, 0.1795654296875, 0.43255615234375, 0.685546875, 0.93853759765625, 1.1915283203125, 1.44451904296875, 1.697509765625, 1.95050048828125, 2.2034912109375, 2.45648193359375, 2.70947265625, 2.96246337890625, 3.2154541015625, 3.46844482421875, 3.721435546875, 3.97442626953125, 4.2274169921875, 4.48040771484375, 4.7333984375, 4.98638916015625, 5.2393798828125, 5.49237060546875, 5.745361328125, 5.99835205078125, 6.2513427734375, 6.50433349609375, 6.75732421875, 7.01031494140625, 7.2633056640625, 7.51629638671875, 7.769287109375, 8.02227783203125, 8.2752685546875, 8.52825927734375, 8.78125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 5.0, 12.0, 14.0, 21.0, 13.0, 37.0, 34.0, 42.0, 58.0, 65.0, 73.0, 83.0, 81.0, 75.0, 82.0, 80.0, 48.0, 34.0, 27.0, 20.0, 17.0, 13.0, 7.0, 12.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0013275146484375, -0.0012937411665916443, -0.0012599676847457886, -0.0012261942028999329, -0.0011924207210540771, -0.0011586472392082214, -0.0011248737573623657, -0.00109110027551651, -0.0010573267936706543, -0.0010235533118247986, -0.0009897798299789429, -0.0009560063481330872, -0.0009222328662872314, -0.0008884593844413757, -0.00085468590259552, -0.0008209124207496643, -0.0007871389389038086, -0.0007533654570579529, -0.0007195919752120972, -0.0006858184933662415, -0.0006520450115203857, -0.00061827152967453, -0.0005844980478286743, -0.0005507245659828186, -0.0005169510841369629, -0.0004831776022911072, -0.00044940412044525146, -0.00041563063859939575, -0.00038185715675354004, -0.0003480836749076843, -0.0003143101930618286, -0.0002805367112159729, -0.0002467632293701172, -0.00021298974752426147, -0.00017921626567840576, -0.00014544278383255005, -0.00011166930198669434, -7.789582014083862e-05, -4.412233829498291e-05, -1.0348856449127197e-05, 2.3424625396728516e-05, 5.719810724258423e-05, 9.097158908843994e-05, 0.00012474507093429565, 0.00015851855278015137, 0.00019229203462600708, 0.0002260655164718628, 0.0002598389983177185, 0.0002936124801635742, 0.00032738596200942993, 0.00036115944385528564, 0.00039493292570114136, 0.00042870640754699707, 0.0004624798893928528, 0.0004962533712387085, 0.0005300268530845642, 0.0005638003349304199, 0.0005975738167762756, 0.0006313472986221313, 0.0006651207804679871, 0.0006988942623138428, 0.0007326677441596985, 0.0007664412260055542, 0.0008002147078514099, 0.0008339881896972656]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 13.0, 6.0, 17.0, 34.0, 54.0, 96.0, 142.0, 338.0, 696.0, 1820.0, 6689.0, 41693.0, 575256.0, 384428.0, 29143.0, 5301.0, 1583.0, 634.0, 271.0, 151.0, 67.0, 43.0, 28.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.4571533203125, -11.031494140625, -10.6058349609375, -10.18017578125, -9.7545166015625, -9.328857421875, -8.9031982421875, -8.4775390625, -8.0518798828125, -7.626220703125, -7.2005615234375, -6.77490234375, -6.3492431640625, -5.923583984375, -5.4979248046875, -5.072265625, -4.6466064453125, -4.220947265625, -3.7952880859375, -3.36962890625, -2.9439697265625, -2.518310546875, -2.0926513671875, -1.6669921875, -1.2413330078125, -0.815673828125, -0.3900146484375, 0.03564453125, 0.4613037109375, 0.886962890625, 1.3126220703125, 1.73828125, 2.1639404296875, 2.589599609375, 3.0152587890625, 3.44091796875, 3.8665771484375, 4.292236328125, 4.7178955078125, 5.1435546875, 5.5692138671875, 5.994873046875, 6.4205322265625, 6.84619140625, 7.2718505859375, 7.697509765625, 8.1231689453125, 8.548828125, 8.9744873046875, 9.400146484375, 9.8258056640625, 10.25146484375, 10.6771240234375, 11.102783203125, 11.5284423828125, 11.9541015625, 12.3797607421875, 12.805419921875, 13.2310791015625, 13.65673828125, 14.0823974609375, 14.508056640625, 14.9337158203125, 15.359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 13.0, 18.0, 25.0, 27.0, 39.0, 64.0, 92.0, 109.0, 114.0, 129.0, 95.0, 71.0, 61.0, 43.0, 28.0, 12.0, 18.0, 10.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.15435791015625, -5.8438720703125, -5.53338623046875, -5.222900390625, -4.91241455078125, -4.6019287109375, -4.29144287109375, -3.98095703125, -3.67047119140625, -3.3599853515625, -3.04949951171875, -2.739013671875, -2.42852783203125, -2.1180419921875, -1.80755615234375, -1.4970703125, -1.18658447265625, -0.8760986328125, -0.56561279296875, -0.255126953125, 0.05535888671875, 0.3658447265625, 0.67633056640625, 0.98681640625, 1.29730224609375, 1.6077880859375, 1.91827392578125, 2.228759765625, 2.53924560546875, 2.8497314453125, 3.16021728515625, 3.470703125, 3.78118896484375, 4.0916748046875, 4.40216064453125, 4.712646484375, 5.02313232421875, 5.3336181640625, 5.64410400390625, 5.95458984375, 6.26507568359375, 6.5755615234375, 6.88604736328125, 7.196533203125, 7.50701904296875, 7.8175048828125, 8.12799072265625, 8.4384765625, 8.74896240234375, 9.0594482421875, 9.36993408203125, 9.680419921875, 9.99090576171875, 10.3013916015625, 10.61187744140625, 10.92236328125, 11.23284912109375, 11.5433349609375, 11.85382080078125, 12.164306640625, 12.47479248046875, 12.7852783203125, 13.09576416015625, 13.40625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 12.0, 21.0, 43.0, 64.0, 121.0, 144.0, 165.0, 170.0, 109.0, 66.0, 44.0, 19.0, 15.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-171.34573364257812, -166.12405395507812, -160.90235900878906, -155.68067932128906, -150.45899963378906, -145.2373046875, -140.015625, -134.7939453125, -129.57225036621094, -124.3505630493164, -119.1288833618164, -113.90719604492188, -108.68550872802734, -103.46382141113281, -98.24214172363281, -93.02045440673828, -87.79877471923828, -82.57708740234375, -77.35540771484375, -72.13372039794922, -66.91203308105469, -61.69034957885742, -56.468666076660156, -51.246978759765625, -46.02529525756836, -40.803611755371094, -35.58192443847656, -30.360240936279297, -25.1385555267334, -19.9168701171875, -14.695186614990234, -9.473499298095703, -4.2518157958984375, 0.9698691368103027, 6.191554069519043, 11.413238525390625, 16.634923934936523, 21.856609344482422, 27.078292846679688, 32.29998016357422, 37.521663665771484, 42.74334716796875, 47.96503448486328, 53.18671798706055, 58.40840148925781, 63.630088806152344, 68.85177612304688, 74.07345581054688, 79.2951431274414, 84.51683044433594, 89.73851013183594, 94.96019744873047, 100.181884765625, 105.403564453125, 110.62525177001953, 115.84693908691406, 121.06861877441406, 126.2903060913086, 131.51199340820312, 136.73367309570312, 141.95535278320312, 147.1770477294922, 152.3987274169922, 157.62042236328125, 162.84210205078125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 9.0, 11.0, 9.0, 9.0, 15.0, 17.0, 16.0, 21.0, 26.0, 33.0, 36.0, 33.0, 38.0, 42.0, 34.0, 40.0, 50.0, 52.0, 49.0, 64.0, 42.0, 41.0, 43.0, 28.0, 46.0, 21.0, 25.0, 19.0, 16.0, 19.0, 12.0, 13.0, 10.0, 6.0, 5.0, 11.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.07047271728516, -75.499755859375, -72.92903137207031, -70.35831451416016, -67.78759765625, -65.21687316894531, -62.646156311035156, -60.075435638427734, -57.50471496582031, -54.93399429321289, -52.36327362060547, -49.79255676269531, -47.22183609008789, -44.65111541748047, -42.08039855957031, -39.50967788696289, -36.93895721435547, -34.36823654174805, -31.797517776489258, -29.22679901123047, -26.656078338623047, -24.085357666015625, -21.514638900756836, -18.943920135498047, -16.373199462890625, -13.80247974395752, -11.231760025024414, -8.661040306091309, -6.090320587158203, -3.5196008682250977, -0.9488811492919922, 1.6218376159667969, 4.1925506591796875, 6.763270378112793, 9.333990097045898, 11.904709815979004, 14.47542953491211, 17.04615020751953, 19.61686897277832, 22.18758773803711, 24.75830841064453, 27.329029083251953, 29.899747848510742, 32.47046661376953, 35.04118728637695, 37.611907958984375, 40.18262481689453, 42.75334548950195, 45.324066162109375, 47.8947868347168, 50.46550750732422, 53.036224365234375, 55.6069450378418, 58.17766571044922, 60.748382568359375, 63.3191032409668, 65.88982391357422, 68.46054077148438, 71.03126525878906, 73.60198211669922, 76.17269897460938, 78.74342346191406, 81.31414031982422, 83.88485717773438, 86.45558166503906]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 5.0, 9.0, 10.0, 20.0, 25.0, 54.0, 73.0, 153.0, 293.0, 679.0, 1806.0, 5839.0, 31804.0, 4001709.0, 133753.0, 12762.0, 3138.0, 1168.0, 471.0, 217.0, 112.0, 67.0, 30.0, 23.0, 14.0, 13.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.77685546875, -31.3974609375, -30.01806640625, -28.638671875, -27.25927734375, -25.8798828125, -24.50048828125, -23.12109375, -21.74169921875, -20.3623046875, -18.98291015625, -17.603515625, -16.22412109375, -14.8447265625, -13.46533203125, -12.0859375, -10.70654296875, -9.3271484375, -7.94775390625, -6.568359375, -5.18896484375, -3.8095703125, -2.43017578125, -1.05078125, 0.32861328125, 1.7080078125, 3.08740234375, 4.466796875, 5.84619140625, 7.2255859375, 8.60498046875, 9.984375, 11.36376953125, 12.7431640625, 14.12255859375, 15.501953125, 16.88134765625, 18.2607421875, 19.64013671875, 21.01953125, 22.39892578125, 23.7783203125, 25.15771484375, 26.537109375, 27.91650390625, 29.2958984375, 30.67529296875, 32.0546875, 33.43408203125, 34.8134765625, 36.19287109375, 37.572265625, 38.95166015625, 40.3310546875, 41.71044921875, 43.08984375, 44.46923828125, 45.8486328125, 47.22802734375, 48.607421875, 49.98681640625, 51.3662109375, 52.74560546875, 54.125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 14.0, 18.0, 21.0, 26.0, 25.0, 50.0, 51.0, 41.0, 61.0, 54.0, 74.0, 90.0, 64.0, 65.0, 68.0, 40.0, 55.0, 42.0, 28.0, 29.0, 20.0, 18.0, 12.0, 12.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982421875, -3.807342529296875, -3.63226318359375, -3.457183837890625, -3.2821044921875, -3.107025146484375, -2.93194580078125, -2.756866455078125, -2.581787109375, -2.406707763671875, -2.23162841796875, -2.056549072265625, -1.8814697265625, -1.706390380859375, -1.53131103515625, -1.356231689453125, -1.18115234375, -1.006072998046875, -0.83099365234375, -0.655914306640625, -0.4808349609375, -0.305755615234375, -0.13067626953125, 0.044403076171875, 0.219482421875, 0.394561767578125, 0.56964111328125, 0.744720458984375, 0.9197998046875, 1.094879150390625, 1.26995849609375, 1.445037841796875, 1.6201171875, 1.795196533203125, 1.97027587890625, 2.145355224609375, 2.3204345703125, 2.495513916015625, 2.67059326171875, 2.845672607421875, 3.020751953125, 3.195831298828125, 3.37091064453125, 3.545989990234375, 3.7210693359375, 3.896148681640625, 4.07122802734375, 4.246307373046875, 4.42138671875, 4.596466064453125, 4.77154541015625, 4.946624755859375, 5.1217041015625, 5.296783447265625, 5.47186279296875, 5.646942138671875, 5.822021484375, 5.997100830078125, 6.17218017578125, 6.347259521484375, 6.5223388671875, 6.697418212890625, 6.87249755859375, 7.047576904296875, 7.22265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 17.0, 16.0, 35.0, 47.0, 88.0, 99.0, 177.0, 248.0, 376.0, 615.0, 921.0, 1478.0, 2427.0, 4201.0, 7355.0, 14419.0, 31117.0, 84851.0, 2928091.0, 972600.0, 82682.0, 30531.0, 14092.0, 7220.0, 4162.0, 2380.0, 1423.0, 888.0, 577.0, 390.0, 252.0, 166.0, 109.0, 71.0, 46.0, 39.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.1920166015625, -10.805908203125, -10.4197998046875, -10.03369140625, -9.6475830078125, -9.261474609375, -8.8753662109375, -8.4892578125, -8.1031494140625, -7.717041015625, -7.3309326171875, -6.94482421875, -6.5587158203125, -6.172607421875, -5.7864990234375, -5.400390625, -5.0142822265625, -4.628173828125, -4.2420654296875, -3.85595703125, -3.4698486328125, -3.083740234375, -2.6976318359375, -2.3115234375, -1.9254150390625, -1.539306640625, -1.1531982421875, -0.76708984375, -0.3809814453125, 0.005126953125, 0.3912353515625, 0.77734375, 1.1634521484375, 1.549560546875, 1.9356689453125, 2.32177734375, 2.7078857421875, 3.093994140625, 3.4801025390625, 3.8662109375, 4.2523193359375, 4.638427734375, 5.0245361328125, 5.41064453125, 5.7967529296875, 6.182861328125, 6.5689697265625, 6.955078125, 7.3411865234375, 7.727294921875, 8.1134033203125, 8.49951171875, 8.8856201171875, 9.271728515625, 9.6578369140625, 10.0439453125, 10.4300537109375, 10.816162109375, 11.2022705078125, 11.58837890625, 11.9744873046875, 12.360595703125, 12.7467041015625, 13.1328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 9.0, 7.0, 11.0, 7.0, 20.0, 19.0, 30.0, 56.0, 49.0, 85.0, 184.0, 2544.0, 622.0, 162.0, 69.0, 45.0, 29.0, 21.0, 24.0, 11.0, 16.0, 12.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.672943115234375, -3.56463623046875, -3.456329345703125, -3.3480224609375, -3.239715576171875, -3.13140869140625, -3.023101806640625, -2.914794921875, -2.806488037109375, -2.69818115234375, -2.589874267578125, -2.4815673828125, -2.373260498046875, -2.26495361328125, -2.156646728515625, -2.04833984375, -1.940032958984375, -1.83172607421875, -1.723419189453125, -1.6151123046875, -1.506805419921875, -1.39849853515625, -1.290191650390625, -1.181884765625, -1.073577880859375, -0.96527099609375, -0.856964111328125, -0.7486572265625, -0.640350341796875, -0.53204345703125, -0.423736572265625, -0.3154296875, -0.207122802734375, -0.09881591796875, 0.009490966796875, 0.1177978515625, 0.226104736328125, 0.33441162109375, 0.442718505859375, 0.551025390625, 0.659332275390625, 0.76763916015625, 0.875946044921875, 0.9842529296875, 1.092559814453125, 1.20086669921875, 1.309173583984375, 1.41748046875, 1.525787353515625, 1.63409423828125, 1.742401123046875, 1.8507080078125, 1.959014892578125, 2.06732177734375, 2.175628662109375, 2.283935546875, 2.392242431640625, 2.50054931640625, 2.608856201171875, 2.7171630859375, 2.825469970703125, 2.93377685546875, 3.042083740234375, 3.150390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 14.0, 9.0, 22.0, 37.0, 42.0, 52.0, 64.0, 80.0, 92.0, 81.0, 96.0, 83.0, 74.0, 64.0, 63.0, 41.0, 28.0, 24.0, 14.0, 12.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78056526184082, -21.241167068481445, -20.701766967773438, -20.162368774414062, -19.622970581054688, -19.08357048034668, -18.544172286987305, -18.004772186279297, -17.465373992919922, -16.925975799560547, -16.38657569885254, -15.847177505493164, -15.307778358459473, -14.768379211425781, -14.228981018066406, -13.689581871032715, -13.150182723999023, -12.610783576965332, -12.07138442993164, -11.531986236572266, -10.992587089538574, -10.453187942504883, -9.913789749145508, -9.374390602111816, -8.834991455078125, -8.295592308044434, -7.7561936378479, -7.216794967651367, -6.677395820617676, -6.137996673583984, -5.598598003387451, -5.059199333190918, -4.519800186157227, -3.9804012775421143, -3.441002368927002, -2.9016034603118896, -2.3622045516967773, -1.822805643081665, -1.2834067344665527, -0.7440078258514404, -0.20460891723632812, 0.3347899913787842, 0.8741888999938965, 1.4135878086090088, 1.952986717224121, 2.4923856258392334, 3.0317845344543457, 3.571183443069458, 4.11058235168457, 4.649981498718262, 5.189380168914795, 5.728778839111328, 6.2681779861450195, 6.807577133178711, 7.346975803375244, 7.886374473571777, 8.425773620605469, 8.96517276763916, 9.504571914672852, 10.043970108032227, 10.583369255065918, 11.12276840209961, 11.662166595458984, 12.201565742492676, 12.740964889526367]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 6.0, 7.0, 9.0, 19.0, 23.0, 13.0, 14.0, 21.0, 19.0, 22.0, 32.0, 37.0, 29.0, 32.0, 41.0, 36.0, 46.0, 47.0, 45.0, 28.0, 47.0, 39.0, 35.0, 30.0, 33.0, 32.0, 23.0, 24.0, 27.0, 27.0, 26.0, 16.0, 12.0, 16.0, 8.0, 8.0, 10.0, 13.0, 4.0, 5.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.702902793884277, -8.4434814453125, -8.184060096740723, -7.924638748168945, -7.665217399597168, -7.405796051025391, -7.146374702453613, -6.886953353881836, -6.627532005310059, -6.368110656738281, -6.108689308166504, -5.849267959594727, -5.589846611022949, -5.330425262451172, -5.0710039138793945, -4.811582565307617, -4.552161693572998, -4.292740345001221, -4.033318996429443, -3.773897647857666, -3.5144762992858887, -3.2550549507141113, -2.995633840560913, -2.7362124919891357, -2.4767911434173584, -2.217369794845581, -1.9579484462738037, -1.698527216911316, -1.4391058683395386, -1.1796845197677612, -0.9202632904052734, -0.6608419418334961, -0.40142059326171875, -0.1419992744922638, 0.11742204427719116, 0.37684333324432373, 0.6362646818161011, 0.8956860303878784, 1.1551072597503662, 1.4145286083221436, 1.673949956893921, 1.9333713054656982, 2.1927926540374756, 2.452213764190674, 2.711635112762451, 2.9710564613342285, 3.230477809906006, 3.489899158477783, 3.7493205070495605, 4.008741855621338, 4.268163204193115, 4.527584552764893, 4.78700590133667, 5.046427249908447, 5.305848121643066, 5.565269470214844, 5.824690818786621, 6.084112167358398, 6.343533515930176, 6.602954864501953, 6.8623762130737305, 7.121797561645508, 7.381218910217285, 7.6406402587890625, 7.90006160736084]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 20.0, 25.0, 48.0, 70.0, 144.0, 271.0, 638.0, 1778.0, 5685.0, 23299.0, 128421.0, 511452.0, 304329.0, 55752.0, 11521.0, 3083.0, 1077.0, 437.0, 209.0, 141.0, 57.0, 29.0, 22.0, 18.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.4429931640625, -19.901611328125, -19.3602294921875, -18.81884765625, -18.2774658203125, -17.736083984375, -17.1947021484375, -16.6533203125, -16.1119384765625, -15.570556640625, -15.0291748046875, -14.48779296875, -13.9464111328125, -13.405029296875, -12.8636474609375, -12.322265625, -11.7808837890625, -11.239501953125, -10.6981201171875, -10.15673828125, -9.6153564453125, -9.073974609375, -8.5325927734375, -7.9912109375, -7.4498291015625, -6.908447265625, -6.3670654296875, -5.82568359375, -5.2843017578125, -4.742919921875, -4.2015380859375, -3.66015625, -3.1187744140625, -2.577392578125, -2.0360107421875, -1.49462890625, -0.9532470703125, -0.411865234375, 0.1295166015625, 0.6708984375, 1.2122802734375, 1.753662109375, 2.2950439453125, 2.83642578125, 3.3778076171875, 3.919189453125, 4.4605712890625, 5.001953125, 5.5433349609375, 6.084716796875, 6.6260986328125, 7.16748046875, 7.7088623046875, 8.250244140625, 8.7916259765625, 9.3330078125, 9.8743896484375, 10.415771484375, 10.9571533203125, 11.49853515625, 12.0399169921875, 12.581298828125, 13.1226806640625, 13.6640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 12.0, 18.0, 21.0, 23.0, 39.0, 39.0, 43.0, 47.0, 52.0, 57.0, 70.0, 74.0, 72.0, 57.0, 66.0, 50.0, 51.0, 38.0, 29.0, 25.0, 31.0, 14.0, 15.0, 17.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.84356689453125, -3.6676025390625, -3.49163818359375, -3.315673828125, -3.13970947265625, -2.9637451171875, -2.78778076171875, -2.61181640625, -2.43585205078125, -2.2598876953125, -2.08392333984375, -1.907958984375, -1.73199462890625, -1.5560302734375, -1.38006591796875, -1.2041015625, -1.02813720703125, -0.8521728515625, -0.67620849609375, -0.500244140625, -0.32427978515625, -0.1483154296875, 0.02764892578125, 0.20361328125, 0.37957763671875, 0.5555419921875, 0.73150634765625, 0.907470703125, 1.08343505859375, 1.2593994140625, 1.43536376953125, 1.611328125, 1.78729248046875, 1.9632568359375, 2.13922119140625, 2.315185546875, 2.49114990234375, 2.6671142578125, 2.84307861328125, 3.01904296875, 3.19500732421875, 3.3709716796875, 3.54693603515625, 3.722900390625, 3.89886474609375, 4.0748291015625, 4.25079345703125, 4.4267578125, 4.60272216796875, 4.7786865234375, 4.95465087890625, 5.130615234375, 5.30657958984375, 5.4825439453125, 5.65850830078125, 5.83447265625, 6.01043701171875, 6.1864013671875, 6.36236572265625, 6.538330078125, 6.71429443359375, 6.8902587890625, 7.06622314453125, 7.2421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 10.0, 10.0, 19.0, 42.0, 59.0, 129.0, 223.0, 364.0, 650.0, 1356.0, 4078.0, 38437.0, 773800.0, 214567.0, 10527.0, 2160.0, 948.0, 516.0, 290.0, 163.0, 84.0, 53.0, 34.0, 19.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.77099609375, -20.8544921875, -19.93798828125, -19.021484375, -18.10498046875, -17.1884765625, -16.27197265625, -15.35546875, -14.43896484375, -13.5224609375, -12.60595703125, -11.689453125, -10.77294921875, -9.8564453125, -8.93994140625, -8.0234375, -7.10693359375, -6.1904296875, -5.27392578125, -4.357421875, -3.44091796875, -2.5244140625, -1.60791015625, -0.69140625, 0.22509765625, 1.1416015625, 2.05810546875, 2.974609375, 3.89111328125, 4.8076171875, 5.72412109375, 6.640625, 7.55712890625, 8.4736328125, 9.39013671875, 10.306640625, 11.22314453125, 12.1396484375, 13.05615234375, 13.97265625, 14.88916015625, 15.8056640625, 16.72216796875, 17.638671875, 18.55517578125, 19.4716796875, 20.38818359375, 21.3046875, 22.22119140625, 23.1376953125, 24.05419921875, 24.970703125, 25.88720703125, 26.8037109375, 27.72021484375, 28.63671875, 29.55322265625, 30.4697265625, 31.38623046875, 32.302734375, 33.21923828125, 34.1357421875, 35.05224609375, 35.96875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 3.0, 7.0, 4.0, 7.0, 8.0, 17.0, 11.0, 15.0, 22.0, 22.0, 22.0, 37.0, 31.0, 32.0, 56.0, 29.0, 42.0, 43.0, 35.0, 45.0, 45.0, 30.0, 46.0, 56.0, 40.0, 40.0, 33.0, 31.0, 30.0, 27.0, 28.0, 16.0, 17.0, 14.0, 9.0, 11.0, 5.0, 8.0, 9.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.234375, -16.7138671875, -16.193359375, -15.6728515625, -15.15234375, -14.6318359375, -14.111328125, -13.5908203125, -13.0703125, -12.5498046875, -12.029296875, -11.5087890625, -10.98828125, -10.4677734375, -9.947265625, -9.4267578125, -8.90625, -8.3857421875, -7.865234375, -7.3447265625, -6.82421875, -6.3037109375, -5.783203125, -5.2626953125, -4.7421875, -4.2216796875, -3.701171875, -3.1806640625, -2.66015625, -2.1396484375, -1.619140625, -1.0986328125, -0.578125, -0.0576171875, 0.462890625, 0.9833984375, 1.50390625, 2.0244140625, 2.544921875, 3.0654296875, 3.5859375, 4.1064453125, 4.626953125, 5.1474609375, 5.66796875, 6.1884765625, 6.708984375, 7.2294921875, 7.75, 8.2705078125, 8.791015625, 9.3115234375, 9.83203125, 10.3525390625, 10.873046875, 11.3935546875, 11.9140625, 12.4345703125, 12.955078125, 13.4755859375, 13.99609375, 14.5166015625, 15.037109375, 15.5576171875, 16.078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 12.0, 17.0, 16.0, 21.0, 27.0, 33.0, 58.0, 85.0, 144.0, 235.0, 423.0, 870.0, 2120.0, 6913.0, 31118.0, 261956.0, 650603.0, 74148.0, 13251.0, 3680.0, 1295.0, 605.0, 313.0, 174.0, 114.0, 83.0, 57.0, 41.0, 24.0, 20.0, 16.0, 14.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-9.4921875, -9.20654296875, -8.9208984375, -8.63525390625, -8.349609375, -8.06396484375, -7.7783203125, -7.49267578125, -7.20703125, -6.92138671875, -6.6357421875, -6.35009765625, -6.064453125, -5.77880859375, -5.4931640625, -5.20751953125, -4.921875, -4.63623046875, -4.3505859375, -4.06494140625, -3.779296875, -3.49365234375, -3.2080078125, -2.92236328125, -2.63671875, -2.35107421875, -2.0654296875, -1.77978515625, -1.494140625, -1.20849609375, -0.9228515625, -0.63720703125, -0.3515625, -0.06591796875, 0.2197265625, 0.50537109375, 0.791015625, 1.07666015625, 1.3623046875, 1.64794921875, 1.93359375, 2.21923828125, 2.5048828125, 2.79052734375, 3.076171875, 3.36181640625, 3.6474609375, 3.93310546875, 4.21875, 4.50439453125, 4.7900390625, 5.07568359375, 5.361328125, 5.64697265625, 5.9326171875, 6.21826171875, 6.50390625, 6.78955078125, 7.0751953125, 7.36083984375, 7.646484375, 7.93212890625, 8.2177734375, 8.50341796875, 8.7890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 19.0, 30.0, 51.0, 83.0, 117.0, 168.0, 172.0, 127.0, 76.0, 39.0, 26.0, 16.0, 8.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001140594482421875, -0.001079946756362915, -0.001019299030303955, -0.0009586513042449951, -0.0008980035781860352, -0.0008373558521270752, -0.0007767081260681152, -0.0007160604000091553, -0.0006554126739501953, -0.0005947649478912354, -0.0005341172218322754, -0.00047346949577331543, -0.00041282176971435547, -0.0003521740436553955, -0.00029152631759643555, -0.00023087859153747559, -0.00017023086547851562, -0.00010958313941955566, -4.89354133605957e-05, 1.1712312698364258e-05, 7.236003875732422e-05, 0.00013300776481628418, 0.00019365549087524414, 0.0002543032169342041, 0.00031495094299316406, 0.000375598669052124, 0.000436246395111084, 0.0004968941211700439, 0.0005575418472290039, 0.0006181895732879639, 0.0006788372993469238, 0.0007394850254058838, 0.0008001327514648438, 0.0008607804775238037, 0.0009214282035827637, 0.0009820759296417236, 0.0010427236557006836, 0.0011033713817596436, 0.0011640191078186035, 0.0012246668338775635, 0.0012853145599365234, 0.0013459622859954834, 0.0014066100120544434, 0.0014672577381134033, 0.0015279054641723633, 0.0015885531902313232, 0.0016492009162902832, 0.0017098486423492432, 0.0017704963684082031, 0.001831144094467163, 0.001891791820526123, 0.001952439546585083, 0.002013087272644043, 0.002073734998703003, 0.002134382724761963, 0.002195030450820923, 0.002255678176879883, 0.0023163259029388428, 0.0023769736289978027, 0.0024376213550567627, 0.0024982690811157227, 0.0025589168071746826, 0.0026195645332336426, 0.0026802122592926025, 0.0027408599853515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 24.0, 36.0, 59.0, 94.0, 185.0, 305.0, 668.0, 2143.0, 10363.0, 150358.0, 823110.0, 52897.0, 5756.0, 1364.0, 546.0, 282.0, 146.0, 62.0, 34.0, 32.0, 20.0, 10.0, 10.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.328125, -15.8660888671875, -15.404052734375, -14.9420166015625, -14.47998046875, -14.0179443359375, -13.555908203125, -13.0938720703125, -12.6318359375, -12.1697998046875, -11.707763671875, -11.2457275390625, -10.78369140625, -10.3216552734375, -9.859619140625, -9.3975830078125, -8.935546875, -8.4735107421875, -8.011474609375, -7.5494384765625, -7.08740234375, -6.6253662109375, -6.163330078125, -5.7012939453125, -5.2392578125, -4.7772216796875, -4.315185546875, -3.8531494140625, -3.39111328125, -2.9290771484375, -2.467041015625, -2.0050048828125, -1.54296875, -1.0809326171875, -0.618896484375, -0.1568603515625, 0.30517578125, 0.7672119140625, 1.229248046875, 1.6912841796875, 2.1533203125, 2.6153564453125, 3.077392578125, 3.5394287109375, 4.00146484375, 4.4635009765625, 4.925537109375, 5.3875732421875, 5.849609375, 6.3116455078125, 6.773681640625, 7.2357177734375, 7.69775390625, 8.1597900390625, 8.621826171875, 9.0838623046875, 9.5458984375, 10.0079345703125, 10.469970703125, 10.9320068359375, 11.39404296875, 11.8560791015625, 12.318115234375, 12.7801513671875, 13.2421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 12.0, 12.0, 20.0, 28.0, 64.0, 93.0, 121.0, 142.0, 150.0, 101.0, 89.0, 53.0, 40.0, 22.0, 12.0, 4.0, 6.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-15.8359375, -15.4912109375, -15.146484375, -14.8017578125, -14.45703125, -14.1123046875, -13.767578125, -13.4228515625, -13.078125, -12.7333984375, -12.388671875, -12.0439453125, -11.69921875, -11.3544921875, -11.009765625, -10.6650390625, -10.3203125, -9.9755859375, -9.630859375, -9.2861328125, -8.94140625, -8.5966796875, -8.251953125, -7.9072265625, -7.5625, -7.2177734375, -6.873046875, -6.5283203125, -6.18359375, -5.8388671875, -5.494140625, -5.1494140625, -4.8046875, -4.4599609375, -4.115234375, -3.7705078125, -3.42578125, -3.0810546875, -2.736328125, -2.3916015625, -2.046875, -1.7021484375, -1.357421875, -1.0126953125, -0.66796875, -0.3232421875, 0.021484375, 0.3662109375, 0.7109375, 1.0556640625, 1.400390625, 1.7451171875, 2.08984375, 2.4345703125, 2.779296875, 3.1240234375, 3.46875, 3.8134765625, 4.158203125, 4.5029296875, 4.84765625, 5.1923828125, 5.537109375, 5.8818359375, 6.2265625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 9.0, 12.0, 27.0, 76.0, 104.0, 149.0, 171.0, 165.0, 133.0, 68.0, 40.0, 14.0, 18.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.68679809570312, -84.5965805053711, -79.50636291503906, -74.41615295410156, -69.32593536376953, -64.2357177734375, -59.145503997802734, -54.05529022216797, -48.96507263183594, -43.874855041503906, -38.78464126586914, -33.694427490234375, -28.604209899902344, -23.513994216918945, -18.423778533935547, -13.333564758300781, -8.24334716796875, -3.1531314849853516, 1.9370841979980469, 7.027299880981445, 12.117515563964844, 17.207731246948242, 22.29794692993164, 27.388160705566406, 32.47837829589844, 37.56859588623047, 42.658809661865234, 47.7490234375, 52.83924102783203, 57.92945861816406, 63.01967239379883, 68.1098861694336, 73.20008850097656, 78.2903060913086, 83.38052368164062, 88.47073364257812, 93.56095123291016, 98.65116882324219, 103.74137878417969, 108.83159637451172, 113.92181396484375, 119.01203155517578, 124.10224914550781, 129.1924591064453, 134.28268432617188, 139.37289428710938, 144.46310424804688, 149.55331420898438, 154.64353942871094, 159.73374938964844, 164.823974609375, 169.9141845703125, 175.00439453125, 180.09461975097656, 185.18482971191406, 190.27505493164062, 195.36526489257812, 200.45547485351562, 205.5457000732422, 210.6359100341797, 215.72613525390625, 220.81634521484375, 225.90655517578125, 230.99676513671875, 236.0869903564453]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 8.0, 9.0, 18.0, 23.0, 27.0, 22.0, 25.0, 32.0, 31.0, 54.0, 39.0, 50.0, 45.0, 46.0, 62.0, 48.0, 49.0, 47.0, 38.0, 49.0, 36.0, 31.0, 25.0, 29.0, 28.0, 15.0, 17.0, 15.0, 14.0, 6.0, 16.0, 8.0, 5.0, 3.0, 0.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.55218505859375, -72.94676971435547, -70.34136199951172, -67.73594665527344, -65.13053894042969, -62.525123596191406, -59.919708251953125, -57.31429672241211, -54.708885192871094, -52.10347366333008, -49.49806213378906, -46.89264678955078, -44.287235260009766, -41.68182373046875, -39.07640838623047, -36.47099685668945, -33.86558532714844, -31.260173797607422, -28.654760360717773, -26.049346923828125, -23.44393539428711, -20.838523864746094, -18.233110427856445, -15.627696990966797, -13.022285461425781, -10.41687297821045, -7.811460494995117, -5.206048011779785, -2.600635528564453, 0.004776954650878906, 2.610189437866211, 5.215602874755859, 7.821014404296875, 10.426426887512207, 13.031839370727539, 15.637251853942871, 18.242664337158203, 20.84807586669922, 23.453489303588867, 26.058902740478516, 28.66431427001953, 31.269725799560547, 33.87513732910156, 36.480552673339844, 39.08596420288086, 41.691375732421875, 44.296791076660156, 46.90220260620117, 49.50761413574219, 52.1130256652832, 54.71843719482422, 57.3238525390625, 59.929264068603516, 62.53467559814453, 65.14009094238281, 67.74549865722656, 70.35091400146484, 72.95632934570312, 75.56173706054688, 78.16715240478516, 80.77256774902344, 83.37797546386719, 85.98339080810547, 88.58880615234375, 91.1942138671875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 8.0, 13.0, 21.0, 41.0, 58.0, 78.0, 127.0, 253.0, 521.0, 1080.0, 2553.0, 6606.0, 24020.0, 4024467.0, 111675.0, 14509.0, 4673.0, 1831.0, 839.0, 406.0, 200.0, 112.0, 70.0, 32.0, 16.0, 19.0, 7.0, 12.0, 8.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-33.8125, -32.841552734375, -31.87060546875, -30.899658203125, -29.9287109375, -28.957763671875, -27.98681640625, -27.015869140625, -26.044921875, -25.073974609375, -24.10302734375, -23.132080078125, -22.1611328125, -21.190185546875, -20.21923828125, -19.248291015625, -18.27734375, -17.306396484375, -16.33544921875, -15.364501953125, -14.3935546875, -13.422607421875, -12.45166015625, -11.480712890625, -10.509765625, -9.538818359375, -8.56787109375, -7.596923828125, -6.6259765625, -5.655029296875, -4.68408203125, -3.713134765625, -2.7421875, -1.771240234375, -0.80029296875, 0.170654296875, 1.1416015625, 2.112548828125, 3.08349609375, 4.054443359375, 5.025390625, 5.996337890625, 6.96728515625, 7.938232421875, 8.9091796875, 9.880126953125, 10.85107421875, 11.822021484375, 12.79296875, 13.763916015625, 14.73486328125, 15.705810546875, 16.6767578125, 17.647705078125, 18.61865234375, 19.589599609375, 20.560546875, 21.531494140625, 22.50244140625, 23.473388671875, 24.4443359375, 25.415283203125, 26.38623046875, 27.357177734375, 28.328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 14.0, 19.0, 16.0, 17.0, 27.0, 24.0, 38.0, 48.0, 44.0, 53.0, 53.0, 73.0, 76.0, 58.0, 50.0, 53.0, 71.0, 46.0, 33.0, 36.0, 37.0, 15.0, 24.0, 14.0, 9.0, 5.0, 13.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.824127197265625, -3.65020751953125, -3.476287841796875, -3.3023681640625, -3.128448486328125, -2.95452880859375, -2.780609130859375, -2.606689453125, -2.432769775390625, -2.25885009765625, -2.084930419921875, -1.9110107421875, -1.737091064453125, -1.56317138671875, -1.389251708984375, -1.21533203125, -1.041412353515625, -0.86749267578125, -0.693572998046875, -0.5196533203125, -0.345733642578125, -0.17181396484375, 0.002105712890625, 0.176025390625, 0.349945068359375, 0.52386474609375, 0.697784423828125, 0.8717041015625, 1.045623779296875, 1.21954345703125, 1.393463134765625, 1.5673828125, 1.741302490234375, 1.91522216796875, 2.089141845703125, 2.2630615234375, 2.436981201171875, 2.61090087890625, 2.784820556640625, 2.958740234375, 3.132659912109375, 3.30657958984375, 3.480499267578125, 3.6544189453125, 3.828338623046875, 4.00225830078125, 4.176177978515625, 4.35009765625, 4.524017333984375, 4.69793701171875, 4.871856689453125, 5.0457763671875, 5.219696044921875, 5.39361572265625, 5.567535400390625, 5.741455078125, 5.915374755859375, 6.08929443359375, 6.263214111328125, 6.4371337890625, 6.611053466796875, 6.78497314453125, 6.958892822265625, 7.1328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 16.0, 21.0, 32.0, 43.0, 98.0, 107.0, 204.0, 362.0, 608.0, 1099.0, 2037.0, 4160.0, 9508.0, 29304.0, 3782421.0, 321699.0, 25664.0, 8701.0, 3837.0, 1900.0, 1010.0, 579.0, 347.0, 191.0, 107.0, 74.0, 54.0, 40.0, 18.0, 12.0, 6.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-27.59375, -26.88525390625, -26.1767578125, -25.46826171875, -24.759765625, -24.05126953125, -23.3427734375, -22.63427734375, -21.92578125, -21.21728515625, -20.5087890625, -19.80029296875, -19.091796875, -18.38330078125, -17.6748046875, -16.96630859375, -16.2578125, -15.54931640625, -14.8408203125, -14.13232421875, -13.423828125, -12.71533203125, -12.0068359375, -11.29833984375, -10.58984375, -9.88134765625, -9.1728515625, -8.46435546875, -7.755859375, -7.04736328125, -6.3388671875, -5.63037109375, -4.921875, -4.21337890625, -3.5048828125, -2.79638671875, -2.087890625, -1.37939453125, -0.6708984375, 0.03759765625, 0.74609375, 1.45458984375, 2.1630859375, 2.87158203125, 3.580078125, 4.28857421875, 4.9970703125, 5.70556640625, 6.4140625, 7.12255859375, 7.8310546875, 8.53955078125, 9.248046875, 9.95654296875, 10.6650390625, 11.37353515625, 12.08203125, 12.79052734375, 13.4990234375, 14.20751953125, 14.916015625, 15.62451171875, 16.3330078125, 17.04150390625, 17.75]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 3.0, 12.0, 20.0, 17.0, 26.0, 79.0, 645.0, 3027.0, 82.0, 40.0, 21.0, 23.0, 14.0, 13.0, 4.0, 4.0, 7.0, 5.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.0562744140625, -3.921142578125, -3.7860107421875, -3.65087890625, -3.5157470703125, -3.380615234375, -3.2454833984375, -3.1103515625, -2.9752197265625, -2.840087890625, -2.7049560546875, -2.56982421875, -2.4346923828125, -2.299560546875, -2.1644287109375, -2.029296875, -1.8941650390625, -1.759033203125, -1.6239013671875, -1.48876953125, -1.3536376953125, -1.218505859375, -1.0833740234375, -0.9482421875, -0.8131103515625, -0.677978515625, -0.5428466796875, -0.40771484375, -0.2725830078125, -0.137451171875, -0.0023193359375, 0.1328125, 0.2679443359375, 0.403076171875, 0.5382080078125, 0.67333984375, 0.8084716796875, 0.943603515625, 1.0787353515625, 1.2138671875, 1.3489990234375, 1.484130859375, 1.6192626953125, 1.75439453125, 1.8895263671875, 2.024658203125, 2.1597900390625, 2.294921875, 2.4300537109375, 2.565185546875, 2.7003173828125, 2.83544921875, 2.9705810546875, 3.105712890625, 3.2408447265625, 3.3759765625, 3.5111083984375, 3.646240234375, 3.7813720703125, 3.91650390625, 4.0516357421875, 4.186767578125, 4.3218994140625, 4.45703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 14.0, 15.0, 33.0, 37.0, 61.0, 52.0, 85.0, 92.0, 111.0, 124.0, 91.0, 74.0, 55.0, 40.0, 34.0, 31.0, 14.0, 7.0, 9.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.199918746948242, -17.660322189331055, -17.1207275390625, -16.581130981445312, -16.041534423828125, -15.50193977355957, -14.962343215942383, -14.422747611999512, -13.88315200805664, -13.34355640411377, -12.803960800170898, -12.264364242553711, -11.72476863861084, -11.185173034667969, -10.645576477050781, -10.10598087310791, -9.566385269165039, -9.026789665222168, -8.487194061279297, -7.947597503662109, -7.408001899719238, -6.868406295776367, -6.328810214996338, -5.789214134216309, -5.2496185302734375, -4.710022926330566, -4.170426845550537, -3.630831003189087, -3.0912351608276367, -2.5516393184661865, -2.0120434761047363, -1.4724476337432861, -0.9328498840332031, -0.39325404167175293, 0.14634180068969727, 0.6859376430511475, 1.2255334854125977, 1.7651293277740479, 2.304725170135498, 2.8443210124969482, 3.3839168548583984, 3.9235126972198486, 4.463108539581299, 5.002704620361328, 5.542300224304199, 6.08189582824707, 6.6214919090271, 7.161087989807129, 7.70068359375, 8.240279197692871, 8.779874801635742, 9.31947135925293, 9.8590669631958, 10.398662567138672, 10.93825912475586, 11.47785472869873, 12.017450332641602, 12.557045936584473, 13.096641540527344, 13.636238098144531, 14.175833702087402, 14.715429306030273, 15.255025863647461, 15.794621467590332, 16.334217071533203]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 9.0, 8.0, 9.0, 9.0, 7.0, 16.0, 21.0, 21.0, 24.0, 22.0, 24.0, 25.0, 30.0, 44.0, 34.0, 40.0, 40.0, 41.0, 32.0, 37.0, 45.0, 37.0, 29.0, 40.0, 32.0, 37.0, 28.0, 34.0, 32.0, 28.0, 25.0, 23.0, 12.0, 16.0, 13.0, 8.0, 5.0, 10.0, 6.0, 6.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.987802505493164, -7.732031345367432, -7.476259708404541, -7.220488548278809, -6.964717388153076, -6.708946228027344, -6.453174591064453, -6.197403430938721, -5.941632270812988, -5.685861110687256, -5.430089473724365, -5.174318313598633, -4.9185471534729, -4.662775993347168, -4.407004356384277, -4.151233196258545, -3.8954615592956543, -3.6396901607513428, -3.3839190006256104, -3.128147602081299, -2.8723764419555664, -2.616605043411255, -2.3608336448669434, -2.105062484741211, -1.8492910861968994, -1.5935198068618774, -1.3377485275268555, -1.081977128982544, -0.826205849647522, -0.5704345703125, -0.3146631717681885, -0.058891892433166504, 0.19687938690185547, 0.45265069603919983, 0.7084220051765442, 0.9641933441162109, 1.219964623451233, 1.4757359027862549, 1.7315073013305664, 1.9872785806655884, 2.2430498600006104, 2.498821258544922, 2.7545924186706543, 3.010363817214966, 3.2661352157592773, 3.5219063758850098, 3.7776777744293213, 4.033449172973633, 4.289220333099365, 4.544991493225098, 4.800763130187988, 5.056534290313721, 5.312305450439453, 5.568077087402344, 5.823848247528076, 6.079619407653809, 6.335391044616699, 6.591162204742432, 6.846933841705322, 7.102705001831055, 7.358476161956787, 7.6142473220825195, 7.87001895904541, 8.1257905960083, 8.381561279296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 21.0, 35.0, 55.0, 95.0, 139.0, 260.0, 477.0, 1126.0, 2731.0, 7795.0, 25658.0, 93392.0, 314884.0, 404607.0, 140615.0, 38772.0, 11315.0, 3691.0, 1432.0, 643.0, 367.0, 154.0, 102.0, 59.0, 49.0, 18.0, 15.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.8792724609375, -10.492919921875, -10.1065673828125, -9.72021484375, -9.3338623046875, -8.947509765625, -8.5611572265625, -8.1748046875, -7.7884521484375, -7.402099609375, -7.0157470703125, -6.62939453125, -6.2430419921875, -5.856689453125, -5.4703369140625, -5.083984375, -4.6976318359375, -4.311279296875, -3.9249267578125, -3.53857421875, -3.1522216796875, -2.765869140625, -2.3795166015625, -1.9931640625, -1.6068115234375, -1.220458984375, -0.8341064453125, -0.44775390625, -0.0614013671875, 0.324951171875, 0.7113037109375, 1.09765625, 1.4840087890625, 1.870361328125, 2.2567138671875, 2.64306640625, 3.0294189453125, 3.415771484375, 3.8021240234375, 4.1884765625, 4.5748291015625, 4.961181640625, 5.3475341796875, 5.73388671875, 6.1202392578125, 6.506591796875, 6.8929443359375, 7.279296875, 7.6656494140625, 8.052001953125, 8.4383544921875, 8.82470703125, 9.2110595703125, 9.597412109375, 9.9837646484375, 10.3701171875, 10.7564697265625, 11.142822265625, 11.5291748046875, 11.91552734375, 12.3018798828125, 12.688232421875, 13.0745849609375, 13.4609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 9.0, 11.0, 16.0, 19.0, 14.0, 21.0, 27.0, 30.0, 41.0, 39.0, 44.0, 51.0, 57.0, 67.0, 62.0, 62.0, 57.0, 58.0, 42.0, 60.0, 40.0, 24.0, 29.0, 21.0, 30.0, 15.0, 11.0, 8.0, 6.0, 7.0, 8.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0347900390625, -3.858642578125, -3.6824951171875, -3.50634765625, -3.3302001953125, -3.154052734375, -2.9779052734375, -2.8017578125, -2.6256103515625, -2.449462890625, -2.2733154296875, -2.09716796875, -1.9210205078125, -1.744873046875, -1.5687255859375, -1.392578125, -1.2164306640625, -1.040283203125, -0.8641357421875, -0.68798828125, -0.5118408203125, -0.335693359375, -0.1595458984375, 0.0166015625, 0.1927490234375, 0.368896484375, 0.5450439453125, 0.72119140625, 0.8973388671875, 1.073486328125, 1.2496337890625, 1.42578125, 1.6019287109375, 1.778076171875, 1.9542236328125, 2.13037109375, 2.3065185546875, 2.482666015625, 2.6588134765625, 2.8349609375, 3.0111083984375, 3.187255859375, 3.3634033203125, 3.53955078125, 3.7156982421875, 3.891845703125, 4.0679931640625, 4.244140625, 4.4202880859375, 4.596435546875, 4.7725830078125, 4.94873046875, 5.1248779296875, 5.301025390625, 5.4771728515625, 5.6533203125, 5.8294677734375, 6.005615234375, 6.1817626953125, 6.35791015625, 6.5340576171875, 6.710205078125, 6.8863525390625, 7.0625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 8.0, 20.0, 16.0, 24.0, 29.0, 56.0, 63.0, 108.0, 162.0, 209.0, 295.0, 423.0, 733.0, 1113.0, 2581.0, 10957.0, 101474.0, 746283.0, 161853.0, 15421.0, 3157.0, 1297.0, 675.0, 482.0, 339.0, 206.0, 163.0, 124.0, 76.0, 60.0, 33.0, 34.0, 19.0, 18.0, 9.0, 8.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.296875, -17.69873046875, -17.1005859375, -16.50244140625, -15.904296875, -15.30615234375, -14.7080078125, -14.10986328125, -13.51171875, -12.91357421875, -12.3154296875, -11.71728515625, -11.119140625, -10.52099609375, -9.9228515625, -9.32470703125, -8.7265625, -8.12841796875, -7.5302734375, -6.93212890625, -6.333984375, -5.73583984375, -5.1376953125, -4.53955078125, -3.94140625, -3.34326171875, -2.7451171875, -2.14697265625, -1.548828125, -0.95068359375, -0.3525390625, 0.24560546875, 0.84375, 1.44189453125, 2.0400390625, 2.63818359375, 3.236328125, 3.83447265625, 4.4326171875, 5.03076171875, 5.62890625, 6.22705078125, 6.8251953125, 7.42333984375, 8.021484375, 8.61962890625, 9.2177734375, 9.81591796875, 10.4140625, 11.01220703125, 11.6103515625, 12.20849609375, 12.806640625, 13.40478515625, 14.0029296875, 14.60107421875, 15.19921875, 15.79736328125, 16.3955078125, 16.99365234375, 17.591796875, 18.18994140625, 18.7880859375, 19.38623046875, 19.984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 5.0, 10.0, 14.0, 16.0, 26.0, 23.0, 18.0, 29.0, 37.0, 43.0, 53.0, 40.0, 43.0, 54.0, 59.0, 50.0, 48.0, 55.0, 43.0, 46.0, 42.0, 30.0, 25.0, 29.0, 28.0, 25.0, 11.0, 17.0, 21.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.59375, -21.927490234375, -21.26123046875, -20.594970703125, -19.9287109375, -19.262451171875, -18.59619140625, -17.929931640625, -17.263671875, -16.597412109375, -15.93115234375, -15.264892578125, -14.5986328125, -13.932373046875, -13.26611328125, -12.599853515625, -11.93359375, -11.267333984375, -10.60107421875, -9.934814453125, -9.2685546875, -8.602294921875, -7.93603515625, -7.269775390625, -6.603515625, -5.937255859375, -5.27099609375, -4.604736328125, -3.9384765625, -3.272216796875, -2.60595703125, -1.939697265625, -1.2734375, -0.607177734375, 0.05908203125, 0.725341796875, 1.3916015625, 2.057861328125, 2.72412109375, 3.390380859375, 4.056640625, 4.722900390625, 5.38916015625, 6.055419921875, 6.7216796875, 7.387939453125, 8.05419921875, 8.720458984375, 9.38671875, 10.052978515625, 10.71923828125, 11.385498046875, 12.0517578125, 12.718017578125, 13.38427734375, 14.050537109375, 14.716796875, 15.383056640625, 16.04931640625, 16.715576171875, 17.3818359375, 18.048095703125, 18.71435546875, 19.380615234375, 20.046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 12.0, 7.0, 14.0, 15.0, 24.0, 46.0, 59.0, 106.0, 160.0, 247.0, 516.0, 1272.0, 4753.0, 34527.0, 590646.0, 385539.0, 24693.0, 3766.0, 1076.0, 434.0, 232.0, 125.0, 95.0, 61.0, 41.0, 19.0, 17.0, 13.0, 10.0, 3.0, 10.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.1015625, -9.7640380859375, -9.426513671875, -9.0889892578125, -8.75146484375, -8.4139404296875, -8.076416015625, -7.7388916015625, -7.4013671875, -7.0638427734375, -6.726318359375, -6.3887939453125, -6.05126953125, -5.7137451171875, -5.376220703125, -5.0386962890625, -4.701171875, -4.3636474609375, -4.026123046875, -3.6885986328125, -3.35107421875, -3.0135498046875, -2.676025390625, -2.3385009765625, -2.0009765625, -1.6634521484375, -1.325927734375, -0.9884033203125, -0.65087890625, -0.3133544921875, 0.024169921875, 0.3616943359375, 0.69921875, 1.0367431640625, 1.374267578125, 1.7117919921875, 2.04931640625, 2.3868408203125, 2.724365234375, 3.0618896484375, 3.3994140625, 3.7369384765625, 4.074462890625, 4.4119873046875, 4.74951171875, 5.0870361328125, 5.424560546875, 5.7620849609375, 6.099609375, 6.4371337890625, 6.774658203125, 7.1121826171875, 7.44970703125, 7.7872314453125, 8.124755859375, 8.4622802734375, 8.7998046875, 9.1373291015625, 9.474853515625, 9.8123779296875, 10.14990234375, 10.4874267578125, 10.824951171875, 11.1624755859375, 11.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 11.0, 14.0, 13.0, 15.0, 29.0, 41.0, 57.0, 56.0, 100.0, 131.0, 117.0, 91.0, 74.0, 60.0, 41.0, 35.0, 23.0, 17.0, 16.0, 12.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010431110858917236, -0.0010085701942443848, -0.0009740293025970459, -0.000939488410949707, -0.0009049475193023682, -0.0008704066276550293, -0.0008358657360076904, -0.0008013248443603516, -0.0007667839527130127, -0.0007322430610656738, -0.000697702169418335, -0.0006631612777709961, -0.0006286203861236572, -0.0005940794944763184, -0.0005595386028289795, -0.0005249977111816406, -0.0004904568195343018, -0.0004559159278869629, -0.000421375036239624, -0.00038683414459228516, -0.0003522932529449463, -0.0003177523612976074, -0.00028321146965026855, -0.0002486705780029297, -0.00021412968635559082, -0.00017958879470825195, -0.00014504790306091309, -0.00011050701141357422, -7.596611976623535e-05, -4.1425228118896484e-05, -6.884336471557617e-06, 2.765655517578125e-05, 6.219744682312012e-05, 9.673833847045898e-05, 0.00013127923011779785, 0.00016582012176513672, 0.00020036101341247559, 0.00023490190505981445, 0.0002694427967071533, 0.0003039836883544922, 0.00033852458000183105, 0.0003730654716491699, 0.0004076063632965088, 0.00044214725494384766, 0.0004766881465911865, 0.0005112290382385254, 0.0005457699298858643, 0.0005803108215332031, 0.000614851713180542, 0.0006493926048278809, 0.0006839334964752197, 0.0007184743881225586, 0.0007530152797698975, 0.0007875561714172363, 0.0008220970630645752, 0.0008566379547119141, 0.0008911788463592529, 0.0009257197380065918, 0.0009602606296539307, 0.0009948015213012695, 0.0010293424129486084, 0.0010638833045959473, 0.0010984241962432861, 0.001132965087890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 13.0, 15.0, 36.0, 55.0, 101.0, 155.0, 338.0, 718.0, 2007.0, 8034.0, 89338.0, 827586.0, 107431.0, 9055.0, 2100.0, 765.0, 345.0, 176.0, 102.0, 61.0, 42.0, 29.0, 11.0, 8.0, 8.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.375, -7.967041015625, -7.55908203125, -7.151123046875, -6.7431640625, -6.335205078125, -5.92724609375, -5.519287109375, -5.111328125, -4.703369140625, -4.29541015625, -3.887451171875, -3.4794921875, -3.071533203125, -2.66357421875, -2.255615234375, -1.84765625, -1.439697265625, -1.03173828125, -0.623779296875, -0.2158203125, 0.192138671875, 0.60009765625, 1.008056640625, 1.416015625, 1.823974609375, 2.23193359375, 2.639892578125, 3.0478515625, 3.455810546875, 3.86376953125, 4.271728515625, 4.6796875, 5.087646484375, 5.49560546875, 5.903564453125, 6.3115234375, 6.719482421875, 7.12744140625, 7.535400390625, 7.943359375, 8.351318359375, 8.75927734375, 9.167236328125, 9.5751953125, 9.983154296875, 10.39111328125, 10.799072265625, 11.20703125, 11.614990234375, 12.02294921875, 12.430908203125, 12.8388671875, 13.246826171875, 13.65478515625, 14.062744140625, 14.470703125, 14.878662109375, 15.28662109375, 15.694580078125, 16.1025390625, 16.510498046875, 16.91845703125, 17.326416015625, 17.734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 9.0, 13.0, 21.0, 15.0, 29.0, 33.0, 48.0, 60.0, 70.0, 98.0, 95.0, 84.0, 92.0, 69.0, 54.0, 38.0, 42.0, 32.0, 23.0, 19.0, 10.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.23858642578125, -4.9888916015625, -4.73919677734375, -4.489501953125, -4.23980712890625, -3.9901123046875, -3.74041748046875, -3.49072265625, -3.24102783203125, -2.9913330078125, -2.74163818359375, -2.491943359375, -2.24224853515625, -1.9925537109375, -1.74285888671875, -1.4931640625, -1.24346923828125, -0.9937744140625, -0.74407958984375, -0.494384765625, -0.24468994140625, 0.0050048828125, 0.25469970703125, 0.50439453125, 0.75408935546875, 1.0037841796875, 1.25347900390625, 1.503173828125, 1.75286865234375, 2.0025634765625, 2.25225830078125, 2.501953125, 2.75164794921875, 3.0013427734375, 3.25103759765625, 3.500732421875, 3.75042724609375, 4.0001220703125, 4.24981689453125, 4.49951171875, 4.74920654296875, 4.9989013671875, 5.24859619140625, 5.498291015625, 5.74798583984375, 5.9976806640625, 6.24737548828125, 6.4970703125, 6.74676513671875, 6.9964599609375, 7.24615478515625, 7.495849609375, 7.74554443359375, 7.9952392578125, 8.24493408203125, 8.49462890625, 8.74432373046875, 8.9940185546875, 9.24371337890625, 9.493408203125, 9.74310302734375, 9.9927978515625, 10.24249267578125, 10.4921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 58.0, 378.0, 467.0, 81.0, 20.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-569.9039916992188, -554.0897216796875, -538.2754516601562, -522.461181640625, -506.6469421386719, -490.83270263671875, -475.0184326171875, -459.20416259765625, -443.389892578125, -427.57562255859375, -411.7613830566406, -395.9471130371094, -380.1328430175781, -364.318603515625, -348.50433349609375, -332.6900634765625, -316.87579345703125, -301.0615234375, -285.2472839355469, -269.4330139160156, -253.61874389648438, -237.8044891357422, -221.990234375, -206.17596435546875, -190.36172485351562, -174.54747009277344, -158.7332000732422, -142.9189453125, -127.10467529296875, -111.29042053222656, -95.47615814208984, -79.66189575195312, -63.847625732421875, -48.033363342285156, -32.21910095214844, -16.404842376708984, -0.5905799865722656, 15.223678588867188, 31.037940979003906, 46.852203369140625, 62.666465759277344, 78.48072814941406, 94.29499053955078, 110.1092529296875, 125.92350769042969, 141.73776245117188, 157.55203247070312, 173.36630249023438, 189.18055725097656, 204.99481201171875, 220.80908203125, 236.6233367919922, 252.43760681152344, 268.2518615722656, 284.0661315917969, 299.88037109375, 315.69464111328125, 331.5089111328125, 347.3231506347656, 363.1374206542969, 378.9516906738281, 394.76593017578125, 410.5802001953125, 426.39447021484375, 442.208740234375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 5.0, 10.0, 20.0, 21.0, 20.0, 22.0, 22.0, 23.0, 33.0, 29.0, 27.0, 41.0, 44.0, 55.0, 40.0, 50.0, 49.0, 34.0, 48.0, 34.0, 48.0, 41.0, 39.0, 30.0, 33.0, 27.0, 15.0, 22.0, 20.0, 20.0, 15.0, 10.0, 10.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.88735961914062, -79.22712707519531, -76.56689453125, -73.90666198730469, -71.2464370727539, -68.5862045288086, -65.92597198486328, -63.26573944091797, -60.605506896972656, -57.945274353027344, -55.2850456237793, -52.624813079833984, -49.96458053588867, -47.304351806640625, -44.64411926269531, -41.98388671875, -39.32365798950195, -36.66342544555664, -34.003196716308594, -31.34296417236328, -28.68273162841797, -26.02250099182129, -23.36227035522461, -20.702037811279297, -18.041807174682617, -15.381575584411621, -12.721343994140625, -10.061113357543945, -7.400881767272949, -4.740650177001953, -2.0804195404052734, 0.5798130035400391, 3.2400436401367188, 5.900275230407715, 8.560506820678711, 11.22073745727539, 13.880969047546387, 16.541200637817383, 19.201431274414062, 21.861663818359375, 24.521894454956055, 27.182125091552734, 29.842357635498047, 32.502586364746094, 35.162818908691406, 37.82305145263672, 40.48328399658203, 43.143516540527344, 45.80374526977539, 48.4639778137207, 51.12420654296875, 53.78443908691406, 56.444671630859375, 59.10490417480469, 61.765132904052734, 64.42536926269531, 67.0855941772461, 69.7458267211914, 72.40605926513672, 75.0662841796875, 77.72651672363281, 80.38674926757812, 83.04698181152344, 85.70721435546875, 88.36744689941406]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 5.0, 12.0, 10.0, 24.0, 49.0, 91.0, 141.0, 287.0, 628.0, 1324.0, 4011.0, 14591.0, 135207.0, 3992015.0, 34687.0, 7312.0, 2214.0, 836.0, 396.0, 192.0, 116.0, 42.0, 36.0, 15.0, 16.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.75, -21.88330078125, -21.0166015625, -20.14990234375, -19.283203125, -18.41650390625, -17.5498046875, -16.68310546875, -15.81640625, -14.94970703125, -14.0830078125, -13.21630859375, -12.349609375, -11.48291015625, -10.6162109375, -9.74951171875, -8.8828125, -8.01611328125, -7.1494140625, -6.28271484375, -5.416015625, -4.54931640625, -3.6826171875, -2.81591796875, -1.94921875, -1.08251953125, -0.2158203125, 0.65087890625, 1.517578125, 2.38427734375, 3.2509765625, 4.11767578125, 4.984375, 5.85107421875, 6.7177734375, 7.58447265625, 8.451171875, 9.31787109375, 10.1845703125, 11.05126953125, 11.91796875, 12.78466796875, 13.6513671875, 14.51806640625, 15.384765625, 16.25146484375, 17.1181640625, 17.98486328125, 18.8515625, 19.71826171875, 20.5849609375, 21.45166015625, 22.318359375, 23.18505859375, 24.0517578125, 24.91845703125, 25.78515625, 26.65185546875, 27.5185546875, 28.38525390625, 29.251953125, 30.11865234375, 30.9853515625, 31.85205078125, 32.71875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 9.0, 14.0, 16.0, 18.0, 22.0, 25.0, 40.0, 48.0, 47.0, 65.0, 56.0, 64.0, 73.0, 63.0, 74.0, 55.0, 51.0, 37.0, 44.0, 35.0, 26.0, 26.0, 13.0, 14.0, 5.0, 15.0, 5.0, 13.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.3380126953125, -4.156494140625, -3.9749755859375, -3.79345703125, -3.6119384765625, -3.430419921875, -3.2489013671875, -3.0673828125, -2.8858642578125, -2.704345703125, -2.5228271484375, -2.34130859375, -2.1597900390625, -1.978271484375, -1.7967529296875, -1.615234375, -1.4337158203125, -1.252197265625, -1.0706787109375, -0.88916015625, -0.7076416015625, -0.526123046875, -0.3446044921875, -0.1630859375, 0.0184326171875, 0.199951171875, 0.3814697265625, 0.56298828125, 0.7445068359375, 0.926025390625, 1.1075439453125, 1.2890625, 1.4705810546875, 1.652099609375, 1.8336181640625, 2.01513671875, 2.1966552734375, 2.378173828125, 2.5596923828125, 2.7412109375, 2.9227294921875, 3.104248046875, 3.2857666015625, 3.46728515625, 3.6488037109375, 3.830322265625, 4.0118408203125, 4.193359375, 4.3748779296875, 4.556396484375, 4.7379150390625, 4.91943359375, 5.1009521484375, 5.282470703125, 5.4639892578125, 5.6455078125, 5.8270263671875, 6.008544921875, 6.1900634765625, 6.37158203125, 6.5531005859375, 6.734619140625, 6.9161376953125, 7.09765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 16.0, 21.0, 22.0, 41.0, 51.0, 83.0, 135.0, 228.0, 445.0, 873.0, 1727.0, 4537.0, 13553.0, 78514.0, 3971090.0, 98426.0, 15538.0, 4905.0, 2017.0, 924.0, 487.0, 239.0, 134.0, 88.0, 46.0, 31.0, 30.0, 15.0, 25.0, 12.0, 3.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0], "bins": [-27.765625, -27.0972900390625, -26.428955078125, -25.7606201171875, -25.09228515625, -24.4239501953125, -23.755615234375, -23.0872802734375, -22.4189453125, -21.7506103515625, -21.082275390625, -20.4139404296875, -19.74560546875, -19.0772705078125, -18.408935546875, -17.7406005859375, -17.072265625, -16.4039306640625, -15.735595703125, -15.0672607421875, -14.39892578125, -13.7305908203125, -13.062255859375, -12.3939208984375, -11.7255859375, -11.0572509765625, -10.388916015625, -9.7205810546875, -9.05224609375, -8.3839111328125, -7.715576171875, -7.0472412109375, -6.37890625, -5.7105712890625, -5.042236328125, -4.3739013671875, -3.70556640625, -3.0372314453125, -2.368896484375, -1.7005615234375, -1.0322265625, -0.3638916015625, 0.304443359375, 0.9727783203125, 1.64111328125, 2.3094482421875, 2.977783203125, 3.6461181640625, 4.314453125, 4.9827880859375, 5.651123046875, 6.3194580078125, 6.98779296875, 7.6561279296875, 8.324462890625, 8.9927978515625, 9.6611328125, 10.3294677734375, 10.997802734375, 11.6661376953125, 12.33447265625, 13.0028076171875, 13.671142578125, 14.3394775390625, 15.0078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 14.0, 14.0, 22.0, 25.0, 56.0, 117.0, 328.0, 3038.0, 233.0, 88.0, 44.0, 22.0, 15.0, 12.0, 14.0, 2.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.68414306640625, -7.4542236328125, -7.22430419921875, -6.994384765625, -6.76446533203125, -6.5345458984375, -6.30462646484375, -6.07470703125, -5.84478759765625, -5.6148681640625, -5.38494873046875, -5.155029296875, -4.92510986328125, -4.6951904296875, -4.46527099609375, -4.2353515625, -4.00543212890625, -3.7755126953125, -3.54559326171875, -3.315673828125, -3.08575439453125, -2.8558349609375, -2.62591552734375, -2.39599609375, -2.16607666015625, -1.9361572265625, -1.70623779296875, -1.476318359375, -1.24639892578125, -1.0164794921875, -0.78656005859375, -0.556640625, -0.32672119140625, -0.0968017578125, 0.13311767578125, 0.363037109375, 0.59295654296875, 0.8228759765625, 1.05279541015625, 1.28271484375, 1.51263427734375, 1.7425537109375, 1.97247314453125, 2.202392578125, 2.43231201171875, 2.6622314453125, 2.89215087890625, 3.1220703125, 3.35198974609375, 3.5819091796875, 3.81182861328125, 4.041748046875, 4.27166748046875, 4.5015869140625, 4.73150634765625, 4.96142578125, 5.19134521484375, 5.4212646484375, 5.65118408203125, 5.881103515625, 6.11102294921875, 6.3409423828125, 6.57086181640625, 6.80078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 17.0, 31.0, 61.0, 108.0, 148.0, 141.0, 164.0, 127.0, 74.0, 55.0, 28.0, 17.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-61.56011962890625, -60.20906448364258, -58.85800552368164, -57.50695037841797, -56.1558952331543, -54.80483627319336, -53.45378112792969, -52.10272216796875, -50.75166702270508, -49.400611877441406, -48.04955291748047, -46.6984977722168, -45.347442626953125, -43.99638366699219, -42.645328521728516, -41.294273376464844, -39.943214416503906, -38.592159271240234, -37.2411003112793, -35.890045166015625, -34.53899002075195, -33.187931060791016, -31.836875915527344, -30.48581886291504, -29.134765625, -27.783708572387695, -26.432653427124023, -25.08159637451172, -23.730539321899414, -22.37948226928711, -21.028427124023438, -19.677370071411133, -18.326311111450195, -16.97525405883789, -15.624197959899902, -14.273141860961914, -12.92208480834961, -11.571028709411621, -10.219972610473633, -8.868915557861328, -7.51785945892334, -6.166802883148193, -4.815746307373047, -3.4646902084350586, -2.113633632659912, -0.7625770568847656, 0.5884790420532227, 1.9395360946655273, 3.2905921936035156, 4.641648769378662, 5.992705345153809, 7.343761444091797, 8.694818496704102, 10.04587459564209, 11.396930694580078, 12.747987747192383, 14.099043846130371, 15.45009994506836, 16.801156997680664, 18.15221405029297, 19.50326919555664, 20.854326248168945, 22.20538330078125, 23.556438446044922, 24.907495498657227]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 14.0, 16.0, 20.0, 22.0, 24.0, 21.0, 26.0, 29.0, 43.0, 36.0, 34.0, 45.0, 39.0, 57.0, 43.0, 44.0, 41.0, 56.0, 39.0, 41.0, 49.0, 32.0, 37.0, 31.0, 27.0, 19.0, 20.0, 21.0, 16.0, 6.0, 11.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.312578201293945, -15.806832313537598, -15.301087379455566, -14.795341491699219, -14.289596557617188, -13.78385066986084, -13.278104782104492, -12.772359848022461, -12.266613960266113, -11.760868072509766, -11.255123138427734, -10.749377250671387, -10.243631362915039, -9.737886428833008, -9.23214054107666, -8.726394653320312, -8.220649719238281, -7.714904308319092, -7.209158897399902, -6.703413009643555, -6.197667598724365, -5.691922187805176, -5.186176300048828, -4.680430889129639, -4.174685478210449, -3.6689400672912598, -3.163194417953491, -2.6574487686157227, -2.151703357696533, -1.6459579467773438, -1.1402122974395752, -0.6344666481018066, -0.12871932983398438, 0.37702620029449463, 0.8827717304229736, 1.3885172605514526, 1.8942627906799316, 2.400008201599121, 2.9057538509368896, 3.411499500274658, 3.9172449111938477, 4.422990322113037, 4.928735733032227, 5.434481620788574, 5.940227031707764, 6.445972442626953, 6.951718330383301, 7.45746374130249, 7.96320915222168, 8.468955039978027, 8.974699974060059, 9.480445861816406, 9.986190795898438, 10.491936683654785, 10.997682571411133, 11.503427505493164, 12.009173393249512, 12.51491928100586, 13.02066421508789, 13.526410102844238, 14.032155990600586, 14.537900924682617, 15.043646812438965, 15.549392700195312, 16.055137634277344]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 16.0, 24.0, 47.0, 78.0, 142.0, 249.0, 489.0, 1050.0, 2452.0, 7092.0, 23054.0, 88408.0, 341679.0, 425838.0, 114107.0, 29894.0, 8500.0, 3019.0, 1151.0, 575.0, 290.0, 140.0, 89.0, 58.0, 36.0, 16.0, 9.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-24.921875, -24.30029296875, -23.6787109375, -23.05712890625, -22.435546875, -21.81396484375, -21.1923828125, -20.57080078125, -19.94921875, -19.32763671875, -18.7060546875, -18.08447265625, -17.462890625, -16.84130859375, -16.2197265625, -15.59814453125, -14.9765625, -14.35498046875, -13.7333984375, -13.11181640625, -12.490234375, -11.86865234375, -11.2470703125, -10.62548828125, -10.00390625, -9.38232421875, -8.7607421875, -8.13916015625, -7.517578125, -6.89599609375, -6.2744140625, -5.65283203125, -5.03125, -4.40966796875, -3.7880859375, -3.16650390625, -2.544921875, -1.92333984375, -1.3017578125, -0.68017578125, -0.05859375, 0.56298828125, 1.1845703125, 1.80615234375, 2.427734375, 3.04931640625, 3.6708984375, 4.29248046875, 4.9140625, 5.53564453125, 6.1572265625, 6.77880859375, 7.400390625, 8.02197265625, 8.6435546875, 9.26513671875, 9.88671875, 10.50830078125, 11.1298828125, 11.75146484375, 12.373046875, 12.99462890625, 13.6162109375, 14.23779296875, 14.859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 6.0, 10.0, 6.0, 11.0, 15.0, 15.0, 18.0, 27.0, 26.0, 42.0, 41.0, 39.0, 65.0, 73.0, 52.0, 79.0, 71.0, 55.0, 65.0, 48.0, 42.0, 28.0, 37.0, 24.0, 26.0, 14.0, 13.0, 14.0, 14.0, 10.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.92645263671875, -4.7357177734375, -4.54498291015625, -4.354248046875, -4.16351318359375, -3.9727783203125, -3.78204345703125, -3.59130859375, -3.40057373046875, -3.2098388671875, -3.01910400390625, -2.828369140625, -2.63763427734375, -2.4468994140625, -2.25616455078125, -2.0654296875, -1.87469482421875, -1.6839599609375, -1.49322509765625, -1.302490234375, -1.11175537109375, -0.9210205078125, -0.73028564453125, -0.53955078125, -0.34881591796875, -0.1580810546875, 0.03265380859375, 0.223388671875, 0.41412353515625, 0.6048583984375, 0.79559326171875, 0.986328125, 1.17706298828125, 1.3677978515625, 1.55853271484375, 1.749267578125, 1.94000244140625, 2.1307373046875, 2.32147216796875, 2.51220703125, 2.70294189453125, 2.8936767578125, 3.08441162109375, 3.275146484375, 3.46588134765625, 3.6566162109375, 3.84735107421875, 4.0380859375, 4.22882080078125, 4.4195556640625, 4.61029052734375, 4.801025390625, 4.99176025390625, 5.1824951171875, 5.37322998046875, 5.56396484375, 5.75469970703125, 5.9454345703125, 6.13616943359375, 6.326904296875, 6.51763916015625, 6.7083740234375, 6.89910888671875, 7.08984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 9.0, 9.0, 21.0, 40.0, 61.0, 106.0, 179.0, 309.0, 584.0, 1327.0, 4097.0, 39276.0, 790051.0, 197810.0, 10656.0, 2162.0, 825.0, 428.0, 248.0, 116.0, 89.0, 55.0, 32.0, 21.0, 11.0, 12.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5, -36.388671875, -35.27734375, -34.166015625, -33.0546875, -31.943359375, -30.83203125, -29.720703125, -28.609375, -27.498046875, -26.38671875, -25.275390625, -24.1640625, -23.052734375, -21.94140625, -20.830078125, -19.71875, -18.607421875, -17.49609375, -16.384765625, -15.2734375, -14.162109375, -13.05078125, -11.939453125, -10.828125, -9.716796875, -8.60546875, -7.494140625, -6.3828125, -5.271484375, -4.16015625, -3.048828125, -1.9375, -0.826171875, 0.28515625, 1.396484375, 2.5078125, 3.619140625, 4.73046875, 5.841796875, 6.953125, 8.064453125, 9.17578125, 10.287109375, 11.3984375, 12.509765625, 13.62109375, 14.732421875, 15.84375, 16.955078125, 18.06640625, 19.177734375, 20.2890625, 21.400390625, 22.51171875, 23.623046875, 24.734375, 25.845703125, 26.95703125, 28.068359375, 29.1796875, 30.291015625, 31.40234375, 32.513671875, 33.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 11.0, 10.0, 15.0, 12.0, 22.0, 23.0, 29.0, 25.0, 28.0, 35.0, 32.0, 44.0, 37.0, 42.0, 38.0, 40.0, 45.0, 38.0, 39.0, 42.0, 24.0, 33.0, 37.0, 36.0, 29.0, 25.0, 28.0, 22.0, 18.0, 23.0, 14.0, 12.0, 12.0, 10.0, 6.0, 5.0, 3.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.9296875, -14.4205322265625, -13.911376953125, -13.4022216796875, -12.89306640625, -12.3839111328125, -11.874755859375, -11.3656005859375, -10.8564453125, -10.3472900390625, -9.838134765625, -9.3289794921875, -8.81982421875, -8.3106689453125, -7.801513671875, -7.2923583984375, -6.783203125, -6.2740478515625, -5.764892578125, -5.2557373046875, -4.74658203125, -4.2374267578125, -3.728271484375, -3.2191162109375, -2.7099609375, -2.2008056640625, -1.691650390625, -1.1824951171875, -0.67333984375, -0.1641845703125, 0.344970703125, 0.8541259765625, 1.36328125, 1.8724365234375, 2.381591796875, 2.8907470703125, 3.39990234375, 3.9090576171875, 4.418212890625, 4.9273681640625, 5.4365234375, 5.9456787109375, 6.454833984375, 6.9639892578125, 7.47314453125, 7.9822998046875, 8.491455078125, 9.0006103515625, 9.509765625, 10.0189208984375, 10.528076171875, 11.0372314453125, 11.54638671875, 12.0555419921875, 12.564697265625, 13.0738525390625, 13.5830078125, 14.0921630859375, 14.601318359375, 15.1104736328125, 15.61962890625, 16.1287841796875, 16.637939453125, 17.1470947265625, 17.65625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 14.0, 25.0, 31.0, 48.0, 62.0, 101.0, 197.0, 366.0, 687.0, 1518.0, 3737.0, 11686.0, 55358.0, 404600.0, 486311.0, 63347.0, 13206.0, 4095.0, 1555.0, 714.0, 387.0, 186.0, 121.0, 64.0, 45.0, 22.0, 10.0, 15.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6953125, -7.45513916015625, -7.2149658203125, -6.97479248046875, -6.734619140625, -6.49444580078125, -6.2542724609375, -6.01409912109375, -5.77392578125, -5.53375244140625, -5.2935791015625, -5.05340576171875, -4.813232421875, -4.57305908203125, -4.3328857421875, -4.09271240234375, -3.8525390625, -3.61236572265625, -3.3721923828125, -3.13201904296875, -2.891845703125, -2.65167236328125, -2.4114990234375, -2.17132568359375, -1.93115234375, -1.69097900390625, -1.4508056640625, -1.21063232421875, -0.970458984375, -0.73028564453125, -0.4901123046875, -0.24993896484375, -0.009765625, 0.23040771484375, 0.4705810546875, 0.71075439453125, 0.950927734375, 1.19110107421875, 1.4312744140625, 1.67144775390625, 1.91162109375, 2.15179443359375, 2.3919677734375, 2.63214111328125, 2.872314453125, 3.11248779296875, 3.3526611328125, 3.59283447265625, 3.8330078125, 4.07318115234375, 4.3133544921875, 4.55352783203125, 4.793701171875, 5.03387451171875, 5.2740478515625, 5.51422119140625, 5.75439453125, 5.99456787109375, 6.2347412109375, 6.47491455078125, 6.715087890625, 6.95526123046875, 7.1954345703125, 7.43560791015625, 7.67578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 13.0, 14.0, 10.0, 10.0, 15.0, 24.0, 26.0, 18.0, 37.0, 40.0, 41.0, 70.0, 83.0, 103.0, 110.0, 81.0, 54.0, 44.0, 34.0, 34.0, 27.0, 25.0, 11.0, 19.0, 8.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.001495361328125, -0.0014546513557434082, -0.0014139413833618164, -0.0013732314109802246, -0.0013325214385986328, -0.001291811466217041, -0.0012511014938354492, -0.0012103915214538574, -0.0011696815490722656, -0.0011289715766906738, -0.001088261604309082, -0.0010475516319274902, -0.0010068416595458984, -0.0009661316871643066, -0.0009254217147827148, -0.000884711742401123, -0.0008440017700195312, -0.0008032917976379395, -0.0007625818252563477, -0.0007218718528747559, -0.0006811618804931641, -0.0006404519081115723, -0.0005997419357299805, -0.0005590319633483887, -0.0005183219909667969, -0.0004776120185852051, -0.0004369020462036133, -0.0003961920738220215, -0.0003554821014404297, -0.0003147721290588379, -0.0002740621566772461, -0.0002333521842956543, -0.0001926422119140625, -0.0001519322395324707, -0.0001112222671508789, -7.051229476928711e-05, -2.9802322387695312e-05, 1.0907649993896484e-05, 5.161762237548828e-05, 9.232759475708008e-05, 0.00013303756713867188, 0.00017374753952026367, 0.00021445751190185547, 0.00025516748428344727, 0.00029587745666503906, 0.00033658742904663086, 0.00037729740142822266, 0.00041800737380981445, 0.00045871734619140625, 0.000499427318572998, 0.0005401372909545898, 0.0005808472633361816, 0.0006215572357177734, 0.0006622672080993652, 0.000702977180480957, 0.0007436871528625488, 0.0007843971252441406, 0.0008251070976257324, 0.0008658170700073242, 0.000906527042388916, 0.0009472370147705078, 0.0009879469871520996, 0.0010286569595336914, 0.0010693669319152832, 0.001110076904296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 6.0, 20.0, 12.0, 23.0, 36.0, 38.0, 47.0, 72.0, 114.0, 189.0, 330.0, 563.0, 1121.0, 2534.0, 7517.0, 34216.0, 283265.0, 618654.0, 78887.0, 13560.0, 4000.0, 1531.0, 747.0, 374.0, 230.0, 123.0, 89.0, 59.0, 42.0, 35.0, 30.0, 24.0, 16.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9765625, -8.706298828125, -8.43603515625, -8.165771484375, -7.8955078125, -7.625244140625, -7.35498046875, -7.084716796875, -6.814453125, -6.544189453125, -6.27392578125, -6.003662109375, -5.7333984375, -5.463134765625, -5.19287109375, -4.922607421875, -4.65234375, -4.382080078125, -4.11181640625, -3.841552734375, -3.5712890625, -3.301025390625, -3.03076171875, -2.760498046875, -2.490234375, -2.219970703125, -1.94970703125, -1.679443359375, -1.4091796875, -1.138916015625, -0.86865234375, -0.598388671875, -0.328125, -0.057861328125, 0.21240234375, 0.482666015625, 0.7529296875, 1.023193359375, 1.29345703125, 1.563720703125, 1.833984375, 2.104248046875, 2.37451171875, 2.644775390625, 2.9150390625, 3.185302734375, 3.45556640625, 3.725830078125, 3.99609375, 4.266357421875, 4.53662109375, 4.806884765625, 5.0771484375, 5.347412109375, 5.61767578125, 5.887939453125, 6.158203125, 6.428466796875, 6.69873046875, 6.968994140625, 7.2392578125, 7.509521484375, 7.77978515625, 8.050048828125, 8.3203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 7.0, 13.0, 12.0, 12.0, 12.0, 23.0, 30.0, 34.0, 32.0, 50.0, 48.0, 72.0, 67.0, 61.0, 64.0, 56.0, 75.0, 69.0, 48.0, 38.0, 28.0, 25.0, 16.0, 18.0, 14.0, 8.0, 18.0, 8.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.55126953125, -4.3837890625, -4.21630859375, -4.048828125, -3.88134765625, -3.7138671875, -3.54638671875, -3.37890625, -3.21142578125, -3.0439453125, -2.87646484375, -2.708984375, -2.54150390625, -2.3740234375, -2.20654296875, -2.0390625, -1.87158203125, -1.7041015625, -1.53662109375, -1.369140625, -1.20166015625, -1.0341796875, -0.86669921875, -0.69921875, -0.53173828125, -0.3642578125, -0.19677734375, -0.029296875, 0.13818359375, 0.3056640625, 0.47314453125, 0.640625, 0.80810546875, 0.9755859375, 1.14306640625, 1.310546875, 1.47802734375, 1.6455078125, 1.81298828125, 1.98046875, 2.14794921875, 2.3154296875, 2.48291015625, 2.650390625, 2.81787109375, 2.9853515625, 3.15283203125, 3.3203125, 3.48779296875, 3.6552734375, 3.82275390625, 3.990234375, 4.15771484375, 4.3251953125, 4.49267578125, 4.66015625, 4.82763671875, 4.9951171875, 5.16259765625, 5.330078125, 5.49755859375, 5.6650390625, 5.83251953125, 6.0]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 14.0, 28.0, 67.0, 117.0, 202.0, 208.0, 163.0, 114.0, 38.0, 25.0, 10.0, 7.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.2626953125, -342.99365234375, -335.724609375, -328.45556640625, -321.1864929199219, -313.9174499511719, -306.6484069824219, -299.3793640136719, -292.1103210449219, -284.8412780761719, -277.5722351074219, -270.30316162109375, -263.03411865234375, -255.76507568359375, -248.49603271484375, -241.22698974609375, -233.9579315185547, -226.6888885498047, -219.41983032226562, -212.15078735351562, -204.88174438476562, -197.61270141601562, -190.34364318847656, -183.07460021972656, -175.8055419921875, -168.5364990234375, -161.26744079589844, -153.99839782714844, -146.72935485839844, -139.46029663085938, -132.19125366210938, -124.92221069335938, -117.65316009521484, -110.38410949707031, -103.11506652832031, -95.84601593017578, -88.57696533203125, -81.30792236328125, -74.03887176513672, -66.76982116699219, -59.50077819824219, -52.23173141479492, -44.962684631347656, -37.693634033203125, -30.42458724975586, -23.155540466308594, -15.886489868164062, -8.617443084716797, -1.3483963012695312, 5.920651435852051, 13.189699172973633, 20.45874786376953, 27.727794647216797, 34.99684143066406, 42.265892028808594, 49.53493881225586, 56.803985595703125, 64.07303619384766, 71.34207916259766, 78.61112976074219, 85.88017272949219, 93.14922332763672, 100.41827392578125, 107.68731689453125, 114.95636749267578]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 17.0, 8.0, 16.0, 17.0, 18.0, 15.0, 24.0, 34.0, 35.0, 41.0, 44.0, 53.0, 44.0, 52.0, 58.0, 48.0, 59.0, 53.0, 46.0, 36.0, 30.0, 38.0, 28.0, 28.0, 34.0, 23.0, 15.0, 17.0, 16.0, 7.0, 5.0, 4.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-83.4207763671875, -80.5611801147461, -77.70158386230469, -74.84198760986328, -71.98239135742188, -69.12278747558594, -66.26319885253906, -63.403594970703125, -60.54399871826172, -57.68440246582031, -54.824806213378906, -51.9652099609375, -49.10560989379883, -46.24601364135742, -43.386417388916016, -40.526817321777344, -37.6672248840332, -34.8076286315918, -31.948030471801758, -29.08843421936035, -26.228836059570312, -23.369239807128906, -20.5096435546875, -17.65004539489746, -14.790449142456055, -11.930851936340332, -9.07125473022461, -6.211658477783203, -3.3520612716674805, -0.4924640655517578, 2.3671321868896484, 5.2267303466796875, 8.086326599121094, 10.945923805236816, 13.805521011352539, 16.665117263793945, 19.524715423583984, 22.38431167602539, 25.243907928466797, 28.103506088256836, 30.963102340698242, 33.82270050048828, 36.68229675292969, 39.541893005371094, 42.4014892578125, 45.261085510253906, 48.12068176269531, 50.980281829833984, 53.83987808227539, 56.6994743347168, 59.5590705871582, 62.418670654296875, 65.27826690673828, 68.13786315917969, 70.9974594116211, 73.8570556640625, 76.7166519165039, 79.57624816894531, 82.43584442138672, 85.29544067382812, 88.15503692626953, 91.01463317871094, 93.87423706054688, 96.73383331298828, 99.59342956542969]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 5.0, 6.0, 10.0, 15.0, 21.0, 19.0, 40.0, 62.0, 94.0, 158.0, 218.0, 413.0, 669.0, 1240.0, 2376.0, 4768.0, 10230.0, 23543.0, 64721.0, 259439.0, 2578862.0, 1032371.0, 141509.0, 42068.0, 16479.0, 7227.0, 3536.0, 1791.0, 883.0, 568.0, 300.0, 205.0, 132.0, 81.0, 52.0, 54.0, 32.0, 21.0, 13.0, 15.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.92401123046875, -6.6331787109375, -6.34234619140625, -6.051513671875, -5.76068115234375, -5.4698486328125, -5.17901611328125, -4.88818359375, -4.59735107421875, -4.3065185546875, -4.01568603515625, -3.724853515625, -3.43402099609375, -3.1431884765625, -2.85235595703125, -2.5615234375, -2.27069091796875, -1.9798583984375, -1.68902587890625, -1.398193359375, -1.10736083984375, -0.8165283203125, -0.52569580078125, -0.23486328125, 0.05596923828125, 0.3468017578125, 0.63763427734375, 0.928466796875, 1.21929931640625, 1.5101318359375, 1.80096435546875, 2.091796875, 2.38262939453125, 2.6734619140625, 2.96429443359375, 3.255126953125, 3.54595947265625, 3.8367919921875, 4.12762451171875, 4.41845703125, 4.70928955078125, 5.0001220703125, 5.29095458984375, 5.581787109375, 5.87261962890625, 6.1634521484375, 6.45428466796875, 6.7451171875, 7.03594970703125, 7.3267822265625, 7.61761474609375, 7.908447265625, 8.19927978515625, 8.4901123046875, 8.78094482421875, 9.07177734375, 9.36260986328125, 9.6534423828125, 9.94427490234375, 10.235107421875, 10.52593994140625, 10.8167724609375, 11.10760498046875, 11.3984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 7.0, 8.0, 5.0, 13.0, 18.0, 24.0, 26.0, 34.0, 32.0, 41.0, 53.0, 46.0, 46.0, 77.0, 57.0, 68.0, 56.0, 61.0, 41.0, 50.0, 49.0, 31.0, 30.0, 27.0, 20.0, 26.0, 13.0, 15.0, 8.0, 4.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.34375, -4.16455078125, -3.9853515625, -3.80615234375, -3.626953125, -3.44775390625, -3.2685546875, -3.08935546875, -2.91015625, -2.73095703125, -2.5517578125, -2.37255859375, -2.193359375, -2.01416015625, -1.8349609375, -1.65576171875, -1.4765625, -1.29736328125, -1.1181640625, -0.93896484375, -0.759765625, -0.58056640625, -0.4013671875, -0.22216796875, -0.04296875, 0.13623046875, 0.3154296875, 0.49462890625, 0.673828125, 0.85302734375, 1.0322265625, 1.21142578125, 1.390625, 1.56982421875, 1.7490234375, 1.92822265625, 2.107421875, 2.28662109375, 2.4658203125, 2.64501953125, 2.82421875, 3.00341796875, 3.1826171875, 3.36181640625, 3.541015625, 3.72021484375, 3.8994140625, 4.07861328125, 4.2578125, 4.43701171875, 4.6162109375, 4.79541015625, 4.974609375, 5.15380859375, 5.3330078125, 5.51220703125, 5.69140625, 5.87060546875, 6.0498046875, 6.22900390625, 6.408203125, 6.58740234375, 6.7666015625, 6.94580078125, 7.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 24.0, 28.0, 47.0, 95.0, 200.0, 375.0, 1060.0, 3148.0, 11401.0, 54108.0, 597135.0, 3340933.0, 151927.0, 24324.0, 6180.0, 1964.0, 697.0, 266.0, 128.0, 77.0, 46.0, 20.0, 16.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.5848388671875, -19.044677734375, -18.5045166015625, -17.96435546875, -17.4241943359375, -16.884033203125, -16.3438720703125, -15.8037109375, -15.2635498046875, -14.723388671875, -14.1832275390625, -13.64306640625, -13.1029052734375, -12.562744140625, -12.0225830078125, -11.482421875, -10.9422607421875, -10.402099609375, -9.8619384765625, -9.32177734375, -8.7816162109375, -8.241455078125, -7.7012939453125, -7.1611328125, -6.6209716796875, -6.080810546875, -5.5406494140625, -5.00048828125, -4.4603271484375, -3.920166015625, -3.3800048828125, -2.83984375, -2.2996826171875, -1.759521484375, -1.2193603515625, -0.67919921875, -0.1390380859375, 0.401123046875, 0.9412841796875, 1.4814453125, 2.0216064453125, 2.561767578125, 3.1019287109375, 3.64208984375, 4.1822509765625, 4.722412109375, 5.2625732421875, 5.802734375, 6.3428955078125, 6.883056640625, 7.4232177734375, 7.96337890625, 8.5035400390625, 9.043701171875, 9.5838623046875, 10.1240234375, 10.6641845703125, 11.204345703125, 11.7445068359375, 12.28466796875, 12.8248291015625, 13.364990234375, 13.9051513671875, 14.4453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 17.0, 20.0, 30.0, 31.0, 51.0, 82.0, 117.0, 190.0, 267.0, 567.0, 947.0, 679.0, 358.0, 213.0, 144.0, 82.0, 56.0, 44.0, 28.0, 24.0, 13.0, 13.0, 13.0, 13.0, 10.0, 4.0, 10.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.2421875, -11.8553466796875, -11.468505859375, -11.0816650390625, -10.69482421875, -10.3079833984375, -9.921142578125, -9.5343017578125, -9.1474609375, -8.7606201171875, -8.373779296875, -7.9869384765625, -7.60009765625, -7.2132568359375, -6.826416015625, -6.4395751953125, -6.052734375, -5.6658935546875, -5.279052734375, -4.8922119140625, -4.50537109375, -4.1185302734375, -3.731689453125, -3.3448486328125, -2.9580078125, -2.5711669921875, -2.184326171875, -1.7974853515625, -1.41064453125, -1.0238037109375, -0.636962890625, -0.2501220703125, 0.13671875, 0.5235595703125, 0.910400390625, 1.2972412109375, 1.68408203125, 2.0709228515625, 2.457763671875, 2.8446044921875, 3.2314453125, 3.6182861328125, 4.005126953125, 4.3919677734375, 4.77880859375, 5.1656494140625, 5.552490234375, 5.9393310546875, 6.326171875, 6.7130126953125, 7.099853515625, 7.4866943359375, 7.87353515625, 8.2603759765625, 8.647216796875, 9.0340576171875, 9.4208984375, 9.8077392578125, 10.194580078125, 10.5814208984375, 10.96826171875, 11.3551025390625, 11.741943359375, 12.1287841796875, 12.515625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 12.0, 24.0, 37.0, 95.0, 216.0, 271.0, 193.0, 72.0, 34.0, 19.0, 5.0, 11.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.68299865722656, -107.0890121459961, -100.49502563476562, -93.90104675292969, -87.30706024169922, -80.71307373046875, -74.11909484863281, -67.52510833740234, -60.931121826171875, -54.337135314941406, -47.7431526184082, -41.149169921875, -34.55518341064453, -27.961196899414062, -21.36721420288086, -14.773231506347656, -8.179244995117188, -1.5852603912353516, 5.008724212646484, 11.60270881652832, 18.196693420410156, 24.790679931640625, 31.384662628173828, 37.97864532470703, 44.5726318359375, 51.16661834716797, 57.76060104370117, 64.35458374023438, 70.94857025146484, 77.54255676269531, 84.13653564453125, 90.73052215576172, 97.32452392578125, 103.91851043701172, 110.51249694824219, 117.10647583007812, 123.7004623413086, 130.29444885253906, 136.888427734375, 143.482421875, 150.07640075683594, 156.67037963867188, 163.26437377929688, 169.8583526611328, 176.45233154296875, 183.04632568359375, 189.6403045654297, 196.23428344726562, 202.82827758789062, 209.42225646972656, 216.01625061035156, 222.6102294921875, 229.2042236328125, 235.79820251464844, 242.39218139648438, 248.98617553710938, 255.5801544189453, 262.17413330078125, 268.76812744140625, 275.36212158203125, 281.9560852050781, 288.5500793457031, 295.1440734863281, 301.738037109375, 308.33203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 13.0, 5.0, 8.0, 14.0, 10.0, 18.0, 22.0, 25.0, 22.0, 25.0, 32.0, 34.0, 37.0, 37.0, 41.0, 36.0, 43.0, 52.0, 50.0, 43.0, 45.0, 46.0, 42.0, 30.0, 31.0, 53.0, 28.0, 18.0, 16.0, 27.0, 16.0, 11.0, 20.0, 11.0, 5.0, 7.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.31375122070312, -68.34270477294922, -66.37165832519531, -64.4006118774414, -62.429569244384766, -60.45852279663086, -58.48748016357422, -56.51643371582031, -54.545387268066406, -52.5743408203125, -50.603294372558594, -48.63225173950195, -46.66120529174805, -44.69015884399414, -42.7191162109375, -40.748069763183594, -38.77702331542969, -36.80597686767578, -34.834930419921875, -32.863887786865234, -30.892841339111328, -28.921794891357422, -26.95075035095215, -24.979705810546875, -23.00865936279297, -21.037612915039062, -19.06656837463379, -17.095523834228516, -15.12447738647461, -13.15343189239502, -11.18238639831543, -9.21134090423584, -7.24029541015625, -5.26924991607666, -3.2982044219970703, -1.3271589279174805, 0.6438865661621094, 2.614932060241699, 4.585977554321289, 6.557023048400879, 8.528068542480469, 10.499114036560059, 12.470159530639648, 14.441205024719238, 16.412250518798828, 18.383296966552734, 20.354341506958008, 22.32538604736328, 24.296432495117188, 26.267478942871094, 28.238523483276367, 30.20956802368164, 32.18061447143555, 34.15166091918945, 36.122703552246094, 38.09375, 40.064796447753906, 42.03584289550781, 44.00688934326172, 45.97793197631836, 47.948978424072266, 49.92002487182617, 51.89106750488281, 53.86211395263672, 55.833160400390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 10.0, 15.0, 17.0, 26.0, 38.0, 81.0, 150.0, 213.0, 401.0, 770.0, 1499.0, 3062.0, 7076.0, 17537.0, 49133.0, 147556.0, 454754.0, 247304.0, 74369.0, 25992.0, 10026.0, 4299.0, 2026.0, 998.0, 504.0, 271.0, 163.0, 104.0, 57.0, 30.0, 21.0, 10.0, 11.0, 5.0, 3.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.664794921875, -11.24365234375, -10.822509765625, -10.4013671875, -9.980224609375, -9.55908203125, -9.137939453125, -8.716796875, -8.295654296875, -7.87451171875, -7.453369140625, -7.0322265625, -6.611083984375, -6.18994140625, -5.768798828125, -5.34765625, -4.926513671875, -4.50537109375, -4.084228515625, -3.6630859375, -3.241943359375, -2.82080078125, -2.399658203125, -1.978515625, -1.557373046875, -1.13623046875, -0.715087890625, -0.2939453125, 0.127197265625, 0.54833984375, 0.969482421875, 1.390625, 1.811767578125, 2.23291015625, 2.654052734375, 3.0751953125, 3.496337890625, 3.91748046875, 4.338623046875, 4.759765625, 5.180908203125, 5.60205078125, 6.023193359375, 6.4443359375, 6.865478515625, 7.28662109375, 7.707763671875, 8.12890625, 8.550048828125, 8.97119140625, 9.392333984375, 9.8134765625, 10.234619140625, 10.65576171875, 11.076904296875, 11.498046875, 11.919189453125, 12.34033203125, 12.761474609375, 13.1826171875, 13.603759765625, 14.02490234375, 14.446044921875, 14.8671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 7.0, 9.0, 5.0, 8.0, 21.0, 22.0, 24.0, 29.0, 42.0, 33.0, 39.0, 55.0, 50.0, 53.0, 57.0, 66.0, 72.0, 54.0, 52.0, 53.0, 41.0, 53.0, 35.0, 20.0, 17.0, 25.0, 21.0, 12.0, 14.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.27947998046875, -4.0980224609375, -3.91656494140625, -3.735107421875, -3.55364990234375, -3.3721923828125, -3.19073486328125, -3.00927734375, -2.82781982421875, -2.6463623046875, -2.46490478515625, -2.283447265625, -2.10198974609375, -1.9205322265625, -1.73907470703125, -1.5576171875, -1.37615966796875, -1.1947021484375, -1.01324462890625, -0.831787109375, -0.65032958984375, -0.4688720703125, -0.28741455078125, -0.10595703125, 0.07550048828125, 0.2569580078125, 0.43841552734375, 0.619873046875, 0.80133056640625, 0.9827880859375, 1.16424560546875, 1.345703125, 1.52716064453125, 1.7086181640625, 1.89007568359375, 2.071533203125, 2.25299072265625, 2.4344482421875, 2.61590576171875, 2.79736328125, 2.97882080078125, 3.1602783203125, 3.34173583984375, 3.523193359375, 3.70465087890625, 3.8861083984375, 4.06756591796875, 4.2490234375, 4.43048095703125, 4.6119384765625, 4.79339599609375, 4.974853515625, 5.15631103515625, 5.3377685546875, 5.51922607421875, 5.70068359375, 5.88214111328125, 6.0635986328125, 6.24505615234375, 6.426513671875, 6.60797119140625, 6.7894287109375, 6.97088623046875, 7.15234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 11.0, 18.0, 23.0, 30.0, 57.0, 67.0, 99.0, 127.0, 248.0, 375.0, 737.0, 1498.0, 3860.0, 19586.0, 253895.0, 715485.0, 42105.0, 6228.0, 1935.0, 895.0, 427.0, 290.0, 195.0, 108.0, 65.0, 49.0, 36.0, 32.0, 23.0, 12.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.078125, -21.234619140625, -20.39111328125, -19.547607421875, -18.7041015625, -17.860595703125, -17.01708984375, -16.173583984375, -15.330078125, -14.486572265625, -13.64306640625, -12.799560546875, -11.9560546875, -11.112548828125, -10.26904296875, -9.425537109375, -8.58203125, -7.738525390625, -6.89501953125, -6.051513671875, -5.2080078125, -4.364501953125, -3.52099609375, -2.677490234375, -1.833984375, -0.990478515625, -0.14697265625, 0.696533203125, 1.5400390625, 2.383544921875, 3.22705078125, 4.070556640625, 4.9140625, 5.757568359375, 6.60107421875, 7.444580078125, 8.2880859375, 9.131591796875, 9.97509765625, 10.818603515625, 11.662109375, 12.505615234375, 13.34912109375, 14.192626953125, 15.0361328125, 15.879638671875, 16.72314453125, 17.566650390625, 18.41015625, 19.253662109375, 20.09716796875, 20.940673828125, 21.7841796875, 22.627685546875, 23.47119140625, 24.314697265625, 25.158203125, 26.001708984375, 26.84521484375, 27.688720703125, 28.5322265625, 29.375732421875, 30.21923828125, 31.062744140625, 31.90625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 4.0, 9.0, 7.0, 9.0, 12.0, 16.0, 27.0, 20.0, 28.0, 38.0, 34.0, 41.0, 66.0, 40.0, 65.0, 49.0, 56.0, 53.0, 56.0, 58.0, 49.0, 41.0, 37.0, 41.0, 32.0, 21.0, 18.0, 17.0, 9.0, 9.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-29.78125, -29.025146484375, -28.26904296875, -27.512939453125, -26.7568359375, -26.000732421875, -25.24462890625, -24.488525390625, -23.732421875, -22.976318359375, -22.22021484375, -21.464111328125, -20.7080078125, -19.951904296875, -19.19580078125, -18.439697265625, -17.68359375, -16.927490234375, -16.17138671875, -15.415283203125, -14.6591796875, -13.903076171875, -13.14697265625, -12.390869140625, -11.634765625, -10.878662109375, -10.12255859375, -9.366455078125, -8.6103515625, -7.854248046875, -7.09814453125, -6.342041015625, -5.5859375, -4.829833984375, -4.07373046875, -3.317626953125, -2.5615234375, -1.805419921875, -1.04931640625, -0.293212890625, 0.462890625, 1.218994140625, 1.97509765625, 2.731201171875, 3.4873046875, 4.243408203125, 4.99951171875, 5.755615234375, 6.51171875, 7.267822265625, 8.02392578125, 8.780029296875, 9.5361328125, 10.292236328125, 11.04833984375, 11.804443359375, 12.560546875, 13.316650390625, 14.07275390625, 14.828857421875, 15.5849609375, 16.341064453125, 17.09716796875, 17.853271484375, 18.609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 15.0, 14.0, 23.0, 30.0, 50.0, 105.0, 166.0, 413.0, 1158.0, 4823.0, 40159.0, 811002.0, 174596.0, 12510.0, 2237.0, 639.0, 294.0, 136.0, 66.0, 27.0, 29.0, 20.0, 7.0, 7.0, 6.0, 4.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.0, -14.6026611328125, -14.205322265625, -13.8079833984375, -13.41064453125, -13.0133056640625, -12.615966796875, -12.2186279296875, -11.8212890625, -11.4239501953125, -11.026611328125, -10.6292724609375, -10.23193359375, -9.8345947265625, -9.437255859375, -9.0399169921875, -8.642578125, -8.2452392578125, -7.847900390625, -7.4505615234375, -7.05322265625, -6.6558837890625, -6.258544921875, -5.8612060546875, -5.4638671875, -5.0665283203125, -4.669189453125, -4.2718505859375, -3.87451171875, -3.4771728515625, -3.079833984375, -2.6824951171875, -2.28515625, -1.8878173828125, -1.490478515625, -1.0931396484375, -0.69580078125, -0.2984619140625, 0.098876953125, 0.4962158203125, 0.8935546875, 1.2908935546875, 1.688232421875, 2.0855712890625, 2.48291015625, 2.8802490234375, 3.277587890625, 3.6749267578125, 4.072265625, 4.4696044921875, 4.866943359375, 5.2642822265625, 5.66162109375, 6.0589599609375, 6.456298828125, 6.8536376953125, 7.2509765625, 7.6483154296875, 8.045654296875, 8.4429931640625, 8.84033203125, 9.2376708984375, 9.635009765625, 10.0323486328125, 10.4296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 3.0, 6.0, 3.0, 4.0, 8.0, 14.0, 11.0, 19.0, 14.0, 12.0, 18.0, 31.0, 37.0, 74.0, 106.0, 173.0, 150.0, 84.0, 49.0, 39.0, 28.0, 24.0, 18.0, 14.0, 15.0, 9.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013780593872070312, -0.0013283789157867432, -0.001278698444366455, -0.001229017972946167, -0.001179337501525879, -0.0011296570301055908, -0.0010799765586853027, -0.0010302960872650146, -0.0009806156158447266, -0.0009309351444244385, -0.0008812546730041504, -0.0008315742015838623, -0.0007818937301635742, -0.0007322132587432861, -0.000682532787322998, -0.00063285231590271, -0.0005831718444824219, -0.0005334913730621338, -0.0004838109016418457, -0.0004341304302215576, -0.00038444995880126953, -0.00033476948738098145, -0.00028508901596069336, -0.00023540854454040527, -0.0001857280731201172, -0.0001360476016998291, -8.636713027954102e-05, -3.668665885925293e-05, 1.2993812561035156e-05, 6.267428398132324e-05, 0.00011235475540161133, 0.00016203522682189941, 0.0002117156982421875, 0.0002613961696624756, 0.00031107664108276367, 0.00036075711250305176, 0.00041043758392333984, 0.00046011805534362793, 0.000509798526763916, 0.0005594789981842041, 0.0006091594696044922, 0.0006588399410247803, 0.0007085204124450684, 0.0007582008838653564, 0.0008078813552856445, 0.0008575618267059326, 0.0009072422981262207, 0.0009569227695465088, 0.0010066032409667969, 0.001056283712387085, 0.001105964183807373, 0.0011556446552276611, 0.0012053251266479492, 0.0012550055980682373, 0.0013046860694885254, 0.0013543665409088135, 0.0014040470123291016, 0.0014537274837493896, 0.0015034079551696777, 0.0015530884265899658, 0.001602768898010254, 0.001652449369430542, 0.00170212984085083, 0.0017518103122711182, 0.0018014907836914062]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 15.0, 22.0, 26.0, 34.0, 54.0, 105.0, 115.0, 164.0, 299.0, 585.0, 1031.0, 2349.0, 7500.0, 40156.0, 487434.0, 457646.0, 38768.0, 7431.0, 2373.0, 1014.0, 519.0, 330.0, 190.0, 120.0, 71.0, 54.0, 32.0, 28.0, 17.0, 10.0, 10.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5859375, -8.2996826171875, -8.013427734375, -7.7271728515625, -7.44091796875, -7.1546630859375, -6.868408203125, -6.5821533203125, -6.2958984375, -6.0096435546875, -5.723388671875, -5.4371337890625, -5.15087890625, -4.8646240234375, -4.578369140625, -4.2921142578125, -4.005859375, -3.7196044921875, -3.433349609375, -3.1470947265625, -2.86083984375, -2.5745849609375, -2.288330078125, -2.0020751953125, -1.7158203125, -1.4295654296875, -1.143310546875, -0.8570556640625, -0.57080078125, -0.2845458984375, 0.001708984375, 0.2879638671875, 0.57421875, 0.8604736328125, 1.146728515625, 1.4329833984375, 1.71923828125, 2.0054931640625, 2.291748046875, 2.5780029296875, 2.8642578125, 3.1505126953125, 3.436767578125, 3.7230224609375, 4.00927734375, 4.2955322265625, 4.581787109375, 4.8680419921875, 5.154296875, 5.4405517578125, 5.726806640625, 6.0130615234375, 6.29931640625, 6.5855712890625, 6.871826171875, 7.1580810546875, 7.4443359375, 7.7305908203125, 8.016845703125, 8.3031005859375, 8.58935546875, 8.8756103515625, 9.161865234375, 9.4481201171875, 9.734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 5.0, 8.0, 22.0, 12.0, 12.0, 18.0, 17.0, 22.0, 30.0, 33.0, 48.0, 56.0, 57.0, 55.0, 56.0, 83.0, 70.0, 70.0, 53.0, 35.0, 38.0, 37.0, 25.0, 21.0, 13.0, 11.0, 8.0, 16.0, 9.0, 7.0, 5.0, 2.0, 5.0, 4.0, 6.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4715576171875, -4.310302734375, -4.1490478515625, -3.98779296875, -3.8265380859375, -3.665283203125, -3.5040283203125, -3.3427734375, -3.1815185546875, -3.020263671875, -2.8590087890625, -2.69775390625, -2.5364990234375, -2.375244140625, -2.2139892578125, -2.052734375, -1.8914794921875, -1.730224609375, -1.5689697265625, -1.40771484375, -1.2464599609375, -1.085205078125, -0.9239501953125, -0.7626953125, -0.6014404296875, -0.440185546875, -0.2789306640625, -0.11767578125, 0.0435791015625, 0.204833984375, 0.3660888671875, 0.52734375, 0.6885986328125, 0.849853515625, 1.0111083984375, 1.17236328125, 1.3336181640625, 1.494873046875, 1.6561279296875, 1.8173828125, 1.9786376953125, 2.139892578125, 2.3011474609375, 2.46240234375, 2.6236572265625, 2.784912109375, 2.9461669921875, 3.107421875, 3.2686767578125, 3.429931640625, 3.5911865234375, 3.75244140625, 3.9136962890625, 4.074951171875, 4.2362060546875, 4.3974609375, 4.5587158203125, 4.719970703125, 4.8812255859375, 5.04248046875, 5.2037353515625, 5.364990234375, 5.5262451171875, 5.6875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 31.0, 64.0, 118.0, 228.0, 228.0, 147.0, 95.0, 38.0, 17.0, 13.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.19520568847656, -146.1154327392578, -140.03565979003906, -133.95590209960938, -127.87612915039062, -121.79635620117188, -115.71658325195312, -109.63681030273438, -103.55704498291016, -97.4772720336914, -91.39750671386719, -85.31773376464844, -79.23796081542969, -73.15819549560547, -67.07842254638672, -60.998653411865234, -54.91888427734375, -48.839115142822266, -42.75934600830078, -36.67957305908203, -30.599803924560547, -24.520034790039062, -18.440261840820312, -12.360492706298828, -6.280723571777344, -0.20095348358154297, 5.878816604614258, 11.958587646484375, 18.03835678100586, 24.118125915527344, 30.197898864746094, 36.27766799926758, 42.35743713378906, 48.43720626831055, 54.51697540283203, 60.59674835205078, 66.676513671875, 72.75628662109375, 78.8360595703125, 84.91583251953125, 90.99559783935547, 97.07537078857422, 103.15513610839844, 109.23490905761719, 115.31468200683594, 121.39444732666016, 127.4742202758789, 133.55398559570312, 139.63375854492188, 145.71353149414062, 151.79330444335938, 157.87307739257812, 163.9528350830078, 170.03260803222656, 176.1123809814453, 182.19215393066406, 188.27191162109375, 194.3516845703125, 200.43145751953125, 206.51123046875, 212.5909881591797, 218.67076110839844, 224.7505340576172, 230.83030700683594, 236.9100799560547]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 15.0, 16.0, 11.0, 23.0, 20.0, 13.0, 21.0, 28.0, 29.0, 40.0, 29.0, 48.0, 42.0, 48.0, 63.0, 55.0, 65.0, 47.0, 47.0, 45.0, 36.0, 31.0, 30.0, 32.0, 26.0, 13.0, 27.0, 21.0, 15.0, 14.0, 13.0, 9.0, 1.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.97138977050781, -68.39381408691406, -65.81623840332031, -63.2386589050293, -60.66108322143555, -58.0835075378418, -55.50592803955078, -52.92835235595703, -50.35077667236328, -47.77320098876953, -45.19562530517578, -42.618045806884766, -40.040470123291016, -37.462894439697266, -34.88531494140625, -32.3077392578125, -29.73016357421875, -27.152587890625, -24.575010299682617, -21.997432708740234, -19.419857025146484, -16.842281341552734, -14.264703750610352, -11.687126159667969, -9.109550476074219, -6.531973838806152, -3.954397201538086, -1.3768205642700195, 1.2007560729980469, 3.7783327102661133, 6.35590934753418, 8.933486938476562, 11.511062622070312, 14.088639259338379, 16.666215896606445, 19.243793487548828, 21.821369171142578, 24.398944854736328, 26.97652244567871, 29.554100036621094, 32.131675720214844, 34.709251403808594, 37.286827087402344, 39.86440658569336, 42.44198226928711, 45.01955795288086, 47.597137451171875, 50.174713134765625, 52.752288818359375, 55.329864501953125, 57.907440185546875, 60.48501968383789, 63.06259536743164, 65.64017486572266, 68.2177505493164, 70.79532623291016, 73.3729019165039, 75.95047760009766, 78.5280532836914, 81.10562896728516, 83.68321228027344, 86.26078796386719, 88.83836364746094, 91.41593933105469, 93.99351501464844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 9.0, 9.0, 12.0, 17.0, 32.0, 30.0, 32.0, 54.0, 72.0, 85.0, 135.0, 162.0, 329.0, 1231.0, 11079.0, 2270857.0, 1897233.0, 10674.0, 1200.0, 335.0, 173.0, 135.0, 93.0, 60.0, 67.0, 43.0, 29.0, 14.0, 26.0, 12.0, 10.0, 6.0, 5.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-42.25, -41.137939453125, -40.02587890625, -38.913818359375, -37.8017578125, -36.689697265625, -35.57763671875, -34.465576171875, -33.353515625, -32.241455078125, -31.12939453125, -30.017333984375, -28.9052734375, -27.793212890625, -26.68115234375, -25.569091796875, -24.45703125, -23.344970703125, -22.23291015625, -21.120849609375, -20.0087890625, -18.896728515625, -17.78466796875, -16.672607421875, -15.560546875, -14.448486328125, -13.33642578125, -12.224365234375, -11.1123046875, -10.000244140625, -8.88818359375, -7.776123046875, -6.6640625, -5.552001953125, -4.43994140625, -3.327880859375, -2.2158203125, -1.103759765625, 0.00830078125, 1.120361328125, 2.232421875, 3.344482421875, 4.45654296875, 5.568603515625, 6.6806640625, 7.792724609375, 8.90478515625, 10.016845703125, 11.12890625, 12.240966796875, 13.35302734375, 14.465087890625, 15.5771484375, 16.689208984375, 17.80126953125, 18.913330078125, 20.025390625, 21.137451171875, 22.24951171875, 23.361572265625, 24.4736328125, 25.585693359375, 26.69775390625, 27.809814453125, 28.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 22.0, 33.0, 55.0, 57.0, 87.0, 113.0, 137.0, 137.0, 107.0, 88.0, 63.0, 42.0, 21.0, 14.0, 6.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.9405517578125, -11.576416015625, -11.2122802734375, -10.84814453125, -10.4840087890625, -10.119873046875, -9.7557373046875, -9.3916015625, -9.0274658203125, -8.663330078125, -8.2991943359375, -7.93505859375, -7.5709228515625, -7.206787109375, -6.8426513671875, -6.478515625, -6.1143798828125, -5.750244140625, -5.3861083984375, -5.02197265625, -4.6578369140625, -4.293701171875, -3.9295654296875, -3.5654296875, -3.2012939453125, -2.837158203125, -2.4730224609375, -2.10888671875, -1.7447509765625, -1.380615234375, -1.0164794921875, -0.65234375, -0.2882080078125, 0.075927734375, 0.4400634765625, 0.80419921875, 1.1683349609375, 1.532470703125, 1.8966064453125, 2.2607421875, 2.6248779296875, 2.989013671875, 3.3531494140625, 3.71728515625, 4.0814208984375, 4.445556640625, 4.8096923828125, 5.173828125, 5.5379638671875, 5.902099609375, 6.2662353515625, 6.63037109375, 6.9945068359375, 7.358642578125, 7.7227783203125, 8.0869140625, 8.4510498046875, 8.815185546875, 9.1793212890625, 9.54345703125, 9.9075927734375, 10.271728515625, 10.6358642578125, 11.0]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 20.0, 17.0, 30.0, 49.0, 95.0, 138.0, 261.0, 590.0, 1285.0, 3463.0, 11894.0, 56687.0, 924001.0, 3068882.0, 102290.0, 17233.0, 4519.0, 1510.0, 623.0, 264.0, 168.0, 103.0, 67.0, 35.0, 14.0, 18.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.439208984375, -14.90966796875, -14.380126953125, -13.8505859375, -13.321044921875, -12.79150390625, -12.261962890625, -11.732421875, -11.202880859375, -10.67333984375, -10.143798828125, -9.6142578125, -9.084716796875, -8.55517578125, -8.025634765625, -7.49609375, -6.966552734375, -6.43701171875, -5.907470703125, -5.3779296875, -4.848388671875, -4.31884765625, -3.789306640625, -3.259765625, -2.730224609375, -2.20068359375, -1.671142578125, -1.1416015625, -0.612060546875, -0.08251953125, 0.447021484375, 0.9765625, 1.506103515625, 2.03564453125, 2.565185546875, 3.0947265625, 3.624267578125, 4.15380859375, 4.683349609375, 5.212890625, 5.742431640625, 6.27197265625, 6.801513671875, 7.3310546875, 7.860595703125, 8.39013671875, 8.919677734375, 9.44921875, 9.978759765625, 10.50830078125, 11.037841796875, 11.5673828125, 12.096923828125, 12.62646484375, 13.156005859375, 13.685546875, 14.215087890625, 14.74462890625, 15.274169921875, 15.8037109375, 16.333251953125, 16.86279296875, 17.392333984375, 17.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 27.0, 32.0, 28.0, 52.0, 77.0, 114.0, 189.0, 337.0, 588.0, 952.0, 703.0, 382.0, 194.0, 123.0, 57.0, 50.0, 24.0, 27.0, 18.0, 12.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.4609375, -13.0926513671875, -12.724365234375, -12.3560791015625, -11.98779296875, -11.6195068359375, -11.251220703125, -10.8829345703125, -10.5146484375, -10.1463623046875, -9.778076171875, -9.4097900390625, -9.04150390625, -8.6732177734375, -8.304931640625, -7.9366455078125, -7.568359375, -7.2000732421875, -6.831787109375, -6.4635009765625, -6.09521484375, -5.7269287109375, -5.358642578125, -4.9903564453125, -4.6220703125, -4.2537841796875, -3.885498046875, -3.5172119140625, -3.14892578125, -2.7806396484375, -2.412353515625, -2.0440673828125, -1.67578125, -1.3074951171875, -0.939208984375, -0.5709228515625, -0.20263671875, 0.1656494140625, 0.533935546875, 0.9022216796875, 1.2705078125, 1.6387939453125, 2.007080078125, 2.3753662109375, 2.74365234375, 3.1119384765625, 3.480224609375, 3.8485107421875, 4.216796875, 4.5850830078125, 4.953369140625, 5.3216552734375, 5.68994140625, 6.0582275390625, 6.426513671875, 6.7947998046875, 7.1630859375, 7.5313720703125, 7.899658203125, 8.2679443359375, 8.63623046875, 9.0045166015625, 9.372802734375, 9.7410888671875, 10.109375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 6.0, 11.0, 11.0, 19.0, 33.0, 43.0, 76.0, 137.0, 165.0, 168.0, 123.0, 105.0, 53.0, 22.0, 14.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.77225494384766, -112.29562377929688, -108.81898498535156, -105.34235382080078, -101.86572265625, -98.38908386230469, -94.9124526977539, -91.43582153320312, -87.95918273925781, -84.48255157470703, -81.00591278076172, -77.52928161621094, -74.05265045166016, -70.57601928710938, -67.09938049316406, -63.62274932861328, -60.1461181640625, -56.66948318481445, -53.19285202026367, -49.716217041015625, -46.239585876464844, -42.7629508972168, -39.28631591796875, -35.80968475341797, -32.33304977416992, -28.856416702270508, -25.379783630371094, -21.903148651123047, -18.426515579223633, -14.949882507324219, -11.473247528076172, -7.996614456176758, -4.519989013671875, -1.0433554649353027, 2.4332780838012695, 5.909912109375, 9.386545181274414, 12.863178253173828, 16.339813232421875, 19.81644630432129, 23.293079376220703, 26.769712448120117, 30.24634552001953, 33.72298049926758, 37.199615478515625, 40.676246643066406, 44.15288162231445, 47.6295166015625, 51.10614776611328, 54.58278274536133, 58.05941390991211, 61.536048889160156, 65.01268005371094, 68.48931884765625, 71.96595001220703, 75.44258117675781, 78.91921997070312, 82.3958511352539, 85.87248992919922, 89.34912109375, 92.82575225830078, 96.30238342285156, 99.77902221679688, 103.25565338134766, 106.73228454589844]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 4.0, 7.0, 12.0, 16.0, 19.0, 14.0, 15.0, 31.0, 26.0, 34.0, 43.0, 55.0, 36.0, 38.0, 46.0, 53.0, 52.0, 54.0, 51.0, 57.0, 49.0, 45.0, 30.0, 29.0, 36.0, 26.0, 25.0, 21.0, 22.0, 14.0, 1.0, 12.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.971282958984375, -41.211490631103516, -39.45170211791992, -37.69190979003906, -35.93212127685547, -34.17232894897461, -32.412540435791016, -30.652748107910156, -28.892959594726562, -27.133169174194336, -25.37337875366211, -23.613588333129883, -21.853797912597656, -20.094005584716797, -18.334217071533203, -16.574424743652344, -14.814634323120117, -13.05484390258789, -11.295053482055664, -9.535263061523438, -7.775472164154053, -6.015681266784668, -4.255890846252441, -2.496100425720215, -0.7363100051879883, 1.0234805345535278, 2.783271074295044, 4.54306173324585, 6.302852153778076, 8.062643051147461, 9.822433471679688, 11.582223892211914, 13.34201431274414, 15.101804733276367, 16.861595153808594, 18.62138557434082, 20.381175994873047, 22.140968322753906, 23.9007568359375, 25.66054916381836, 27.420337677001953, 29.18012809753418, 30.939918518066406, 32.699710845947266, 34.45949935913086, 36.21929168701172, 37.97908020019531, 39.73887252807617, 41.49866485595703, 43.25845718383789, 45.018245697021484, 46.778038024902344, 48.53782653808594, 50.2976188659668, 52.05740737915039, 53.81719970703125, 55.576988220214844, 57.3367805480957, 59.0965690612793, 60.856361389160156, 62.61614990234375, 64.37593841552734, 66.13573455810547, 67.89552307128906, 69.65531158447266]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 6.0, 7.0, 22.0, 16.0, 20.0, 38.0, 70.0, 87.0, 152.0, 251.0, 501.0, 909.0, 1790.0, 3482.0, 7497.0, 16720.0, 40533.0, 112881.0, 354989.0, 334298.0, 106091.0, 38324.0, 15772.0, 7121.0, 3334.0, 1666.0, 843.0, 456.0, 271.0, 152.0, 85.0, 61.0, 22.0, 31.0, 6.0, 14.0, 9.0, 9.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-11.640625, -11.3077392578125, -10.974853515625, -10.6419677734375, -10.30908203125, -9.9761962890625, -9.643310546875, -9.3104248046875, -8.9775390625, -8.6446533203125, -8.311767578125, -7.9788818359375, -7.64599609375, -7.3131103515625, -6.980224609375, -6.6473388671875, -6.314453125, -5.9815673828125, -5.648681640625, -5.3157958984375, -4.98291015625, -4.6500244140625, -4.317138671875, -3.9842529296875, -3.6513671875, -3.3184814453125, -2.985595703125, -2.6527099609375, -2.31982421875, -1.9869384765625, -1.654052734375, -1.3211669921875, -0.98828125, -0.6553955078125, -0.322509765625, 0.0103759765625, 0.34326171875, 0.6761474609375, 1.009033203125, 1.3419189453125, 1.6748046875, 2.0076904296875, 2.340576171875, 2.6734619140625, 3.00634765625, 3.3392333984375, 3.672119140625, 4.0050048828125, 4.337890625, 4.6707763671875, 5.003662109375, 5.3365478515625, 5.66943359375, 6.0023193359375, 6.335205078125, 6.6680908203125, 7.0009765625, 7.3338623046875, 7.666748046875, 7.9996337890625, 8.33251953125, 8.6654052734375, 8.998291015625, 9.3311767578125, 9.6640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 4.0, 6.0, 8.0, 16.0, 15.0, 17.0, 25.0, 33.0, 33.0, 31.0, 48.0, 56.0, 56.0, 65.0, 56.0, 67.0, 65.0, 52.0, 62.0, 60.0, 39.0, 33.0, 24.0, 38.0, 24.0, 17.0, 12.0, 11.0, 11.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.67578125, -4.49151611328125, -4.3072509765625, -4.12298583984375, -3.938720703125, -3.75445556640625, -3.5701904296875, -3.38592529296875, -3.20166015625, -3.01739501953125, -2.8331298828125, -2.64886474609375, -2.464599609375, -2.28033447265625, -2.0960693359375, -1.91180419921875, -1.7275390625, -1.54327392578125, -1.3590087890625, -1.17474365234375, -0.990478515625, -0.80621337890625, -0.6219482421875, -0.43768310546875, -0.25341796875, -0.06915283203125, 0.1151123046875, 0.29937744140625, 0.483642578125, 0.66790771484375, 0.8521728515625, 1.03643798828125, 1.220703125, 1.40496826171875, 1.5892333984375, 1.77349853515625, 1.957763671875, 2.14202880859375, 2.3262939453125, 2.51055908203125, 2.69482421875, 2.87908935546875, 3.0633544921875, 3.24761962890625, 3.431884765625, 3.61614990234375, 3.8004150390625, 3.98468017578125, 4.1689453125, 4.35321044921875, 4.5374755859375, 4.72174072265625, 4.906005859375, 5.09027099609375, 5.2745361328125, 5.45880126953125, 5.64306640625, 5.82733154296875, 6.0115966796875, 6.19586181640625, 6.380126953125, 6.56439208984375, 6.7486572265625, 6.93292236328125, 7.1171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 10.0, 11.0, 12.0, 15.0, 28.0, 49.0, 66.0, 84.0, 165.0, 256.0, 376.0, 829.0, 1993.0, 6077.0, 28055.0, 215884.0, 697328.0, 77747.0, 13213.0, 3561.0, 1280.0, 642.0, 305.0, 190.0, 114.0, 85.0, 51.0, 36.0, 27.0, 20.0, 15.0, 9.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.212646484375, -16.58154296875, -15.950439453125, -15.3193359375, -14.688232421875, -14.05712890625, -13.426025390625, -12.794921875, -12.163818359375, -11.53271484375, -10.901611328125, -10.2705078125, -9.639404296875, -9.00830078125, -8.377197265625, -7.74609375, -7.114990234375, -6.48388671875, -5.852783203125, -5.2216796875, -4.590576171875, -3.95947265625, -3.328369140625, -2.697265625, -2.066162109375, -1.43505859375, -0.803955078125, -0.1728515625, 0.458251953125, 1.08935546875, 1.720458984375, 2.3515625, 2.982666015625, 3.61376953125, 4.244873046875, 4.8759765625, 5.507080078125, 6.13818359375, 6.769287109375, 7.400390625, 8.031494140625, 8.66259765625, 9.293701171875, 9.9248046875, 10.555908203125, 11.18701171875, 11.818115234375, 12.44921875, 13.080322265625, 13.71142578125, 14.342529296875, 14.9736328125, 15.604736328125, 16.23583984375, 16.866943359375, 17.498046875, 18.129150390625, 18.76025390625, 19.391357421875, 20.0224609375, 20.653564453125, 21.28466796875, 21.915771484375, 22.546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 12.0, 11.0, 9.0, 22.0, 20.0, 25.0, 27.0, 26.0, 33.0, 41.0, 38.0, 43.0, 31.0, 61.0, 44.0, 46.0, 55.0, 52.0, 35.0, 57.0, 46.0, 40.0, 30.0, 33.0, 27.0, 19.0, 18.0, 18.0, 10.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.421875, -16.849609375, -16.27734375, -15.705078125, -15.1328125, -14.560546875, -13.98828125, -13.416015625, -12.84375, -12.271484375, -11.69921875, -11.126953125, -10.5546875, -9.982421875, -9.41015625, -8.837890625, -8.265625, -7.693359375, -7.12109375, -6.548828125, -5.9765625, -5.404296875, -4.83203125, -4.259765625, -3.6875, -3.115234375, -2.54296875, -1.970703125, -1.3984375, -0.826171875, -0.25390625, 0.318359375, 0.890625, 1.462890625, 2.03515625, 2.607421875, 3.1796875, 3.751953125, 4.32421875, 4.896484375, 5.46875, 6.041015625, 6.61328125, 7.185546875, 7.7578125, 8.330078125, 8.90234375, 9.474609375, 10.046875, 10.619140625, 11.19140625, 11.763671875, 12.3359375, 12.908203125, 13.48046875, 14.052734375, 14.625, 15.197265625, 15.76953125, 16.341796875, 16.9140625, 17.486328125, 18.05859375, 18.630859375, 19.203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 18.0, 25.0, 32.0, 67.0, 140.0, 293.0, 685.0, 3259.0, 26242.0, 719726.0, 281572.0, 13345.0, 2070.0, 541.0, 233.0, 104.0, 54.0, 32.0, 21.0, 15.0, 11.0, 8.0, 7.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.8985595703125, -9.515869140625, -9.1331787109375, -8.75048828125, -8.3677978515625, -7.985107421875, -7.6024169921875, -7.2197265625, -6.8370361328125, -6.454345703125, -6.0716552734375, -5.68896484375, -5.3062744140625, -4.923583984375, -4.5408935546875, -4.158203125, -3.7755126953125, -3.392822265625, -3.0101318359375, -2.62744140625, -2.2447509765625, -1.862060546875, -1.4793701171875, -1.0966796875, -0.7139892578125, -0.331298828125, 0.0513916015625, 0.43408203125, 0.8167724609375, 1.199462890625, 1.5821533203125, 1.96484375, 2.3475341796875, 2.730224609375, 3.1129150390625, 3.49560546875, 3.8782958984375, 4.260986328125, 4.6436767578125, 5.0263671875, 5.4090576171875, 5.791748046875, 6.1744384765625, 6.55712890625, 6.9398193359375, 7.322509765625, 7.7052001953125, 8.087890625, 8.4705810546875, 8.853271484375, 9.2359619140625, 9.61865234375, 10.0013427734375, 10.384033203125, 10.7667236328125, 11.1494140625, 11.5321044921875, 11.914794921875, 12.2974853515625, 12.68017578125, 13.0628662109375, 13.445556640625, 13.8282470703125, 14.2109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 13.0, 12.0, 20.0, 48.0, 114.0, 262.0, 291.0, 114.0, 54.0, 30.0, 18.0, 6.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003963470458984375, -0.0038565993309020996, -0.0037497282028198242, -0.003642857074737549, -0.0035359859466552734, -0.003429114818572998, -0.0033222436904907227, -0.0032153725624084473, -0.003108501434326172, -0.0030016303062438965, -0.002894759178161621, -0.0027878880500793457, -0.0026810169219970703, -0.002574145793914795, -0.0024672746658325195, -0.002360403537750244, -0.0022535324096679688, -0.0021466612815856934, -0.002039790153503418, -0.0019329190254211426, -0.0018260478973388672, -0.0017191767692565918, -0.0016123056411743164, -0.001505434513092041, -0.0013985633850097656, -0.0012916922569274902, -0.0011848211288452148, -0.0010779500007629395, -0.0009710788726806641, -0.0008642077445983887, -0.0007573366165161133, -0.0006504654884338379, -0.0005435943603515625, -0.0004367232322692871, -0.0003298521041870117, -0.00022298097610473633, -0.00011610984802246094, -9.238719940185547e-06, 9.763240814208984e-05, 0.00020450353622436523, 0.0003113746643066406, 0.000418245792388916, 0.0005251169204711914, 0.0006319880485534668, 0.0007388591766357422, 0.0008457303047180176, 0.000952601432800293, 0.0010594725608825684, 0.0011663436889648438, 0.0012732148170471191, 0.0013800859451293945, 0.00148695707321167, 0.0015938282012939453, 0.0017006993293762207, 0.001807570457458496, 0.0019144415855407715, 0.002021312713623047, 0.0021281838417053223, 0.0022350549697875977, 0.002341926097869873, 0.0024487972259521484, 0.002555668354034424, 0.0026625394821166992, 0.0027694106101989746, 0.00287628173828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 11.0, 18.0, 29.0, 50.0, 82.0, 164.0, 268.0, 651.0, 1603.0, 5396.0, 33723.0, 617344.0, 359321.0, 23113.0, 4306.0, 1334.0, 531.0, 282.0, 125.0, 67.0, 48.0, 25.0, 13.0, 13.0, 12.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1749267578125, -8.857666015625, -8.5404052734375, -8.22314453125, -7.9058837890625, -7.588623046875, -7.2713623046875, -6.9541015625, -6.6368408203125, -6.319580078125, -6.0023193359375, -5.68505859375, -5.3677978515625, -5.050537109375, -4.7332763671875, -4.416015625, -4.0987548828125, -3.781494140625, -3.4642333984375, -3.14697265625, -2.8297119140625, -2.512451171875, -2.1951904296875, -1.8779296875, -1.5606689453125, -1.243408203125, -0.9261474609375, -0.60888671875, -0.2916259765625, 0.025634765625, 0.3428955078125, 0.66015625, 0.9774169921875, 1.294677734375, 1.6119384765625, 1.92919921875, 2.2464599609375, 2.563720703125, 2.8809814453125, 3.1982421875, 3.5155029296875, 3.832763671875, 4.1500244140625, 4.46728515625, 4.7845458984375, 5.101806640625, 5.4190673828125, 5.736328125, 6.0535888671875, 6.370849609375, 6.6881103515625, 7.00537109375, 7.3226318359375, 7.639892578125, 7.9571533203125, 8.2744140625, 8.5916748046875, 8.908935546875, 9.2261962890625, 9.54345703125, 9.8607177734375, 10.177978515625, 10.4952392578125, 10.8125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 3.0, 4.0, 9.0, 12.0, 17.0, 19.0, 21.0, 29.0, 45.0, 68.0, 69.0, 85.0, 97.0, 87.0, 88.0, 85.0, 66.0, 55.0, 34.0, 30.0, 24.0, 14.0, 8.0, 5.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9454345703125, -5.750244140625, -5.5550537109375, -5.35986328125, -5.1646728515625, -4.969482421875, -4.7742919921875, -4.5791015625, -4.3839111328125, -4.188720703125, -3.9935302734375, -3.79833984375, -3.6031494140625, -3.407958984375, -3.2127685546875, -3.017578125, -2.8223876953125, -2.627197265625, -2.4320068359375, -2.23681640625, -2.0416259765625, -1.846435546875, -1.6512451171875, -1.4560546875, -1.2608642578125, -1.065673828125, -0.8704833984375, -0.67529296875, -0.4801025390625, -0.284912109375, -0.0897216796875, 0.10546875, 0.3006591796875, 0.495849609375, 0.6910400390625, 0.88623046875, 1.0814208984375, 1.276611328125, 1.4718017578125, 1.6669921875, 1.8621826171875, 2.057373046875, 2.2525634765625, 2.44775390625, 2.6429443359375, 2.838134765625, 3.0333251953125, 3.228515625, 3.4237060546875, 3.618896484375, 3.8140869140625, 4.00927734375, 4.2044677734375, 4.399658203125, 4.5948486328125, 4.7900390625, 4.9852294921875, 5.180419921875, 5.3756103515625, 5.57080078125, 5.7659912109375, 5.961181640625, 6.1563720703125, 6.3515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 4.0, 7.0, 20.0, 37.0, 61.0, 95.0, 124.0, 175.0, 169.0, 114.0, 66.0, 39.0, 38.0, 12.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-131.46990966796875, -127.91560363769531, -124.3613052368164, -120.80699920654297, -117.25269317626953, -113.69839477539062, -110.14408874511719, -106.58978271484375, -103.03548431396484, -99.4811782836914, -95.9268798828125, -92.37257385253906, -88.81826782226562, -85.26396942138672, -81.70966339111328, -78.15536499023438, -74.60105895996094, -71.0467529296875, -67.4924545288086, -63.938148498535156, -60.383846282958984, -56.82954406738281, -53.275238037109375, -49.7209358215332, -46.1666259765625, -42.61232376098633, -39.05801773071289, -35.50371551513672, -31.949413299560547, -28.395109176635742, -24.840805053710938, -21.286502838134766, -17.732200622558594, -14.177897453308105, -10.623594284057617, -7.0692901611328125, -3.514986991882324, 0.03931617736816406, 3.5936203002929688, 7.147922515869141, 10.702226638793945, 14.256529808044434, 17.810832977294922, 21.365137100219727, 24.91944122314453, 28.473743438720703, 32.028045654296875, 35.58235168457031, 39.136653900146484, 42.690956115722656, 46.245262145996094, 49.799564361572266, 53.35386657714844, 56.908172607421875, 60.46247482299805, 64.01677703857422, 67.57108306884766, 71.1253890991211, 74.6796875, 78.23399353027344, 81.78829956054688, 85.34259796142578, 88.89690399169922, 92.45120239257812, 96.00550842285156]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 9.0, 6.0, 13.0, 12.0, 16.0, 13.0, 19.0, 24.0, 25.0, 31.0, 32.0, 35.0, 35.0, 49.0, 48.0, 30.0, 57.0, 63.0, 55.0, 50.0, 52.0, 43.0, 37.0, 36.0, 28.0, 17.0, 30.0, 16.0, 23.0, 16.0, 11.0, 11.0, 10.0, 12.0, 6.0, 4.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-77.99589538574219, -75.7314224243164, -73.46694946289062, -71.20246887207031, -68.93799591064453, -66.67352294921875, -64.40904235839844, -62.144569396972656, -59.880096435546875, -57.615623474121094, -55.35114669799805, -53.086669921875, -50.82219696044922, -48.55772399902344, -46.29324722290039, -44.028770446777344, -41.76429748535156, -39.49982452392578, -37.235347747802734, -34.97087097167969, -32.706398010253906, -30.441923141479492, -28.177448272705078, -25.912973403930664, -23.64849853515625, -21.384023666381836, -19.119548797607422, -16.855073928833008, -14.590599060058594, -12.32612419128418, -10.061649322509766, -7.797174453735352, -5.5326995849609375, -3.2682247161865234, -1.0037498474121094, 1.2607250213623047, 3.5251998901367188, 5.789674758911133, 8.054149627685547, 10.318624496459961, 12.583099365234375, 14.847574234008789, 17.112049102783203, 19.376523971557617, 21.64099884033203, 23.905473709106445, 26.16994857788086, 28.434423446655273, 30.698898315429688, 32.96337127685547, 35.227848052978516, 37.49232482910156, 39.756797790527344, 42.021270751953125, 44.28574752807617, 46.55022430419922, 48.814697265625, 51.07917022705078, 53.34364700317383, 55.608123779296875, 57.872596740722656, 60.13706970214844, 62.401546478271484, 64.66602325439453, 66.93049621582031]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 18.0, 14.0, 20.0, 34.0, 64.0, 92.0, 167.0, 352.0, 658.0, 1399.0, 3503.0, 9308.0, 30035.0, 134144.0, 1286222.0, 2404793.0, 255695.0, 46486.0, 13141.0, 4636.0, 1785.0, 829.0, 383.0, 180.0, 117.0, 67.0, 46.0, 31.0, 20.0, 9.0, 18.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.109375, -9.829833984375, -9.55029296875, -9.270751953125, -8.9912109375, -8.711669921875, -8.43212890625, -8.152587890625, -7.873046875, -7.593505859375, -7.31396484375, -7.034423828125, -6.7548828125, -6.475341796875, -6.19580078125, -5.916259765625, -5.63671875, -5.357177734375, -5.07763671875, -4.798095703125, -4.5185546875, -4.239013671875, -3.95947265625, -3.679931640625, -3.400390625, -3.120849609375, -2.84130859375, -2.561767578125, -2.2822265625, -2.002685546875, -1.72314453125, -1.443603515625, -1.1640625, -0.884521484375, -0.60498046875, -0.325439453125, -0.0458984375, 0.233642578125, 0.51318359375, 0.792724609375, 1.072265625, 1.351806640625, 1.63134765625, 1.910888671875, 2.1904296875, 2.469970703125, 2.74951171875, 3.029052734375, 3.30859375, 3.588134765625, 3.86767578125, 4.147216796875, 4.4267578125, 4.706298828125, 4.98583984375, 5.265380859375, 5.544921875, 5.824462890625, 6.10400390625, 6.383544921875, 6.6630859375, 6.942626953125, 7.22216796875, 7.501708984375, 7.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 4.0, 7.0, 11.0, 8.0, 18.0, 27.0, 24.0, 28.0, 39.0, 54.0, 59.0, 57.0, 75.0, 74.0, 63.0, 77.0, 55.0, 64.0, 52.0, 40.0, 29.0, 29.0, 28.0, 21.0, 11.0, 11.0, 12.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.561767578125, -4.37353515625, -4.185302734375, -3.9970703125, -3.808837890625, -3.62060546875, -3.432373046875, -3.244140625, -3.055908203125, -2.86767578125, -2.679443359375, -2.4912109375, -2.302978515625, -2.11474609375, -1.926513671875, -1.73828125, -1.550048828125, -1.36181640625, -1.173583984375, -0.9853515625, -0.797119140625, -0.60888671875, -0.420654296875, -0.232421875, -0.044189453125, 0.14404296875, 0.332275390625, 0.5205078125, 0.708740234375, 0.89697265625, 1.085205078125, 1.2734375, 1.461669921875, 1.64990234375, 1.838134765625, 2.0263671875, 2.214599609375, 2.40283203125, 2.591064453125, 2.779296875, 2.967529296875, 3.15576171875, 3.343994140625, 3.5322265625, 3.720458984375, 3.90869140625, 4.096923828125, 4.28515625, 4.473388671875, 4.66162109375, 4.849853515625, 5.0380859375, 5.226318359375, 5.41455078125, 5.602783203125, 5.791015625, 5.979248046875, 6.16748046875, 6.355712890625, 6.5439453125, 6.732177734375, 6.92041015625, 7.108642578125, 7.296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 10.0, 6.0, 26.0, 26.0, 48.0, 62.0, 91.0, 150.0, 336.0, 656.0, 1671.0, 5573.0, 25266.0, 177935.0, 3167089.0, 741605.0, 58363.0, 10596.0, 2745.0, 950.0, 453.0, 228.0, 132.0, 79.0, 46.0, 37.0, 21.0, 18.0, 15.0, 12.0, 11.0, 13.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.75, -17.2918701171875, -16.833740234375, -16.3756103515625, -15.91748046875, -15.4593505859375, -15.001220703125, -14.5430908203125, -14.0849609375, -13.6268310546875, -13.168701171875, -12.7105712890625, -12.25244140625, -11.7943115234375, -11.336181640625, -10.8780517578125, -10.419921875, -9.9617919921875, -9.503662109375, -9.0455322265625, -8.58740234375, -8.1292724609375, -7.671142578125, -7.2130126953125, -6.7548828125, -6.2967529296875, -5.838623046875, -5.3804931640625, -4.92236328125, -4.4642333984375, -4.006103515625, -3.5479736328125, -3.08984375, -2.6317138671875, -2.173583984375, -1.7154541015625, -1.25732421875, -0.7991943359375, -0.341064453125, 0.1170654296875, 0.5751953125, 1.0333251953125, 1.491455078125, 1.9495849609375, 2.40771484375, 2.8658447265625, 3.323974609375, 3.7821044921875, 4.240234375, 4.6983642578125, 5.156494140625, 5.6146240234375, 6.07275390625, 6.5308837890625, 6.989013671875, 7.4471435546875, 7.9052734375, 8.3634033203125, 8.821533203125, 9.2796630859375, 9.73779296875, 10.1959228515625, 10.654052734375, 11.1121826171875, 11.5703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 17.0, 16.0, 32.0, 37.0, 68.0, 80.0, 143.0, 238.0, 393.0, 697.0, 800.0, 623.0, 328.0, 206.0, 111.0, 80.0, 48.0, 45.0, 25.0, 16.0, 16.0, 5.0, 8.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.9241943359375, -13.465576171875, -13.0069580078125, -12.54833984375, -12.0897216796875, -11.631103515625, -11.1724853515625, -10.7138671875, -10.2552490234375, -9.796630859375, -9.3380126953125, -8.87939453125, -8.4207763671875, -7.962158203125, -7.5035400390625, -7.044921875, -6.5863037109375, -6.127685546875, -5.6690673828125, -5.21044921875, -4.7518310546875, -4.293212890625, -3.8345947265625, -3.3759765625, -2.9173583984375, -2.458740234375, -2.0001220703125, -1.54150390625, -1.0828857421875, -0.624267578125, -0.1656494140625, 0.29296875, 0.7515869140625, 1.210205078125, 1.6688232421875, 2.12744140625, 2.5860595703125, 3.044677734375, 3.5032958984375, 3.9619140625, 4.4205322265625, 4.879150390625, 5.3377685546875, 5.79638671875, 6.2550048828125, 6.713623046875, 7.1722412109375, 7.630859375, 8.0894775390625, 8.548095703125, 9.0067138671875, 9.46533203125, 9.9239501953125, 10.382568359375, 10.8411865234375, 11.2998046875, 11.7584228515625, 12.217041015625, 12.6756591796875, 13.13427734375, 13.5928955078125, 14.051513671875, 14.5101318359375, 14.96875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 0.0, 4.0, 4.0, 12.0, 8.0, 17.0, 54.0, 97.0, 181.0, 196.0, 204.0, 121.0, 50.0, 25.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.23287963867188, -143.41714477539062, -138.60140991210938, -133.7856903076172, -128.96995544433594, -124.15422058105469, -119.33848571777344, -114.52275848388672, -109.70703125, -104.89129638671875, -100.07556915283203, -95.25983428955078, -90.44410705566406, -85.62837219238281, -80.81263732910156, -75.99691009521484, -71.1811752319336, -66.36544036865234, -61.549713134765625, -56.733978271484375, -51.918251037597656, -47.102516174316406, -42.28678512573242, -37.47105407714844, -32.65532302856445, -27.83959197998047, -23.023860931396484, -18.208127975463867, -13.392396926879883, -8.576665878295898, -3.7609329223632812, 1.0547981262207031, 5.8705291748046875, 10.686260223388672, 15.501992225646973, 20.317724227905273, 25.133455276489258, 29.949186325073242, 34.76491928100586, 39.580650329589844, 44.39638137817383, 49.21211242675781, 54.0278434753418, 58.84357452392578, 63.65930938720703, 68.47503662109375, 73.290771484375, 78.10650634765625, 82.92223358154297, 87.73796844482422, 92.55369567871094, 97.36943054199219, 102.1851577758789, 107.00089263916016, 111.81661987304688, 116.63235473632812, 121.44808959960938, 126.26382446289062, 131.07955932617188, 135.89527893066406, 140.7110137939453, 145.52674865722656, 150.3424835205078, 155.158203125, 159.97393798828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 17.0, 8.0, 11.0, 16.0, 16.0, 21.0, 15.0, 20.0, 32.0, 32.0, 29.0, 45.0, 30.0, 37.0, 38.0, 49.0, 53.0, 47.0, 56.0, 42.0, 34.0, 46.0, 32.0, 35.0, 39.0, 28.0, 37.0, 20.0, 12.0, 22.0, 16.0, 15.0, 12.0, 8.0, 2.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-58.22266387939453, -56.405364990234375, -54.588069915771484, -52.77077102661133, -50.95347213745117, -49.13617706298828, -47.318878173828125, -45.50157928466797, -43.68428039550781, -41.866981506347656, -40.049686431884766, -38.23238754272461, -36.41508865356445, -34.59779357910156, -32.780494689941406, -30.96319580078125, -29.14590072631836, -27.328603744506836, -25.51130485534668, -23.694007873535156, -21.876708984375, -20.059412002563477, -18.242115020751953, -16.424816131591797, -14.607519149780273, -12.790221214294434, -10.972923278808594, -9.15562629699707, -7.3383283615112305, -5.521030426025391, -3.703733444213867, -1.8864355087280273, -0.06914138793945312, 1.7481563091278076, 3.5654540061950684, 5.38275146484375, 7.20004940032959, 9.01734733581543, 10.834644317626953, 12.651942253112793, 14.469240188598633, 16.286537170410156, 18.103836059570312, 19.921133041381836, 21.73843002319336, 23.555728912353516, 25.37302589416504, 27.190322875976562, 29.00762176513672, 30.824918746948242, 32.642215728759766, 34.45951461791992, 36.27681350708008, 38.09410858154297, 39.911407470703125, 41.72870635986328, 43.54600524902344, 45.363304138183594, 47.180599212646484, 48.99789810180664, 50.8151969909668, 52.63249206542969, 54.449790954589844, 56.26708984375, 58.08438491821289]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 11.0, 9.0, 20.0, 24.0, 54.0, 82.0, 170.0, 290.0, 610.0, 1227.0, 2749.0, 7017.0, 19361.0, 56583.0, 170553.0, 420677.0, 244526.0, 80988.0, 27186.0, 9573.0, 3744.0, 1550.0, 722.0, 381.0, 185.0, 109.0, 65.0, 28.0, 33.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.295654296875, -10.92724609375, -10.558837890625, -10.1904296875, -9.822021484375, -9.45361328125, -9.085205078125, -8.716796875, -8.348388671875, -7.97998046875, -7.611572265625, -7.2431640625, -6.874755859375, -6.50634765625, -6.137939453125, -5.76953125, -5.401123046875, -5.03271484375, -4.664306640625, -4.2958984375, -3.927490234375, -3.55908203125, -3.190673828125, -2.822265625, -2.453857421875, -2.08544921875, -1.717041015625, -1.3486328125, -0.980224609375, -0.61181640625, -0.243408203125, 0.125, 0.493408203125, 0.86181640625, 1.230224609375, 1.5986328125, 1.967041015625, 2.33544921875, 2.703857421875, 3.072265625, 3.440673828125, 3.80908203125, 4.177490234375, 4.5458984375, 4.914306640625, 5.28271484375, 5.651123046875, 6.01953125, 6.387939453125, 6.75634765625, 7.124755859375, 7.4931640625, 7.861572265625, 8.22998046875, 8.598388671875, 8.966796875, 9.335205078125, 9.70361328125, 10.072021484375, 10.4404296875, 10.808837890625, 11.17724609375, 11.545654296875, 11.9140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 10.0, 20.0, 21.0, 32.0, 27.0, 33.0, 46.0, 65.0, 64.0, 78.0, 65.0, 82.0, 62.0, 66.0, 60.0, 47.0, 58.0, 28.0, 27.0, 20.0, 15.0, 13.0, 13.0, 10.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.92987060546875, -4.7347412109375, -4.53961181640625, -4.344482421875, -4.14935302734375, -3.9542236328125, -3.75909423828125, -3.56396484375, -3.36883544921875, -3.1737060546875, -2.97857666015625, -2.783447265625, -2.58831787109375, -2.3931884765625, -2.19805908203125, -2.0029296875, -1.80780029296875, -1.6126708984375, -1.41754150390625, -1.222412109375, -1.02728271484375, -0.8321533203125, -0.63702392578125, -0.44189453125, -0.24676513671875, -0.0516357421875, 0.14349365234375, 0.338623046875, 0.53375244140625, 0.7288818359375, 0.92401123046875, 1.119140625, 1.31427001953125, 1.5093994140625, 1.70452880859375, 1.899658203125, 2.09478759765625, 2.2899169921875, 2.48504638671875, 2.68017578125, 2.87530517578125, 3.0704345703125, 3.26556396484375, 3.460693359375, 3.65582275390625, 3.8509521484375, 4.04608154296875, 4.2412109375, 4.43634033203125, 4.6314697265625, 4.82659912109375, 5.021728515625, 5.21685791015625, 5.4119873046875, 5.60711669921875, 5.80224609375, 5.99737548828125, 6.1925048828125, 6.38763427734375, 6.582763671875, 6.77789306640625, 6.9730224609375, 7.16815185546875, 7.36328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 9.0, 10.0, 18.0, 22.0, 21.0, 54.0, 64.0, 75.0, 117.0, 135.0, 223.0, 320.0, 470.0, 756.0, 1179.0, 2176.0, 5019.0, 20113.0, 142659.0, 725063.0, 121917.0, 17944.0, 4689.0, 2055.0, 1135.0, 726.0, 454.0, 329.0, 234.0, 151.0, 123.0, 88.0, 57.0, 36.0, 25.0, 24.0, 15.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.359375, -19.7509765625, -19.142578125, -18.5341796875, -17.92578125, -17.3173828125, -16.708984375, -16.1005859375, -15.4921875, -14.8837890625, -14.275390625, -13.6669921875, -13.05859375, -12.4501953125, -11.841796875, -11.2333984375, -10.625, -10.0166015625, -9.408203125, -8.7998046875, -8.19140625, -7.5830078125, -6.974609375, -6.3662109375, -5.7578125, -5.1494140625, -4.541015625, -3.9326171875, -3.32421875, -2.7158203125, -2.107421875, -1.4990234375, -0.890625, -0.2822265625, 0.326171875, 0.9345703125, 1.54296875, 2.1513671875, 2.759765625, 3.3681640625, 3.9765625, 4.5849609375, 5.193359375, 5.8017578125, 6.41015625, 7.0185546875, 7.626953125, 8.2353515625, 8.84375, 9.4521484375, 10.060546875, 10.6689453125, 11.27734375, 11.8857421875, 12.494140625, 13.1025390625, 13.7109375, 14.3193359375, 14.927734375, 15.5361328125, 16.14453125, 16.7529296875, 17.361328125, 17.9697265625, 18.578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 9.0, 6.0, 13.0, 17.0, 6.0, 29.0, 29.0, 25.0, 32.0, 25.0, 43.0, 40.0, 36.0, 53.0, 55.0, 45.0, 55.0, 51.0, 32.0, 47.0, 40.0, 37.0, 36.0, 25.0, 33.0, 24.0, 22.0, 14.0, 21.0, 14.0, 13.0, 11.0, 3.0, 5.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.585205078125, -16.98291015625, -16.380615234375, -15.7783203125, -15.176025390625, -14.57373046875, -13.971435546875, -13.369140625, -12.766845703125, -12.16455078125, -11.562255859375, -10.9599609375, -10.357666015625, -9.75537109375, -9.153076171875, -8.55078125, -7.948486328125, -7.34619140625, -6.743896484375, -6.1416015625, -5.539306640625, -4.93701171875, -4.334716796875, -3.732421875, -3.130126953125, -2.52783203125, -1.925537109375, -1.3232421875, -0.720947265625, -0.11865234375, 0.483642578125, 1.0859375, 1.688232421875, 2.29052734375, 2.892822265625, 3.4951171875, 4.097412109375, 4.69970703125, 5.302001953125, 5.904296875, 6.506591796875, 7.10888671875, 7.711181640625, 8.3134765625, 8.915771484375, 9.51806640625, 10.120361328125, 10.72265625, 11.324951171875, 11.92724609375, 12.529541015625, 13.1318359375, 13.734130859375, 14.33642578125, 14.938720703125, 15.541015625, 16.143310546875, 16.74560546875, 17.347900390625, 17.9501953125, 18.552490234375, 19.15478515625, 19.757080078125, 20.359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 12.0, 7.0, 5.0, 8.0, 11.0, 16.0, 21.0, 27.0, 30.0, 62.0, 101.0, 135.0, 298.0, 573.0, 1263.0, 3628.0, 13664.0, 76666.0, 673072.0, 234165.0, 33572.0, 7319.0, 2073.0, 847.0, 399.0, 188.0, 136.0, 78.0, 53.0, 36.0, 26.0, 16.0, 19.0, 8.0, 6.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.8717041015625, -5.680908203125, -5.4901123046875, -5.29931640625, -5.1085205078125, -4.917724609375, -4.7269287109375, -4.5361328125, -4.3453369140625, -4.154541015625, -3.9637451171875, -3.77294921875, -3.5821533203125, -3.391357421875, -3.2005615234375, -3.009765625, -2.8189697265625, -2.628173828125, -2.4373779296875, -2.24658203125, -2.0557861328125, -1.864990234375, -1.6741943359375, -1.4833984375, -1.2926025390625, -1.101806640625, -0.9110107421875, -0.72021484375, -0.5294189453125, -0.338623046875, -0.1478271484375, 0.04296875, 0.2337646484375, 0.424560546875, 0.6153564453125, 0.80615234375, 0.9969482421875, 1.187744140625, 1.3785400390625, 1.5693359375, 1.7601318359375, 1.950927734375, 2.1417236328125, 2.33251953125, 2.5233154296875, 2.714111328125, 2.9049072265625, 3.095703125, 3.2864990234375, 3.477294921875, 3.6680908203125, 3.85888671875, 4.0496826171875, 4.240478515625, 4.4312744140625, 4.6220703125, 4.8128662109375, 5.003662109375, 5.1944580078125, 5.38525390625, 5.5760498046875, 5.766845703125, 5.9576416015625, 6.1484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 12.0, 15.0, 16.0, 28.0, 27.0, 37.0, 39.0, 65.0, 84.0, 125.0, 154.0, 98.0, 47.0, 55.0, 38.0, 32.0, 24.0, 19.0, 19.0, 10.0, 4.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012731552124023438, -0.0012280046939849854, -0.001182854175567627, -0.0011377036571502686, -0.0010925531387329102, -0.0010474026203155518, -0.0010022521018981934, -0.000957101583480835, -0.0009119510650634766, -0.0008668005466461182, -0.0008216500282287598, -0.0007764995098114014, -0.000731348991394043, -0.0006861984729766846, -0.0006410479545593262, -0.0005958974361419678, -0.0005507469177246094, -0.000505596399307251, -0.0004604458808898926, -0.0004152953624725342, -0.0003701448440551758, -0.0003249943256378174, -0.000279843807220459, -0.00023469328880310059, -0.0001895427703857422, -0.0001443922519683838, -9.924173355102539e-05, -5.409121513366699e-05, -8.940696716308594e-06, 3.6209821701049805e-05, 8.13603401184082e-05, 0.0001265108585357666, 0.000171661376953125, 0.0002168118953704834, 0.0002619624137878418, 0.0003071129322052002, 0.0003522634506225586, 0.000397413969039917, 0.0004425644874572754, 0.0004877150058746338, 0.0005328655242919922, 0.0005780160427093506, 0.000623166561126709, 0.0006683170795440674, 0.0007134675979614258, 0.0007586181163787842, 0.0008037686347961426, 0.000848919153213501, 0.0008940696716308594, 0.0009392201900482178, 0.0009843707084655762, 0.0010295212268829346, 0.001074671745300293, 0.0011198222637176514, 0.0011649727821350098, 0.0012101233005523682, 0.0012552738189697266, 0.001300424337387085, 0.0013455748558044434, 0.0013907253742218018, 0.0014358758926391602, 0.0014810264110565186, 0.001526176929473877, 0.0015713274478912354, 0.0016164779663085938]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 11.0, 14.0, 22.0, 18.0, 26.0, 45.0, 86.0, 105.0, 186.0, 328.0, 530.0, 949.0, 2197.0, 5619.0, 21237.0, 155382.0, 734398.0, 102818.0, 16091.0, 4462.0, 1758.0, 900.0, 517.0, 299.0, 179.0, 127.0, 67.0, 64.0, 35.0, 30.0, 18.0, 12.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.30780029296875, -5.1273193359375, -4.94683837890625, -4.766357421875, -4.58587646484375, -4.4053955078125, -4.22491455078125, -4.04443359375, -3.86395263671875, -3.6834716796875, -3.50299072265625, -3.322509765625, -3.14202880859375, -2.9615478515625, -2.78106689453125, -2.6005859375, -2.42010498046875, -2.2396240234375, -2.05914306640625, -1.878662109375, -1.69818115234375, -1.5177001953125, -1.33721923828125, -1.15673828125, -0.97625732421875, -0.7957763671875, -0.61529541015625, -0.434814453125, -0.25433349609375, -0.0738525390625, 0.10662841796875, 0.287109375, 0.46759033203125, 0.6480712890625, 0.82855224609375, 1.009033203125, 1.18951416015625, 1.3699951171875, 1.55047607421875, 1.73095703125, 1.91143798828125, 2.0919189453125, 2.27239990234375, 2.452880859375, 2.63336181640625, 2.8138427734375, 2.99432373046875, 3.1748046875, 3.35528564453125, 3.5357666015625, 3.71624755859375, 3.896728515625, 4.07720947265625, 4.2576904296875, 4.43817138671875, 4.61865234375, 4.79913330078125, 4.9796142578125, 5.16009521484375, 5.340576171875, 5.52105712890625, 5.7015380859375, 5.88201904296875, 6.0625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 1.0, 5.0, 3.0, 9.0, 8.0, 6.0, 2.0, 13.0, 14.0, 20.0, 21.0, 28.0, 34.0, 38.0, 41.0, 44.0, 63.0, 49.0, 62.0, 53.0, 52.0, 63.0, 52.0, 47.0, 42.0, 34.0, 24.0, 27.0, 32.0, 19.0, 24.0, 14.0, 5.0, 6.0, 5.0, 7.0, 3.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.634765625, -3.519287109375, -3.40380859375, -3.288330078125, -3.1728515625, -3.057373046875, -2.94189453125, -2.826416015625, -2.7109375, -2.595458984375, -2.47998046875, -2.364501953125, -2.2490234375, -2.133544921875, -2.01806640625, -1.902587890625, -1.787109375, -1.671630859375, -1.55615234375, -1.440673828125, -1.3251953125, -1.209716796875, -1.09423828125, -0.978759765625, -0.86328125, -0.747802734375, -0.63232421875, -0.516845703125, -0.4013671875, -0.285888671875, -0.17041015625, -0.054931640625, 0.060546875, 0.176025390625, 0.29150390625, 0.406982421875, 0.5224609375, 0.637939453125, 0.75341796875, 0.868896484375, 0.984375, 1.099853515625, 1.21533203125, 1.330810546875, 1.4462890625, 1.561767578125, 1.67724609375, 1.792724609375, 1.908203125, 2.023681640625, 2.13916015625, 2.254638671875, 2.3701171875, 2.485595703125, 2.60107421875, 2.716552734375, 2.83203125, 2.947509765625, 3.06298828125, 3.178466796875, 3.2939453125, 3.409423828125, 3.52490234375, 3.640380859375, 3.755859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 25.0, 51.0, 134.0, 243.0, 330.0, 123.0, 42.0, 21.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.59625244140625, -271.1712341308594, -264.7462158203125, -258.3211975097656, -251.89617919921875, -245.47116088867188, -239.046142578125, -232.62112426757812, -226.19610595703125, -219.77108764648438, -213.3460693359375, -206.92105102539062, -200.49603271484375, -194.07101440429688, -187.64599609375, -181.22097778320312, -174.79595947265625, -168.37094116210938, -161.9459228515625, -155.52090454101562, -149.09588623046875, -142.67086791992188, -136.245849609375, -129.82083129882812, -123.39579772949219, -116.97077941894531, -110.54576110839844, -104.12074279785156, -97.69572448730469, -91.27070617675781, -84.84568786621094, -78.42066955566406, -71.99565124511719, -65.57063293457031, -59.14561462402344, -52.72059631347656, -46.29557800292969, -39.87055587768555, -33.44553756713867, -27.020519256591797, -20.595500946044922, -14.170482635498047, -7.7454633712768555, -1.320444107055664, 5.104574203491211, 11.529594421386719, 17.954612731933594, 24.37963104248047, 30.804649353027344, 37.22966766357422, 43.654685974121094, 50.07970428466797, 56.504722595214844, 62.929744720458984, 69.35476684570312, 75.77978515625, 82.20480346679688, 88.62982177734375, 95.05484008789062, 101.4798583984375, 107.90487670898438, 114.32989501953125, 120.75491333007812, 127.179931640625, 133.60494995117188]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 8.0, 10.0, 12.0, 13.0, 18.0, 23.0, 18.0, 26.0, 28.0, 27.0, 41.0, 41.0, 46.0, 54.0, 69.0, 88.0, 87.0, 53.0, 49.0, 40.0, 32.0, 34.0, 40.0, 32.0, 22.0, 22.0, 17.0, 9.0, 6.0, 11.0, 6.0, 11.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.84745025634766, -80.99778747558594, -78.14812469482422, -75.2984619140625, -72.44879913330078, -69.59913635253906, -66.74946594238281, -63.89980697631836, -61.05014419555664, -58.20048141479492, -55.3508186340332, -52.50115203857422, -49.6514892578125, -46.80182647705078, -43.95216369628906, -41.102500915527344, -38.252838134765625, -35.403175354003906, -32.55351257324219, -29.703847885131836, -26.854185104370117, -24.0045223236084, -21.154857635498047, -18.305194854736328, -15.45553207397461, -12.60586929321289, -9.756205558776855, -6.90654182434082, -4.056879043579102, -1.2072162628173828, 1.6424484252929688, 4.4921112060546875, 7.341773986816406, 10.191436767578125, 13.04110050201416, 15.890764236450195, 18.740427017211914, 21.590089797973633, 24.439754486083984, 27.289417266845703, 30.139080047607422, 32.98874282836914, 35.83840560913086, 38.688072204589844, 41.53773498535156, 44.38739776611328, 47.237060546875, 50.08672332763672, 52.93638610839844, 55.786048889160156, 58.635711669921875, 61.485374450683594, 64.33503723144531, 67.18470001220703, 70.03436279296875, 72.884033203125, 75.73368835449219, 78.5833511352539, 81.43301391601562, 84.28267669677734, 87.13233947753906, 89.98200225830078, 92.8316650390625, 95.68133544921875, 98.53099822998047]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 12.0, 26.0, 40.0, 83.0, 149.0, 323.0, 742.0, 1787.0, 4393.0, 12485.0, 40840.0, 222417.0, 2410718.0, 1336251.0, 123819.0, 26695.0, 8242.0, 3046.0, 1151.0, 520.0, 205.0, 129.0, 68.0, 41.0, 21.0, 18.0, 16.0, 16.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.43096923828125, -5.1705322265625, -4.91009521484375, -4.649658203125, -4.38922119140625, -4.1287841796875, -3.86834716796875, -3.60791015625, -3.34747314453125, -3.0870361328125, -2.82659912109375, -2.566162109375, -2.30572509765625, -2.0452880859375, -1.78485107421875, -1.5244140625, -1.26397705078125, -1.0035400390625, -0.74310302734375, -0.482666015625, -0.22222900390625, 0.0382080078125, 0.29864501953125, 0.55908203125, 0.81951904296875, 1.0799560546875, 1.34039306640625, 1.600830078125, 1.86126708984375, 2.1217041015625, 2.38214111328125, 2.642578125, 2.90301513671875, 3.1634521484375, 3.42388916015625, 3.684326171875, 3.94476318359375, 4.2052001953125, 4.46563720703125, 4.72607421875, 4.98651123046875, 5.2469482421875, 5.50738525390625, 5.767822265625, 6.02825927734375, 6.2886962890625, 6.54913330078125, 6.8095703125, 7.07000732421875, 7.3304443359375, 7.59088134765625, 7.851318359375, 8.11175537109375, 8.3721923828125, 8.63262939453125, 8.89306640625, 9.15350341796875, 9.4139404296875, 9.67437744140625, 9.934814453125, 10.19525146484375, 10.4556884765625, 10.71612548828125, 10.9765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 20.0, 26.0, 38.0, 39.0, 89.0, 81.0, 86.0, 113.0, 85.0, 107.0, 67.0, 92.0, 44.0, 36.0, 23.0, 16.0, 15.0, 3.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.00933837890625, -3.7257080078125, -3.44207763671875, -3.158447265625, -2.87481689453125, -2.5911865234375, -2.30755615234375, -2.02392578125, -1.74029541015625, -1.4566650390625, -1.17303466796875, -0.889404296875, -0.60577392578125, -0.3221435546875, -0.03851318359375, 0.2451171875, 0.52874755859375, 0.8123779296875, 1.09600830078125, 1.379638671875, 1.66326904296875, 1.9468994140625, 2.23052978515625, 2.51416015625, 2.79779052734375, 3.0814208984375, 3.36505126953125, 3.648681640625, 3.93231201171875, 4.2159423828125, 4.49957275390625, 4.783203125, 5.06683349609375, 5.3504638671875, 5.63409423828125, 5.917724609375, 6.20135498046875, 6.4849853515625, 6.76861572265625, 7.05224609375, 7.33587646484375, 7.6195068359375, 7.90313720703125, 8.186767578125, 8.47039794921875, 8.7540283203125, 9.03765869140625, 9.3212890625, 9.60491943359375, 9.8885498046875, 10.17218017578125, 10.455810546875, 10.73944091796875, 11.0230712890625, 11.30670166015625, 11.59033203125, 11.87396240234375, 12.1575927734375, 12.44122314453125, 12.724853515625, 13.00848388671875, 13.2921142578125, 13.57574462890625, 13.859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 2.0, 8.0, 8.0, 17.0, 12.0, 22.0, 37.0, 43.0, 66.0, 99.0, 152.0, 263.0, 380.0, 676.0, 1296.0, 2921.0, 7210.0, 22074.0, 88521.0, 820008.0, 2937293.0, 247634.0, 44517.0, 12480.0, 4422.0, 1795.0, 899.0, 482.0, 303.0, 187.0, 124.0, 79.0, 53.0, 54.0, 38.0, 18.0, 23.0, 12.0, 11.0, 7.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.6640625, -10.343505859375, -10.02294921875, -9.702392578125, -9.3818359375, -9.061279296875, -8.74072265625, -8.420166015625, -8.099609375, -7.779052734375, -7.45849609375, -7.137939453125, -6.8173828125, -6.496826171875, -6.17626953125, -5.855712890625, -5.53515625, -5.214599609375, -4.89404296875, -4.573486328125, -4.2529296875, -3.932373046875, -3.61181640625, -3.291259765625, -2.970703125, -2.650146484375, -2.32958984375, -2.009033203125, -1.6884765625, -1.367919921875, -1.04736328125, -0.726806640625, -0.40625, -0.085693359375, 0.23486328125, 0.555419921875, 0.8759765625, 1.196533203125, 1.51708984375, 1.837646484375, 2.158203125, 2.478759765625, 2.79931640625, 3.119873046875, 3.4404296875, 3.760986328125, 4.08154296875, 4.402099609375, 4.72265625, 5.043212890625, 5.36376953125, 5.684326171875, 6.0048828125, 6.325439453125, 6.64599609375, 6.966552734375, 7.287109375, 7.607666015625, 7.92822265625, 8.248779296875, 8.5693359375, 8.889892578125, 9.21044921875, 9.531005859375, 9.8515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 4.0, 9.0, 11.0, 10.0, 22.0, 36.0, 39.0, 59.0, 81.0, 134.0, 203.0, 327.0, 561.0, 784.0, 631.0, 415.0, 230.0, 157.0, 105.0, 67.0, 50.0, 32.0, 29.0, 12.0, 15.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.9473876953125, -10.590087890625, -10.2327880859375, -9.87548828125, -9.5181884765625, -9.160888671875, -8.8035888671875, -8.4462890625, -8.0889892578125, -7.731689453125, -7.3743896484375, -7.01708984375, -6.6597900390625, -6.302490234375, -5.9451904296875, -5.587890625, -5.2305908203125, -4.873291015625, -4.5159912109375, -4.15869140625, -3.8013916015625, -3.444091796875, -3.0867919921875, -2.7294921875, -2.3721923828125, -2.014892578125, -1.6575927734375, -1.30029296875, -0.9429931640625, -0.585693359375, -0.2283935546875, 0.12890625, 0.4862060546875, 0.843505859375, 1.2008056640625, 1.55810546875, 1.9154052734375, 2.272705078125, 2.6300048828125, 2.9873046875, 3.3446044921875, 3.701904296875, 4.0592041015625, 4.41650390625, 4.7738037109375, 5.131103515625, 5.4884033203125, 5.845703125, 6.2030029296875, 6.560302734375, 6.9176025390625, 7.27490234375, 7.6322021484375, 7.989501953125, 8.3468017578125, 8.7041015625, 9.0614013671875, 9.418701171875, 9.7760009765625, 10.13330078125, 10.4906005859375, 10.847900390625, 11.2052001953125, 11.5625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 7.0, 33.0, 95.0, 242.0, 296.0, 195.0, 83.0, 24.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.0605163574219, -269.6875305175781, -263.3145751953125, -256.94158935546875, -250.56863403320312, -244.19564819335938, -237.8226776123047, -231.44970703125, -225.0767364501953, -218.70376586914062, -212.33079528808594, -205.95782470703125, -199.5848388671875, -193.2118682861328, -186.83889770507812, -180.46592712402344, -174.09295654296875, -167.71998596191406, -161.34701538085938, -154.9740447998047, -148.60107421875, -142.22808837890625, -135.85511779785156, -129.48214721679688, -123.10917663574219, -116.7362060546875, -110.36323547363281, -103.9902572631836, -97.6172866821289, -91.24431610107422, -84.871337890625, -78.49836730957031, -72.12541198730469, -65.75244140625, -59.37946701049805, -53.006492614746094, -46.633522033691406, -40.26055145263672, -33.887577056884766, -27.514602661132812, -21.141632080078125, -14.768659591674805, -8.395687103271484, -2.022714614868164, 4.350257873535156, 10.723230361938477, 17.096202850341797, 23.46917724609375, 29.842147827148438, 36.215118408203125, 42.58809280395508, 48.96106719970703, 55.33403778076172, 61.707008361816406, 68.07998657226562, 74.45295715332031, 80.825927734375, 87.19889831542969, 93.57186889648438, 99.9448471069336, 106.31781768798828, 112.69078826904297, 119.06376647949219, 125.43673706054688, 131.80970764160156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 1.0, 8.0, 7.0, 17.0, 25.0, 26.0, 37.0, 49.0, 50.0, 70.0, 74.0, 74.0, 83.0, 85.0, 72.0, 68.0, 58.0, 41.0, 49.0, 27.0, 25.0, 13.0, 8.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.61972045898438, -89.03205871582031, -86.44438934326172, -83.85671997070312, -81.26905822753906, -78.681396484375, -76.0937271118164, -73.50605773925781, -70.91839599609375, -68.33073425292969, -65.7430648803711, -63.155399322509766, -60.56773376464844, -57.98006820678711, -55.39240264892578, -52.80473709106445, -50.217071533203125, -47.6294059753418, -45.04174041748047, -42.45407485961914, -39.86640930175781, -37.278743743896484, -34.691078186035156, -32.10341262817383, -29.5157470703125, -26.928081512451172, -24.340415954589844, -21.752750396728516, -19.165084838867188, -16.57741928100586, -13.989753723144531, -11.402088165283203, -8.814422607421875, -6.226757049560547, -3.6390914916992188, -1.0514259338378906, 1.5362396240234375, 4.123905181884766, 6.711570739746094, 9.299236297607422, 11.88690185546875, 14.474567413330078, 17.062232971191406, 19.649898529052734, 22.237564086914062, 24.82522964477539, 27.41289520263672, 30.000560760498047, 32.588226318359375, 35.1758918762207, 37.76355743408203, 40.35122299194336, 42.93888854980469, 45.526554107666016, 48.114219665527344, 50.70188522338867, 53.28955078125, 55.87721633911133, 58.464881896972656, 61.052547454833984, 63.64021301269531, 66.22787475585938, 68.81554412841797, 71.40321350097656, 73.99087524414062]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 13.0, 20.0, 23.0, 69.0, 74.0, 125.0, 180.0, 300.0, 501.0, 844.0, 1512.0, 2784.0, 5326.0, 10355.0, 22368.0, 50700.0, 125306.0, 320853.0, 301747.0, 116251.0, 47261.0, 20911.0, 9945.0, 5023.0, 2588.0, 1472.0, 799.0, 465.0, 267.0, 159.0, 99.0, 77.0, 47.0, 26.0, 18.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.8983154296875, -6.632568359375, -6.3668212890625, -6.10107421875, -5.8353271484375, -5.569580078125, -5.3038330078125, -5.0380859375, -4.7723388671875, -4.506591796875, -4.2408447265625, -3.97509765625, -3.7093505859375, -3.443603515625, -3.1778564453125, -2.912109375, -2.6463623046875, -2.380615234375, -2.1148681640625, -1.84912109375, -1.5833740234375, -1.317626953125, -1.0518798828125, -0.7861328125, -0.5203857421875, -0.254638671875, 0.0111083984375, 0.27685546875, 0.5426025390625, 0.808349609375, 1.0740966796875, 1.33984375, 1.6055908203125, 1.871337890625, 2.1370849609375, 2.40283203125, 2.6685791015625, 2.934326171875, 3.2000732421875, 3.4658203125, 3.7315673828125, 3.997314453125, 4.2630615234375, 4.52880859375, 4.7945556640625, 5.060302734375, 5.3260498046875, 5.591796875, 5.8575439453125, 6.123291015625, 6.3890380859375, 6.65478515625, 6.9205322265625, 7.186279296875, 7.4520263671875, 7.7177734375, 7.9835205078125, 8.249267578125, 8.5150146484375, 8.78076171875, 9.0465087890625, 9.312255859375, 9.5780029296875, 9.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 6.0, 9.0, 10.0, 16.0, 18.0, 22.0, 26.0, 25.0, 47.0, 53.0, 48.0, 48.0, 64.0, 74.0, 57.0, 61.0, 49.0, 53.0, 63.0, 49.0, 44.0, 36.0, 30.0, 15.0, 14.0, 17.0, 12.0, 10.0, 6.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.3885498046875, -4.202880859375, -4.0172119140625, -3.83154296875, -3.6458740234375, -3.460205078125, -3.2745361328125, -3.0888671875, -2.9031982421875, -2.717529296875, -2.5318603515625, -2.34619140625, -2.1605224609375, -1.974853515625, -1.7891845703125, -1.603515625, -1.4178466796875, -1.232177734375, -1.0465087890625, -0.86083984375, -0.6751708984375, -0.489501953125, -0.3038330078125, -0.1181640625, 0.0675048828125, 0.253173828125, 0.4388427734375, 0.62451171875, 0.8101806640625, 0.995849609375, 1.1815185546875, 1.3671875, 1.5528564453125, 1.738525390625, 1.9241943359375, 2.10986328125, 2.2955322265625, 2.481201171875, 2.6668701171875, 2.8525390625, 3.0382080078125, 3.223876953125, 3.4095458984375, 3.59521484375, 3.7808837890625, 3.966552734375, 4.1522216796875, 4.337890625, 4.5235595703125, 4.709228515625, 4.8948974609375, 5.08056640625, 5.2662353515625, 5.451904296875, 5.6375732421875, 5.8232421875, 6.0089111328125, 6.194580078125, 6.3802490234375, 6.56591796875, 6.7515869140625, 6.937255859375, 7.1229248046875, 7.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 7.0, 2.0, 4.0, 5.0, 9.0, 16.0, 18.0, 22.0, 33.0, 48.0, 74.0, 91.0, 127.0, 170.0, 278.0, 402.0, 675.0, 1159.0, 2251.0, 5855.0, 23728.0, 181519.0, 730467.0, 79795.0, 13390.0, 3951.0, 1757.0, 946.0, 576.0, 354.0, 255.0, 168.0, 123.0, 79.0, 66.0, 37.0, 22.0, 24.0, 20.0, 12.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.328125, -19.718017578125, -19.10791015625, -18.497802734375, -17.8876953125, -17.277587890625, -16.66748046875, -16.057373046875, -15.447265625, -14.837158203125, -14.22705078125, -13.616943359375, -13.0068359375, -12.396728515625, -11.78662109375, -11.176513671875, -10.56640625, -9.956298828125, -9.34619140625, -8.736083984375, -8.1259765625, -7.515869140625, -6.90576171875, -6.295654296875, -5.685546875, -5.075439453125, -4.46533203125, -3.855224609375, -3.2451171875, -2.635009765625, -2.02490234375, -1.414794921875, -0.8046875, -0.194580078125, 0.41552734375, 1.025634765625, 1.6357421875, 2.245849609375, 2.85595703125, 3.466064453125, 4.076171875, 4.686279296875, 5.29638671875, 5.906494140625, 6.5166015625, 7.126708984375, 7.73681640625, 8.346923828125, 8.95703125, 9.567138671875, 10.17724609375, 10.787353515625, 11.3974609375, 12.007568359375, 12.61767578125, 13.227783203125, 13.837890625, 14.447998046875, 15.05810546875, 15.668212890625, 16.2783203125, 16.888427734375, 17.49853515625, 18.108642578125, 18.71875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 6.0, 10.0, 13.0, 9.0, 14.0, 23.0, 18.0, 17.0, 28.0, 34.0, 37.0, 45.0, 38.0, 49.0, 42.0, 52.0, 50.0, 77.0, 53.0, 54.0, 40.0, 51.0, 33.0, 37.0, 30.0, 25.0, 20.0, 21.0, 13.0, 14.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.782470703125, -16.17431640625, -15.566162109375, -14.9580078125, -14.349853515625, -13.74169921875, -13.133544921875, -12.525390625, -11.917236328125, -11.30908203125, -10.700927734375, -10.0927734375, -9.484619140625, -8.87646484375, -8.268310546875, -7.66015625, -7.052001953125, -6.44384765625, -5.835693359375, -5.2275390625, -4.619384765625, -4.01123046875, -3.403076171875, -2.794921875, -2.186767578125, -1.57861328125, -0.970458984375, -0.3623046875, 0.245849609375, 0.85400390625, 1.462158203125, 2.0703125, 2.678466796875, 3.28662109375, 3.894775390625, 4.5029296875, 5.111083984375, 5.71923828125, 6.327392578125, 6.935546875, 7.543701171875, 8.15185546875, 8.760009765625, 9.3681640625, 9.976318359375, 10.58447265625, 11.192626953125, 11.80078125, 12.408935546875, 13.01708984375, 13.625244140625, 14.2333984375, 14.841552734375, 15.44970703125, 16.057861328125, 16.666015625, 17.274169921875, 17.88232421875, 18.490478515625, 19.0986328125, 19.706787109375, 20.31494140625, 20.923095703125, 21.53125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 11.0, 4.0, 10.0, 14.0, 25.0, 29.0, 49.0, 68.0, 106.0, 181.0, 264.0, 415.0, 742.0, 1317.0, 2693.0, 6693.0, 29652.0, 335434.0, 618651.0, 37633.0, 8033.0, 3023.0, 1451.0, 775.0, 475.0, 296.0, 163.0, 122.0, 70.0, 40.0, 32.0, 19.0, 17.0, 15.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.49432373046875, -5.2659912109375, -5.03765869140625, -4.809326171875, -4.58099365234375, -4.3526611328125, -4.12432861328125, -3.89599609375, -3.66766357421875, -3.4393310546875, -3.21099853515625, -2.982666015625, -2.75433349609375, -2.5260009765625, -2.29766845703125, -2.0693359375, -1.84100341796875, -1.6126708984375, -1.38433837890625, -1.156005859375, -0.92767333984375, -0.6993408203125, -0.47100830078125, -0.24267578125, -0.01434326171875, 0.2139892578125, 0.44232177734375, 0.670654296875, 0.89898681640625, 1.1273193359375, 1.35565185546875, 1.583984375, 1.81231689453125, 2.0406494140625, 2.26898193359375, 2.497314453125, 2.72564697265625, 2.9539794921875, 3.18231201171875, 3.41064453125, 3.63897705078125, 3.8673095703125, 4.09564208984375, 4.323974609375, 4.55230712890625, 4.7806396484375, 5.00897216796875, 5.2373046875, 5.46563720703125, 5.6939697265625, 5.92230224609375, 6.150634765625, 6.37896728515625, 6.6072998046875, 6.83563232421875, 7.06396484375, 7.29229736328125, 7.5206298828125, 7.74896240234375, 7.977294921875, 8.20562744140625, 8.4339599609375, 8.66229248046875, 8.890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 14.0, 35.0, 63.0, 198.0, 456.0, 125.0, 44.0, 26.0, 16.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005268096923828125, -0.005105435848236084, -0.004942774772644043, -0.004780113697052002, -0.004617452621459961, -0.00445479154586792, -0.004292130470275879, -0.004129469394683838, -0.003966808319091797, -0.003804147243499756, -0.003641486167907715, -0.003478825092315674, -0.003316164016723633, -0.003153502941131592, -0.0029908418655395508, -0.0028281807899475098, -0.0026655197143554688, -0.0025028586387634277, -0.0023401975631713867, -0.0021775364875793457, -0.0020148754119873047, -0.0018522143363952637, -0.0016895532608032227, -0.0015268921852111816, -0.0013642311096191406, -0.0012015700340270996, -0.0010389089584350586, -0.0008762478828430176, -0.0007135868072509766, -0.0005509257316589355, -0.00038826465606689453, -0.00022560358047485352, -6.29425048828125e-05, 9.971857070922852e-05, 0.00026237964630126953, 0.00042504072189331055, 0.0005877017974853516, 0.0007503628730773926, 0.0009130239486694336, 0.0010756850242614746, 0.0012383460998535156, 0.0014010071754455566, 0.0015636682510375977, 0.0017263293266296387, 0.0018889904022216797, 0.0020516514778137207, 0.0022143125534057617, 0.0023769736289978027, 0.0025396347045898438, 0.0027022957801818848, 0.0028649568557739258, 0.003027617931365967, 0.003190279006958008, 0.003352940082550049, 0.00351560115814209, 0.003678262233734131, 0.003840923309326172, 0.004003584384918213, 0.004166245460510254, 0.004328906536102295, 0.004491567611694336, 0.004654228687286377, 0.004816889762878418, 0.004979550838470459, 0.0051422119140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 11.0, 29.0, 47.0, 76.0, 137.0, 306.0, 787.0, 2554.0, 16868.0, 936504.0, 83914.0, 5144.0, 1257.0, 467.0, 179.0, 93.0, 53.0, 36.0, 23.0, 19.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.4375, -17.94873046875, -17.4599609375, -16.97119140625, -16.482421875, -15.99365234375, -15.5048828125, -15.01611328125, -14.52734375, -14.03857421875, -13.5498046875, -13.06103515625, -12.572265625, -12.08349609375, -11.5947265625, -11.10595703125, -10.6171875, -10.12841796875, -9.6396484375, -9.15087890625, -8.662109375, -8.17333984375, -7.6845703125, -7.19580078125, -6.70703125, -6.21826171875, -5.7294921875, -5.24072265625, -4.751953125, -4.26318359375, -3.7744140625, -3.28564453125, -2.796875, -2.30810546875, -1.8193359375, -1.33056640625, -0.841796875, -0.35302734375, 0.1357421875, 0.62451171875, 1.11328125, 1.60205078125, 2.0908203125, 2.57958984375, 3.068359375, 3.55712890625, 4.0458984375, 4.53466796875, 5.0234375, 5.51220703125, 6.0009765625, 6.48974609375, 6.978515625, 7.46728515625, 7.9560546875, 8.44482421875, 8.93359375, 9.42236328125, 9.9111328125, 10.39990234375, 10.888671875, 11.37744140625, 11.8662109375, 12.35498046875, 12.84375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 6.0, 14.0, 20.0, 31.0, 78.0, 138.0, 194.0, 210.0, 139.0, 64.0, 37.0, 23.0, 9.0, 12.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -11.0296630859375, -10.723388671875, -10.4171142578125, -10.11083984375, -9.8045654296875, -9.498291015625, -9.1920166015625, -8.8857421875, -8.5794677734375, -8.273193359375, -7.9669189453125, -7.66064453125, -7.3543701171875, -7.048095703125, -6.7418212890625, -6.435546875, -6.1292724609375, -5.822998046875, -5.5167236328125, -5.21044921875, -4.9041748046875, -4.597900390625, -4.2916259765625, -3.9853515625, -3.6790771484375, -3.372802734375, -3.0665283203125, -2.76025390625, -2.4539794921875, -2.147705078125, -1.8414306640625, -1.53515625, -1.2288818359375, -0.922607421875, -0.6163330078125, -0.31005859375, -0.0037841796875, 0.302490234375, 0.6087646484375, 0.9150390625, 1.2213134765625, 1.527587890625, 1.8338623046875, 2.14013671875, 2.4464111328125, 2.752685546875, 3.0589599609375, 3.365234375, 3.6715087890625, 3.977783203125, 4.2840576171875, 4.59033203125, 4.8966064453125, 5.202880859375, 5.5091552734375, 5.8154296875, 6.1217041015625, 6.427978515625, 6.7342529296875, 7.04052734375, 7.3468017578125, 7.653076171875, 7.9593505859375, 8.265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 15.0, 37.0, 72.0, 157.0, 264.0, 204.0, 117.0, 56.0, 31.0, 17.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.45606994628906, -123.65691375732422, -118.8577651977539, -114.05860900878906, -109.25946044921875, -104.4603042602539, -99.66114807128906, -94.86199951171875, -90.0628433227539, -85.26368713378906, -80.46453857421875, -75.6653823852539, -70.86622619628906, -66.06707763671875, -61.267921447753906, -56.46876907348633, -51.66961669921875, -46.87046432495117, -42.071311950683594, -37.27215576171875, -32.47300338745117, -27.673851013183594, -22.874696731567383, -18.075542449951172, -13.276390075683594, -8.4772367477417, -3.6780834197998047, 1.1210699081420898, 5.920223236083984, 10.719375610351562, 15.518529891967773, 20.317684173583984, 25.1168212890625, 29.915973663330078, 34.715126037597656, 39.5142822265625, 44.31343460083008, 49.112586975097656, 53.9117431640625, 58.71089553833008, 63.510047912597656, 68.3092041015625, 73.10835266113281, 77.90750885009766, 82.7066650390625, 87.50581359863281, 92.30496978759766, 97.1041259765625, 101.90327453613281, 106.70243072509766, 111.50157928466797, 116.30073547363281, 121.09988403320312, 125.89904022216797, 130.6981964111328, 135.49734497070312, 140.2965087890625, 145.0956573486328, 149.8948211669922, 154.6939697265625, 159.4931182861328, 164.29226684570312, 169.0914306640625, 173.8905792236328, 178.68972778320312]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 13.0, 5.0, 11.0, 9.0, 11.0, 12.0, 11.0, 19.0, 21.0, 14.0, 25.0, 19.0, 20.0, 24.0, 32.0, 42.0, 55.0, 59.0, 65.0, 66.0, 58.0, 51.0, 41.0, 26.0, 28.0, 37.0, 21.0, 19.0, 24.0, 21.0, 14.0, 15.0, 21.0, 15.0, 13.0, 6.0, 5.0, 7.0, 13.0, 10.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-62.65190887451172, -60.691123962402344, -58.730342864990234, -56.76955795288086, -54.80877685546875, -52.847991943359375, -50.88720703125, -48.926422119140625, -46.965641021728516, -45.00485610961914, -43.04407501220703, -41.083290100097656, -39.12250518798828, -37.16172409057617, -35.2009391784668, -33.24015808105469, -31.279373168945312, -29.31859016418457, -27.357807159423828, -25.397022247314453, -23.43623924255371, -21.47545623779297, -19.514671325683594, -17.55388832092285, -15.59310531616211, -13.632322311401367, -11.671538352966309, -9.71075439453125, -7.749971389770508, -5.789188385009766, -3.828404426574707, -1.8676204681396484, 0.09316253662109375, 2.053946018218994, 4.0147294998168945, 5.975512981414795, 7.936296463012695, 9.897079467773438, 11.857863426208496, 13.818647384643555, 15.779430389404297, 17.74021339416504, 19.70099639892578, 21.661781311035156, 23.6225643157959, 25.58334732055664, 27.544132232666016, 29.504915237426758, 31.4656982421875, 33.426483154296875, 35.387264251708984, 37.34804916381836, 39.30883026123047, 41.269615173339844, 43.23040008544922, 45.191184997558594, 47.1519660949707, 49.11275100708008, 51.07353210449219, 53.03431701660156, 54.99510192871094, 56.95588302612305, 58.91666793823242, 60.87744903564453, 62.838233947753906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 12.0, 33.0, 38.0, 59.0, 98.0, 154.0, 242.0, 396.0, 598.0, 1149.0, 2162.0, 4373.0, 10423.0, 31826.0, 173013.0, 1872332.0, 1873943.0, 173458.0, 30872.0, 10036.0, 4199.0, 2023.0, 1079.0, 671.0, 416.0, 234.0, 141.0, 85.0, 61.0, 37.0, 26.0, 21.0, 16.0, 15.0, 8.0, 3.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.65338134765625, -6.4239501953125, -6.19451904296875, -5.965087890625, -5.73565673828125, -5.5062255859375, -5.27679443359375, -5.04736328125, -4.81793212890625, -4.5885009765625, -4.35906982421875, -4.129638671875, -3.90020751953125, -3.6707763671875, -3.44134521484375, -3.2119140625, -2.98248291015625, -2.7530517578125, -2.52362060546875, -2.294189453125, -2.06475830078125, -1.8353271484375, -1.60589599609375, -1.37646484375, -1.14703369140625, -0.9176025390625, -0.68817138671875, -0.458740234375, -0.22930908203125, 0.0001220703125, 0.22955322265625, 0.458984375, 0.68841552734375, 0.9178466796875, 1.14727783203125, 1.376708984375, 1.60614013671875, 1.8355712890625, 2.06500244140625, 2.29443359375, 2.52386474609375, 2.7532958984375, 2.98272705078125, 3.212158203125, 3.44158935546875, 3.6710205078125, 3.90045166015625, 4.1298828125, 4.35931396484375, 4.5887451171875, 4.81817626953125, 5.047607421875, 5.27703857421875, 5.5064697265625, 5.73590087890625, 5.96533203125, 6.19476318359375, 6.4241943359375, 6.65362548828125, 6.883056640625, 7.11248779296875, 7.3419189453125, 7.57135009765625, 7.80078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 9.0, 12.0, 15.0, 14.0, 20.0, 28.0, 33.0, 30.0, 39.0, 37.0, 50.0, 69.0, 72.0, 62.0, 59.0, 52.0, 57.0, 55.0, 61.0, 34.0, 41.0, 42.0, 23.0, 20.0, 13.0, 10.0, 14.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.456695556640625, -3.28643798828125, -3.116180419921875, -2.9459228515625, -2.775665283203125, -2.60540771484375, -2.435150146484375, -2.264892578125, -2.094635009765625, -1.92437744140625, -1.754119873046875, -1.5838623046875, -1.413604736328125, -1.24334716796875, -1.073089599609375, -0.90283203125, -0.732574462890625, -0.56231689453125, -0.392059326171875, -0.2218017578125, -0.051544189453125, 0.11871337890625, 0.288970947265625, 0.459228515625, 0.629486083984375, 0.79974365234375, 0.970001220703125, 1.1402587890625, 1.310516357421875, 1.48077392578125, 1.651031494140625, 1.8212890625, 1.991546630859375, 2.16180419921875, 2.332061767578125, 2.5023193359375, 2.672576904296875, 2.84283447265625, 3.013092041015625, 3.183349609375, 3.353607177734375, 3.52386474609375, 3.694122314453125, 3.8643798828125, 4.034637451171875, 4.20489501953125, 4.375152587890625, 4.54541015625, 4.715667724609375, 4.88592529296875, 5.056182861328125, 5.2264404296875, 5.396697998046875, 5.56695556640625, 5.737213134765625, 5.907470703125, 6.077728271484375, 6.24798583984375, 6.418243408203125, 6.5885009765625, 6.758758544921875, 6.92901611328125, 7.099273681640625, 7.26953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 9.0, 17.0, 20.0, 27.0, 49.0, 57.0, 91.0, 97.0, 152.0, 265.0, 419.0, 744.0, 1509.0, 3921.0, 14466.0, 97647.0, 3298375.0, 720601.0, 42021.0, 8362.0, 2613.0, 1165.0, 579.0, 339.0, 216.0, 159.0, 92.0, 75.0, 48.0, 38.0, 27.0, 23.0, 12.0, 7.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-13.9296875, -13.477294921875, -13.02490234375, -12.572509765625, -12.1201171875, -11.667724609375, -11.21533203125, -10.762939453125, -10.310546875, -9.858154296875, -9.40576171875, -8.953369140625, -8.5009765625, -8.048583984375, -7.59619140625, -7.143798828125, -6.69140625, -6.239013671875, -5.78662109375, -5.334228515625, -4.8818359375, -4.429443359375, -3.97705078125, -3.524658203125, -3.072265625, -2.619873046875, -2.16748046875, -1.715087890625, -1.2626953125, -0.810302734375, -0.35791015625, 0.094482421875, 0.546875, 0.999267578125, 1.45166015625, 1.904052734375, 2.3564453125, 2.808837890625, 3.26123046875, 3.713623046875, 4.166015625, 4.618408203125, 5.07080078125, 5.523193359375, 5.9755859375, 6.427978515625, 6.88037109375, 7.332763671875, 7.78515625, 8.237548828125, 8.68994140625, 9.142333984375, 9.5947265625, 10.047119140625, 10.49951171875, 10.951904296875, 11.404296875, 11.856689453125, 12.30908203125, 12.761474609375, 13.2138671875, 13.666259765625, 14.11865234375, 14.571044921875, 15.0234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 12.0, 22.0, 26.0, 56.0, 93.0, 216.0, 454.0, 1086.0, 1052.0, 503.0, 213.0, 108.0, 71.0, 47.0, 32.0, 22.0, 16.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.469970703125, -15.97119140625, -15.472412109375, -14.9736328125, -14.474853515625, -13.97607421875, -13.477294921875, -12.978515625, -12.479736328125, -11.98095703125, -11.482177734375, -10.9833984375, -10.484619140625, -9.98583984375, -9.487060546875, -8.98828125, -8.489501953125, -7.99072265625, -7.491943359375, -6.9931640625, -6.494384765625, -5.99560546875, -5.496826171875, -4.998046875, -4.499267578125, -4.00048828125, -3.501708984375, -3.0029296875, -2.504150390625, -2.00537109375, -1.506591796875, -1.0078125, -0.509033203125, -0.01025390625, 0.488525390625, 0.9873046875, 1.486083984375, 1.98486328125, 2.483642578125, 2.982421875, 3.481201171875, 3.97998046875, 4.478759765625, 4.9775390625, 5.476318359375, 5.97509765625, 6.473876953125, 6.97265625, 7.471435546875, 7.97021484375, 8.468994140625, 8.9677734375, 9.466552734375, 9.96533203125, 10.464111328125, 10.962890625, 11.461669921875, 11.96044921875, 12.459228515625, 12.9580078125, 13.456787109375, 13.95556640625, 14.454345703125, 14.953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 14.0, 53.0, 133.0, 290.0, 295.0, 129.0, 35.0, 28.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.38079833984375, -253.84283447265625, -247.30487060546875, -240.76690673828125, -234.2289581298828, -227.6909942626953, -221.1530303955078, -214.6150665283203, -208.07711791992188, -201.53915405273438, -195.00119018554688, -188.46322631835938, -181.92527770996094, -175.38731384277344, -168.84934997558594, -162.31138610839844, -155.77342224121094, -149.23545837402344, -142.69749450683594, -136.1595458984375, -129.62158203125, -123.0836181640625, -116.545654296875, -110.0076904296875, -103.46973419189453, -96.93177032470703, -90.39381408691406, -83.85585021972656, -77.31788635253906, -70.7799301147461, -64.2419662475586, -57.70400619506836, -51.166046142578125, -44.62808609008789, -38.090126037597656, -31.552162170410156, -25.014202117919922, -18.476242065429688, -11.938278198242188, -5.400318145751953, 1.1376419067382812, 7.675602912902832, 14.213563919067383, 20.75152587890625, 27.289485931396484, 33.82744598388672, 40.36540985107422, 46.90336990356445, 53.44132995605469, 59.97929000854492, 66.51725006103516, 73.05521392822266, 79.59317016601562, 86.13113403320312, 92.66909790039062, 99.20706176757812, 105.7450180053711, 112.2829818725586, 118.82093811035156, 125.35890197753906, 131.89686584472656, 138.434814453125, 144.9727783203125, 151.5107421875, 158.0487060546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 8.0, 13.0, 16.0, 28.0, 21.0, 43.0, 39.0, 37.0, 53.0, 56.0, 43.0, 58.0, 65.0, 74.0, 55.0, 59.0, 47.0, 54.0, 41.0, 37.0, 25.0, 25.0, 17.0, 11.0, 24.0, 8.0, 7.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.72247314453125, -62.74386978149414, -60.7652702331543, -58.78666687011719, -56.808067321777344, -54.829463958740234, -52.85086441040039, -50.87226104736328, -48.89366149902344, -46.91505813598633, -44.936458587646484, -42.957855224609375, -40.97925567626953, -39.00065231323242, -37.02205276489258, -35.04344940185547, -33.064849853515625, -31.08624839782715, -29.107646942138672, -27.129045486450195, -25.15044403076172, -23.17184066772461, -21.193241119384766, -19.214637756347656, -17.236034393310547, -15.25743293762207, -13.278831481933594, -11.300230026245117, -9.32162857055664, -7.343026161193848, -5.364424705505371, -3.3858232498168945, -1.4072227478027344, 0.5713788270950317, 2.549980401992798, 4.5285820960998535, 6.50718355178833, 8.485785484313965, 10.464386940002441, 12.442988395690918, 14.421589851379395, 16.400192260742188, 18.378793716430664, 20.35739517211914, 22.335996627807617, 24.314598083496094, 26.29319953918457, 28.271800994873047, 30.250402450561523, 32.22900390625, 34.20760726928711, 36.18620681762695, 38.16481018066406, 40.143409729003906, 42.122013092041016, 44.10061264038086, 46.07921600341797, 48.05781936645508, 50.03641891479492, 52.01502227783203, 53.993621826171875, 55.972225189208984, 57.95082473754883, 59.92942810058594, 61.90802764892578]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 12.0, 14.0, 17.0, 25.0, 40.0, 84.0, 105.0, 153.0, 275.0, 475.0, 816.0, 1438.0, 2690.0, 5161.0, 11184.0, 25426.0, 63562.0, 159644.0, 308289.0, 265548.0, 118995.0, 46819.0, 19615.0, 8846.0, 4266.0, 2147.0, 1209.0, 679.0, 377.0, 259.0, 142.0, 89.0, 67.0, 31.0, 20.0, 9.0, 10.0, 5.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.49554443359375, -6.3035888671875, -6.11163330078125, -5.919677734375, -5.72772216796875, -5.5357666015625, -5.34381103515625, -5.15185546875, -4.95989990234375, -4.7679443359375, -4.57598876953125, -4.384033203125, -4.19207763671875, -4.0001220703125, -3.80816650390625, -3.6162109375, -3.42425537109375, -3.2322998046875, -3.04034423828125, -2.848388671875, -2.65643310546875, -2.4644775390625, -2.27252197265625, -2.08056640625, -1.88861083984375, -1.6966552734375, -1.50469970703125, -1.312744140625, -1.12078857421875, -0.9288330078125, -0.73687744140625, -0.544921875, -0.35296630859375, -0.1610107421875, 0.03094482421875, 0.222900390625, 0.41485595703125, 0.6068115234375, 0.79876708984375, 0.99072265625, 1.18267822265625, 1.3746337890625, 1.56658935546875, 1.758544921875, 1.95050048828125, 2.1424560546875, 2.33441162109375, 2.5263671875, 2.71832275390625, 2.9102783203125, 3.10223388671875, 3.294189453125, 3.48614501953125, 3.6781005859375, 3.87005615234375, 4.06201171875, 4.25396728515625, 4.4459228515625, 4.63787841796875, 4.829833984375, 5.02178955078125, 5.2137451171875, 5.40570068359375, 5.59765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 12.0, 11.0, 10.0, 20.0, 25.0, 22.0, 37.0, 43.0, 49.0, 41.0, 55.0, 68.0, 61.0, 53.0, 61.0, 50.0, 64.0, 46.0, 44.0, 46.0, 26.0, 31.0, 30.0, 25.0, 17.0, 14.0, 8.0, 7.0, 3.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.87664794921875, -3.6986083984375, -3.52056884765625, -3.342529296875, -3.16448974609375, -2.9864501953125, -2.80841064453125, -2.63037109375, -2.45233154296875, -2.2742919921875, -2.09625244140625, -1.918212890625, -1.74017333984375, -1.5621337890625, -1.38409423828125, -1.2060546875, -1.02801513671875, -0.8499755859375, -0.67193603515625, -0.493896484375, -0.31585693359375, -0.1378173828125, 0.04022216796875, 0.21826171875, 0.39630126953125, 0.5743408203125, 0.75238037109375, 0.930419921875, 1.10845947265625, 1.2864990234375, 1.46453857421875, 1.642578125, 1.82061767578125, 1.9986572265625, 2.17669677734375, 2.354736328125, 2.53277587890625, 2.7108154296875, 2.88885498046875, 3.06689453125, 3.24493408203125, 3.4229736328125, 3.60101318359375, 3.779052734375, 3.95709228515625, 4.1351318359375, 4.31317138671875, 4.4912109375, 4.66925048828125, 4.8472900390625, 5.02532958984375, 5.203369140625, 5.38140869140625, 5.5594482421875, 5.73748779296875, 5.91552734375, 6.09356689453125, 6.2716064453125, 6.44964599609375, 6.627685546875, 6.80572509765625, 6.9837646484375, 7.16180419921875, 7.33984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 4.0, 4.0, 6.0, 11.0, 16.0, 16.0, 36.0, 38.0, 56.0, 81.0, 133.0, 183.0, 282.0, 511.0, 950.0, 2030.0, 4527.0, 13564.0, 58104.0, 343150.0, 531231.0, 68851.0, 15140.0, 5099.0, 2013.0, 1046.0, 581.0, 324.0, 167.0, 126.0, 69.0, 63.0, 43.0, 25.0, 19.0, 9.0, 10.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.59375, -11.2203369140625, -10.846923828125, -10.4735107421875, -10.10009765625, -9.7266845703125, -9.353271484375, -8.9798583984375, -8.6064453125, -8.2330322265625, -7.859619140625, -7.4862060546875, -7.11279296875, -6.7393798828125, -6.365966796875, -5.9925537109375, -5.619140625, -5.2457275390625, -4.872314453125, -4.4989013671875, -4.12548828125, -3.7520751953125, -3.378662109375, -3.0052490234375, -2.6318359375, -2.2584228515625, -1.885009765625, -1.5115966796875, -1.13818359375, -0.7647705078125, -0.391357421875, -0.0179443359375, 0.35546875, 0.7288818359375, 1.102294921875, 1.4757080078125, 1.84912109375, 2.2225341796875, 2.595947265625, 2.9693603515625, 3.3427734375, 3.7161865234375, 4.089599609375, 4.4630126953125, 4.83642578125, 5.2098388671875, 5.583251953125, 5.9566650390625, 6.330078125, 6.7034912109375, 7.076904296875, 7.4503173828125, 7.82373046875, 8.1971435546875, 8.570556640625, 8.9439697265625, 9.3173828125, 9.6907958984375, 10.064208984375, 10.4376220703125, 10.81103515625, 11.1844482421875, 11.557861328125, 11.9312744140625, 12.3046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 6.0, 14.0, 9.0, 18.0, 25.0, 32.0, 17.0, 37.0, 51.0, 48.0, 46.0, 47.0, 55.0, 44.0, 65.0, 39.0, 54.0, 56.0, 45.0, 41.0, 37.0, 33.0, 27.0, 23.0, 27.0, 20.0, 18.0, 8.0, 15.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.810791015625, -14.26220703125, -13.713623046875, -13.1650390625, -12.616455078125, -12.06787109375, -11.519287109375, -10.970703125, -10.422119140625, -9.87353515625, -9.324951171875, -8.7763671875, -8.227783203125, -7.67919921875, -7.130615234375, -6.58203125, -6.033447265625, -5.48486328125, -4.936279296875, -4.3876953125, -3.839111328125, -3.29052734375, -2.741943359375, -2.193359375, -1.644775390625, -1.09619140625, -0.547607421875, 0.0009765625, 0.549560546875, 1.09814453125, 1.646728515625, 2.1953125, 2.743896484375, 3.29248046875, 3.841064453125, 4.3896484375, 4.938232421875, 5.48681640625, 6.035400390625, 6.583984375, 7.132568359375, 7.68115234375, 8.229736328125, 8.7783203125, 9.326904296875, 9.87548828125, 10.424072265625, 10.97265625, 11.521240234375, 12.06982421875, 12.618408203125, 13.1669921875, 13.715576171875, 14.26416015625, 14.812744140625, 15.361328125, 15.909912109375, 16.45849609375, 17.007080078125, 17.5556640625, 18.104248046875, 18.65283203125, 19.201416015625, 19.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 9.0, 16.0, 27.0, 33.0, 26.0, 49.0, 74.0, 123.0, 215.0, 372.0, 600.0, 940.0, 1687.0, 3246.0, 6638.0, 15152.0, 40602.0, 146984.0, 600957.0, 157592.0, 43136.0, 15715.0, 6759.0, 3314.0, 1720.0, 997.0, 550.0, 369.0, 212.0, 162.0, 83.0, 62.0, 41.0, 28.0, 13.0, 10.0, 3.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.841796875, -2.75164794921875, -2.6614990234375, -2.57135009765625, -2.481201171875, -2.39105224609375, -2.3009033203125, -2.21075439453125, -2.12060546875, -2.03045654296875, -1.9403076171875, -1.85015869140625, -1.760009765625, -1.66986083984375, -1.5797119140625, -1.48956298828125, -1.3994140625, -1.30926513671875, -1.2191162109375, -1.12896728515625, -1.038818359375, -0.94866943359375, -0.8585205078125, -0.76837158203125, -0.67822265625, -0.58807373046875, -0.4979248046875, -0.40777587890625, -0.317626953125, -0.22747802734375, -0.1373291015625, -0.04718017578125, 0.04296875, 0.13311767578125, 0.2232666015625, 0.31341552734375, 0.403564453125, 0.49371337890625, 0.5838623046875, 0.67401123046875, 0.76416015625, 0.85430908203125, 0.9444580078125, 1.03460693359375, 1.124755859375, 1.21490478515625, 1.3050537109375, 1.39520263671875, 1.4853515625, 1.57550048828125, 1.6656494140625, 1.75579833984375, 1.845947265625, 1.93609619140625, 2.0262451171875, 2.11639404296875, 2.20654296875, 2.29669189453125, 2.3868408203125, 2.47698974609375, 2.567138671875, 2.65728759765625, 2.7474365234375, 2.83758544921875, 2.927734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 10.0, 11.0, 22.0, 36.0, 66.0, 209.0, 252.0, 175.0, 78.0, 40.0, 25.0, 10.0, 16.0, 9.0, 4.0, 4.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001651763916015625, -0.00159551203250885, -0.0015392601490020752, -0.0014830082654953003, -0.0014267563819885254, -0.0013705044984817505, -0.0013142526149749756, -0.0012580007314682007, -0.0012017488479614258, -0.0011454969644546509, -0.001089245080947876, -0.001032993197441101, -0.0009767413139343262, -0.0009204894304275513, -0.0008642375469207764, -0.0008079856634140015, -0.0007517337799072266, -0.0006954818964004517, -0.0006392300128936768, -0.0005829781293869019, -0.000526726245880127, -0.00047047436237335205, -0.00041422247886657715, -0.00035797059535980225, -0.00030171871185302734, -0.00024546682834625244, -0.00018921494483947754, -0.00013296306133270264, -7.671117782592773e-05, -2.0459294319152832e-05, 3.579258918762207e-05, 9.204447269439697e-05, 0.00014829635620117188, 0.00020454823970794678, 0.0002608001232147217, 0.0003170520067214966, 0.0003733038902282715, 0.0004295557737350464, 0.0004858076572418213, 0.0005420595407485962, 0.0005983114242553711, 0.000654563307762146, 0.0007108151912689209, 0.0007670670747756958, 0.0008233189582824707, 0.0008795708417892456, 0.0009358227252960205, 0.0009920746088027954, 0.0010483264923095703, 0.0011045783758163452, 0.0011608302593231201, 0.001217082142829895, 0.00127333402633667, 0.0013295859098434448, 0.0013858377933502197, 0.0014420896768569946, 0.0014983415603637695, 0.0015545934438705444, 0.0016108453273773193, 0.0016670972108840942, 0.0017233490943908691, 0.001779600977897644, 0.001835852861404419, 0.0018921047449111938, 0.0019483566284179688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 10.0, 12.0, 15.0, 25.0, 28.0, 40.0, 87.0, 158.0, 275.0, 555.0, 1343.0, 3403.0, 10394.0, 38977.0, 228327.0, 653311.0, 83414.0, 18674.0, 5652.0, 2098.0, 831.0, 437.0, 204.0, 90.0, 64.0, 47.0, 26.0, 12.0, 11.0, 12.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.96484375, -4.831512451171875, -4.69818115234375, -4.564849853515625, -4.4315185546875, -4.298187255859375, -4.16485595703125, -4.031524658203125, -3.898193359375, -3.764862060546875, -3.63153076171875, -3.498199462890625, -3.3648681640625, -3.231536865234375, -3.09820556640625, -2.964874267578125, -2.83154296875, -2.698211669921875, -2.56488037109375, -2.431549072265625, -2.2982177734375, -2.164886474609375, -2.03155517578125, -1.898223876953125, -1.764892578125, -1.631561279296875, -1.49822998046875, -1.364898681640625, -1.2315673828125, -1.098236083984375, -0.96490478515625, -0.831573486328125, -0.6982421875, -0.564910888671875, -0.43157958984375, -0.298248291015625, -0.1649169921875, -0.031585693359375, 0.10174560546875, 0.235076904296875, 0.368408203125, 0.501739501953125, 0.63507080078125, 0.768402099609375, 0.9017333984375, 1.035064697265625, 1.16839599609375, 1.301727294921875, 1.43505859375, 1.568389892578125, 1.70172119140625, 1.835052490234375, 1.9683837890625, 2.101715087890625, 2.23504638671875, 2.368377685546875, 2.501708984375, 2.635040283203125, 2.76837158203125, 2.901702880859375, 3.0350341796875, 3.168365478515625, 3.30169677734375, 3.435028076171875, 3.568359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 12.0, 14.0, 19.0, 17.0, 23.0, 31.0, 46.0, 51.0, 72.0, 79.0, 83.0, 86.0, 95.0, 63.0, 76.0, 43.0, 37.0, 33.0, 26.0, 12.0, 20.0, 6.0, 5.0, 4.0, 2.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.619140625, -3.516143798828125, -3.41314697265625, -3.310150146484375, -3.2071533203125, -3.104156494140625, -3.00115966796875, -2.898162841796875, -2.795166015625, -2.692169189453125, -2.58917236328125, -2.486175537109375, -2.3831787109375, -2.280181884765625, -2.17718505859375, -2.074188232421875, -1.97119140625, -1.868194580078125, -1.76519775390625, -1.662200927734375, -1.5592041015625, -1.456207275390625, -1.35321044921875, -1.250213623046875, -1.147216796875, -1.044219970703125, -0.94122314453125, -0.838226318359375, -0.7352294921875, -0.632232666015625, -0.52923583984375, -0.426239013671875, -0.3232421875, -0.220245361328125, -0.11724853515625, -0.014251708984375, 0.0887451171875, 0.191741943359375, 0.29473876953125, 0.397735595703125, 0.500732421875, 0.603729248046875, 0.70672607421875, 0.809722900390625, 0.9127197265625, 1.015716552734375, 1.11871337890625, 1.221710205078125, 1.32470703125, 1.427703857421875, 1.53070068359375, 1.633697509765625, 1.7366943359375, 1.839691162109375, 1.94268798828125, 2.045684814453125, 2.148681640625, 2.251678466796875, 2.35467529296875, 2.457672119140625, 2.5606689453125, 2.663665771484375, 2.76666259765625, 2.869659423828125, 2.97265625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 20.0, 41.0, 71.0, 142.0, 258.0, 238.0, 112.0, 58.0, 24.0, 11.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.380126953125, -96.49137115478516, -92.60261535644531, -88.71385192871094, -84.8250961303711, -80.93634033203125, -77.0475845336914, -73.15882873535156, -69.27006530761719, -65.38130950927734, -61.492549896240234, -57.60379409790039, -53.71503448486328, -49.82627868652344, -45.937522888183594, -42.048763275146484, -38.16000747680664, -34.2712516784668, -30.382492065429688, -26.493736267089844, -22.604976654052734, -18.71622085571289, -14.827463150024414, -10.938705444335938, -7.049947738647461, -3.1611902713775635, 0.727567195892334, 4.616324424743652, 8.505082130432129, 12.393838882446289, 16.282596588134766, 20.171354293823242, 24.06011199951172, 27.948869705200195, 31.837627410888672, 35.726383209228516, 39.615142822265625, 43.50389862060547, 47.39265441894531, 51.28141403198242, 55.17017364501953, 59.058929443359375, 62.947689056396484, 66.8364486694336, 70.72520446777344, 74.61396026611328, 78.50271606445312, 82.3914794921875, 86.28022766113281, 90.16898345947266, 94.0577392578125, 97.94650268554688, 101.83525848388672, 105.72401428222656, 109.6127700805664, 113.50152587890625, 117.39028930664062, 121.27904510498047, 125.16780090332031, 129.0565643310547, 132.9453125, 136.83407592773438, 140.72283935546875, 144.61158752441406, 148.50035095214844]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 2.0, 6.0, 6.0, 5.0, 10.0, 10.0, 10.0, 9.0, 18.0, 19.0, 21.0, 26.0, 25.0, 21.0, 37.0, 27.0, 38.0, 33.0, 53.0, 60.0, 76.0, 64.0, 50.0, 39.0, 42.0, 33.0, 26.0, 37.0, 34.0, 23.0, 14.0, 15.0, 19.0, 19.0, 15.0, 9.0, 13.0, 5.0, 5.0, 5.0, 1.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.46983337402344, -52.68632888793945, -50.90282440185547, -49.11932373046875, -47.335819244384766, -45.55231475830078, -43.7688102722168, -41.98530578613281, -40.20180130004883, -38.418296813964844, -36.63479232788086, -34.851287841796875, -33.067787170410156, -31.284282684326172, -29.500778198242188, -27.717273712158203, -25.93377113342285, -24.150266647338867, -22.366764068603516, -20.58325958251953, -18.799755096435547, -17.016250610351562, -15.232748031616211, -13.449243545532227, -11.665740013122559, -9.88223648071289, -8.098731994628906, -6.315228462219238, -4.531724452972412, -2.748220443725586, -0.964716911315918, 0.8187875747680664, 2.6022911071777344, 4.3857951164245605, 6.169299125671387, 7.952802658081055, 9.736307144165039, 11.519810676574707, 13.303314208984375, 15.08681869506836, 16.870323181152344, 18.653827667236328, 20.43733024597168, 22.220834732055664, 24.00433921813965, 25.787841796875, 27.571346282958984, 29.35485076904297, 31.13835334777832, 32.92185592651367, 34.705360412597656, 36.48886489868164, 38.272369384765625, 40.05587387084961, 41.839378356933594, 43.62287902832031, 45.4063835144043, 47.18988800048828, 48.973392486572266, 50.75689697265625, 52.54039764404297, 54.32390213012695, 56.10740661621094, 57.89091110229492, 59.674415588378906]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 13.0, 8.0, 21.0, 14.0, 41.0, 63.0, 112.0, 145.0, 258.0, 432.0, 832.0, 1538.0, 2990.0, 6275.0, 15362.0, 51537.0, 295141.0, 1901606.0, 1616351.0, 234322.0, 42923.0, 12991.0, 5324.0, 2586.0, 1357.0, 795.0, 465.0, 285.0, 183.0, 97.0, 65.0, 47.0, 30.0, 21.0, 20.0, 6.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.703125, -5.518798828125, -5.33447265625, -5.150146484375, -4.9658203125, -4.781494140625, -4.59716796875, -4.412841796875, -4.228515625, -4.044189453125, -3.85986328125, -3.675537109375, -3.4912109375, -3.306884765625, -3.12255859375, -2.938232421875, -2.75390625, -2.569580078125, -2.38525390625, -2.200927734375, -2.0166015625, -1.832275390625, -1.64794921875, -1.463623046875, -1.279296875, -1.094970703125, -0.91064453125, -0.726318359375, -0.5419921875, -0.357666015625, -0.17333984375, 0.010986328125, 0.1953125, 0.379638671875, 0.56396484375, 0.748291015625, 0.9326171875, 1.116943359375, 1.30126953125, 1.485595703125, 1.669921875, 1.854248046875, 2.03857421875, 2.222900390625, 2.4072265625, 2.591552734375, 2.77587890625, 2.960205078125, 3.14453125, 3.328857421875, 3.51318359375, 3.697509765625, 3.8818359375, 4.066162109375, 4.25048828125, 4.434814453125, 4.619140625, 4.803466796875, 4.98779296875, 5.172119140625, 5.3564453125, 5.540771484375, 5.72509765625, 5.909423828125, 6.09375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 9.0, 9.0, 8.0, 12.0, 22.0, 23.0, 29.0, 43.0, 42.0, 37.0, 39.0, 66.0, 70.0, 75.0, 59.0, 64.0, 49.0, 55.0, 52.0, 45.0, 50.0, 34.0, 30.0, 17.0, 19.0, 8.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.98046875, -3.803466796875, -3.62646484375, -3.449462890625, -3.2724609375, -3.095458984375, -2.91845703125, -2.741455078125, -2.564453125, -2.387451171875, -2.21044921875, -2.033447265625, -1.8564453125, -1.679443359375, -1.50244140625, -1.325439453125, -1.1484375, -0.971435546875, -0.79443359375, -0.617431640625, -0.4404296875, -0.263427734375, -0.08642578125, 0.090576171875, 0.267578125, 0.444580078125, 0.62158203125, 0.798583984375, 0.9755859375, 1.152587890625, 1.32958984375, 1.506591796875, 1.68359375, 1.860595703125, 2.03759765625, 2.214599609375, 2.3916015625, 2.568603515625, 2.74560546875, 2.922607421875, 3.099609375, 3.276611328125, 3.45361328125, 3.630615234375, 3.8076171875, 3.984619140625, 4.16162109375, 4.338623046875, 4.515625, 4.692626953125, 4.86962890625, 5.046630859375, 5.2236328125, 5.400634765625, 5.57763671875, 5.754638671875, 5.931640625, 6.108642578125, 6.28564453125, 6.462646484375, 6.6396484375, 6.816650390625, 6.99365234375, 7.170654296875, 7.34765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 6.0, 17.0, 42.0, 52.0, 101.0, 160.0, 253.0, 596.0, 3684.0, 1480916.0, 2703056.0, 4164.0, 621.0, 265.0, 133.0, 85.0, 55.0, 30.0, 21.0, 10.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.58935546875, -34.2724609375, -32.95556640625, -31.638671875, -30.32177734375, -29.0048828125, -27.68798828125, -26.37109375, -25.05419921875, -23.7373046875, -22.42041015625, -21.103515625, -19.78662109375, -18.4697265625, -17.15283203125, -15.8359375, -14.51904296875, -13.2021484375, -11.88525390625, -10.568359375, -9.25146484375, -7.9345703125, -6.61767578125, -5.30078125, -3.98388671875, -2.6669921875, -1.35009765625, -0.033203125, 1.28369140625, 2.6005859375, 3.91748046875, 5.234375, 6.55126953125, 7.8681640625, 9.18505859375, 10.501953125, 11.81884765625, 13.1357421875, 14.45263671875, 15.76953125, 17.08642578125, 18.4033203125, 19.72021484375, 21.037109375, 22.35400390625, 23.6708984375, 24.98779296875, 26.3046875, 27.62158203125, 28.9384765625, 30.25537109375, 31.572265625, 32.88916015625, 34.2060546875, 35.52294921875, 36.83984375, 38.15673828125, 39.4736328125, 40.79052734375, 42.107421875, 43.42431640625, 44.7412109375, 46.05810546875, 47.375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 15.0, 34.0, 80.0, 196.0, 685.0, 1820.0, 860.0, 223.0, 85.0, 43.0, 14.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -20.119140625, -19.30078125, -18.482421875, -17.6640625, -16.845703125, -16.02734375, -15.208984375, -14.390625, -13.572265625, -12.75390625, -11.935546875, -11.1171875, -10.298828125, -9.48046875, -8.662109375, -7.84375, -7.025390625, -6.20703125, -5.388671875, -4.5703125, -3.751953125, -2.93359375, -2.115234375, -1.296875, -0.478515625, 0.33984375, 1.158203125, 1.9765625, 2.794921875, 3.61328125, 4.431640625, 5.25, 6.068359375, 6.88671875, 7.705078125, 8.5234375, 9.341796875, 10.16015625, 10.978515625, 11.796875, 12.615234375, 13.43359375, 14.251953125, 15.0703125, 15.888671875, 16.70703125, 17.525390625, 18.34375, 19.162109375, 19.98046875, 20.798828125, 21.6171875, 22.435546875, 23.25390625, 24.072265625, 24.890625, 25.708984375, 26.52734375, 27.345703125, 28.1640625, 28.982421875, 29.80078125, 30.619140625, 31.4375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 21.0, 34.0, 115.0, 236.0, 320.0, 157.0, 61.0, 29.0, 11.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.21636962890625, -270.2434387207031, -264.2705078125, -258.2975769042969, -252.32464599609375, -246.3517303466797, -240.37879943847656, -234.40586853027344, -228.4329376220703, -222.4600067138672, -216.48707580566406, -210.51414489746094, -204.54122924804688, -198.56829833984375, -192.59536743164062, -186.6224365234375, -180.64950561523438, -174.67657470703125, -168.70364379882812, -162.730712890625, -156.75778198242188, -150.7848663330078, -144.8119354248047, -138.83900451660156, -132.86607360839844, -126.89314270019531, -120.92021179199219, -114.9472885131836, -108.97435760498047, -103.00142669677734, -97.02850341796875, -91.05557250976562, -85.08262634277344, -79.10969543457031, -73.13676452636719, -67.1638412475586, -61.19091033935547, -55.217979431152344, -49.245052337646484, -43.272125244140625, -37.2991943359375, -31.326265335083008, -25.353336334228516, -19.380407333374023, -13.407478332519531, -7.434549331665039, -1.4616203308105469, 4.5113067626953125, 10.484237670898438, 16.45716667175293, 22.430095672607422, 28.403024673461914, 34.375953674316406, 40.34888458251953, 46.32181167602539, 52.29473876953125, 58.267669677734375, 64.2406005859375, 70.21353149414062, 76.18645477294922, 82.15938568115234, 88.13231658935547, 94.10523986816406, 100.07817077636719, 106.05110168457031]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 15.0, 17.0, 23.0, 23.0, 25.0, 29.0, 40.0, 35.0, 40.0, 38.0, 39.0, 39.0, 35.0, 48.0, 54.0, 44.0, 39.0, 43.0, 38.0, 39.0, 44.0, 38.0, 14.0, 22.0, 20.0, 30.0, 12.0, 12.0, 21.0, 8.0, 7.0, 3.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-43.81529998779297, -42.46793746948242, -41.120574951171875, -39.773216247558594, -38.42585372924805, -37.0784912109375, -35.73113250732422, -34.38376998901367, -33.036407470703125, -31.689044952392578, -30.341684341430664, -28.99432373046875, -27.646961212158203, -26.299598693847656, -24.952238082885742, -23.604877471923828, -22.25751495361328, -20.910152435302734, -19.56279182434082, -18.215431213378906, -16.86806869506836, -15.520707130432129, -14.173345565795898, -12.825984001159668, -11.478622436523438, -10.131260871887207, -8.783899307250977, -7.436537742614746, -6.089176177978516, -4.741814613342285, -3.3944530487060547, -2.047091484069824, -0.6997337341308594, 0.6476278305053711, 1.9949893951416016, 3.342350959777832, 4.6897125244140625, 6.037074089050293, 7.384435653686523, 8.731797218322754, 10.079158782958984, 11.426520347595215, 12.773881912231445, 14.121243476867676, 15.468605041503906, 16.815967559814453, 18.163328170776367, 19.51068878173828, 20.858051300048828, 22.205413818359375, 23.55277442932129, 24.900135040283203, 26.24749755859375, 27.594860076904297, 28.94222068786621, 30.289581298828125, 31.636943817138672, 32.98430633544922, 34.3316650390625, 35.67902755737305, 37.026390075683594, 38.37375259399414, 39.72111511230469, 41.06847381591797, 42.415836334228516]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 18.0, 17.0, 35.0, 45.0, 67.0, 121.0, 208.0, 386.0, 786.0, 1522.0, 3080.0, 6667.0, 15850.0, 41400.0, 119087.0, 320268.0, 334486.0, 129602.0, 44218.0, 16983.0, 7057.0, 3272.0, 1545.0, 842.0, 409.0, 235.0, 140.0, 77.0, 38.0, 38.0, 14.0, 11.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.07440185546875, -7.8675537109375, -7.66070556640625, -7.453857421875, -7.24700927734375, -7.0401611328125, -6.83331298828125, -6.62646484375, -6.41961669921875, -6.2127685546875, -6.00592041015625, -5.799072265625, -5.59222412109375, -5.3853759765625, -5.17852783203125, -4.9716796875, -4.76483154296875, -4.5579833984375, -4.35113525390625, -4.144287109375, -3.93743896484375, -3.7305908203125, -3.52374267578125, -3.31689453125, -3.11004638671875, -2.9031982421875, -2.69635009765625, -2.489501953125, -2.28265380859375, -2.0758056640625, -1.86895751953125, -1.662109375, -1.45526123046875, -1.2484130859375, -1.04156494140625, -0.834716796875, -0.62786865234375, -0.4210205078125, -0.21417236328125, -0.00732421875, 0.19952392578125, 0.4063720703125, 0.61322021484375, 0.820068359375, 1.02691650390625, 1.2337646484375, 1.44061279296875, 1.6474609375, 1.85430908203125, 2.0611572265625, 2.26800537109375, 2.474853515625, 2.68170166015625, 2.8885498046875, 3.09539794921875, 3.30224609375, 3.50909423828125, 3.7159423828125, 3.92279052734375, 4.129638671875, 4.33648681640625, 4.5433349609375, 4.75018310546875, 4.95703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 1.0, 5.0, 12.0, 13.0, 16.0, 20.0, 22.0, 36.0, 33.0, 34.0, 48.0, 52.0, 50.0, 53.0, 66.0, 54.0, 56.0, 61.0, 55.0, 49.0, 51.0, 44.0, 35.0, 26.0, 21.0, 24.0, 18.0, 10.0, 7.0, 6.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.13818359375, -3.9560546875, -3.77392578125, -3.591796875, -3.40966796875, -3.2275390625, -3.04541015625, -2.86328125, -2.68115234375, -2.4990234375, -2.31689453125, -2.134765625, -1.95263671875, -1.7705078125, -1.58837890625, -1.40625, -1.22412109375, -1.0419921875, -0.85986328125, -0.677734375, -0.49560546875, -0.3134765625, -0.13134765625, 0.05078125, 0.23291015625, 0.4150390625, 0.59716796875, 0.779296875, 0.96142578125, 1.1435546875, 1.32568359375, 1.5078125, 1.68994140625, 1.8720703125, 2.05419921875, 2.236328125, 2.41845703125, 2.6005859375, 2.78271484375, 2.96484375, 3.14697265625, 3.3291015625, 3.51123046875, 3.693359375, 3.87548828125, 4.0576171875, 4.23974609375, 4.421875, 4.60400390625, 4.7861328125, 4.96826171875, 5.150390625, 5.33251953125, 5.5146484375, 5.69677734375, 5.87890625, 6.06103515625, 6.2431640625, 6.42529296875, 6.607421875, 6.78955078125, 6.9716796875, 7.15380859375, 7.3359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 4.0, 9.0, 14.0, 17.0, 33.0, 33.0, 37.0, 58.0, 56.0, 83.0, 123.0, 180.0, 254.0, 301.0, 537.0, 878.0, 1737.0, 3837.0, 11355.0, 42307.0, 222247.0, 636035.0, 94963.0, 21430.0, 6411.0, 2436.0, 1160.0, 617.0, 404.0, 257.0, 179.0, 126.0, 103.0, 68.0, 65.0, 43.0, 37.0, 26.0, 19.0, 14.0, 15.0, 10.0, 11.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.994140625, -8.67578125, -8.357421875, -8.0390625, -7.720703125, -7.40234375, -7.083984375, -6.765625, -6.447265625, -6.12890625, -5.810546875, -5.4921875, -5.173828125, -4.85546875, -4.537109375, -4.21875, -3.900390625, -3.58203125, -3.263671875, -2.9453125, -2.626953125, -2.30859375, -1.990234375, -1.671875, -1.353515625, -1.03515625, -0.716796875, -0.3984375, -0.080078125, 0.23828125, 0.556640625, 0.875, 1.193359375, 1.51171875, 1.830078125, 2.1484375, 2.466796875, 2.78515625, 3.103515625, 3.421875, 3.740234375, 4.05859375, 4.376953125, 4.6953125, 5.013671875, 5.33203125, 5.650390625, 5.96875, 6.287109375, 6.60546875, 6.923828125, 7.2421875, 7.560546875, 7.87890625, 8.197265625, 8.515625, 8.833984375, 9.15234375, 9.470703125, 9.7890625, 10.107421875, 10.42578125, 10.744140625, 11.0625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 10.0, 6.0, 6.0, 12.0, 10.0, 12.0, 11.0, 23.0, 14.0, 8.0, 32.0, 33.0, 29.0, 37.0, 37.0, 44.0, 44.0, 42.0, 49.0, 49.0, 51.0, 52.0, 50.0, 46.0, 39.0, 37.0, 32.0, 18.0, 20.0, 29.0, 18.0, 10.0, 22.0, 8.0, 11.0, 8.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.8515625, -14.3704833984375, -13.889404296875, -13.4083251953125, -12.92724609375, -12.4461669921875, -11.965087890625, -11.4840087890625, -11.0029296875, -10.5218505859375, -10.040771484375, -9.5596923828125, -9.07861328125, -8.5975341796875, -8.116455078125, -7.6353759765625, -7.154296875, -6.6732177734375, -6.192138671875, -5.7110595703125, -5.22998046875, -4.7489013671875, -4.267822265625, -3.7867431640625, -3.3056640625, -2.8245849609375, -2.343505859375, -1.8624267578125, -1.38134765625, -0.9002685546875, -0.419189453125, 0.0618896484375, 0.54296875, 1.0240478515625, 1.505126953125, 1.9862060546875, 2.46728515625, 2.9483642578125, 3.429443359375, 3.9105224609375, 4.3916015625, 4.8726806640625, 5.353759765625, 5.8348388671875, 6.31591796875, 6.7969970703125, 7.278076171875, 7.7591552734375, 8.240234375, 8.7213134765625, 9.202392578125, 9.6834716796875, 10.16455078125, 10.6456298828125, 11.126708984375, 11.6077880859375, 12.0888671875, 12.5699462890625, 13.051025390625, 13.5321044921875, 14.01318359375, 14.4942626953125, 14.975341796875, 15.4564208984375, 15.9375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 9.0, 16.0, 15.0, 32.0, 35.0, 46.0, 85.0, 134.0, 192.0, 387.0, 612.0, 1039.0, 2112.0, 4225.0, 9238.0, 22809.0, 65131.0, 279464.0, 540697.0, 76211.0, 25850.0, 10519.0, 4665.0, 2164.0, 1135.0, 680.0, 357.0, 228.0, 144.0, 84.0, 69.0, 47.0, 23.0, 14.0, 16.0, 10.0, 16.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8603515625, -1.7963409423828125, -1.732330322265625, -1.6683197021484375, -1.60430908203125, -1.5402984619140625, -1.476287841796875, -1.4122772216796875, -1.3482666015625, -1.2842559814453125, -1.220245361328125, -1.1562347412109375, -1.09222412109375, -1.0282135009765625, -0.964202880859375, -0.9001922607421875, -0.836181640625, -0.7721710205078125, -0.708160400390625, -0.6441497802734375, -0.58013916015625, -0.5161285400390625, -0.452117919921875, -0.3881072998046875, -0.3240966796875, -0.2600860595703125, -0.196075439453125, -0.1320648193359375, -0.06805419921875, -0.0040435791015625, 0.059967041015625, 0.1239776611328125, 0.18798828125, 0.2519989013671875, 0.316009521484375, 0.3800201416015625, 0.44403076171875, 0.5080413818359375, 0.572052001953125, 0.6360626220703125, 0.7000732421875, 0.7640838623046875, 0.828094482421875, 0.8921051025390625, 0.95611572265625, 1.0201263427734375, 1.084136962890625, 1.1481475830078125, 1.212158203125, 1.2761688232421875, 1.340179443359375, 1.4041900634765625, 1.46820068359375, 1.5322113037109375, 1.596221923828125, 1.6602325439453125, 1.7242431640625, 1.7882537841796875, 1.852264404296875, 1.9162750244140625, 1.98028564453125, 2.0442962646484375, 2.108306884765625, 2.1723175048828125, 2.236328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 13.0, 6.0, 17.0, 35.0, 36.0, 56.0, 105.0, 184.0, 195.0, 111.0, 71.0, 35.0, 30.0, 16.0, 7.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0012502670288085938, -0.001214638352394104, -0.0011790096759796143, -0.0011433809995651245, -0.0011077523231506348, -0.001072123646736145, -0.0010364949703216553, -0.0010008662939071655, -0.0009652376174926758, -0.000929608941078186, -0.0008939802646636963, -0.0008583515882492065, -0.0008227229118347168, -0.000787094235420227, -0.0007514655590057373, -0.0007158368825912476, -0.0006802082061767578, -0.0006445795297622681, -0.0006089508533477783, -0.0005733221769332886, -0.0005376935005187988, -0.0005020648241043091, -0.00046643614768981934, -0.0004308074712753296, -0.00039517879486083984, -0.0003595501184463501, -0.00032392144203186035, -0.0002882927656173706, -0.00025266408920288086, -0.0002170354127883911, -0.00018140673637390137, -0.00014577805995941162, -0.00011014938354492188, -7.452070713043213e-05, -3.889203071594238e-05, -3.2633543014526367e-06, 3.236532211303711e-05, 6.799399852752686e-05, 0.0001036226749420166, 0.00013925135135650635, 0.0001748800277709961, 0.00021050870418548584, 0.0002461373805999756, 0.00028176605701446533, 0.0003173947334289551, 0.0003530234098434448, 0.00038865208625793457, 0.0004242807626724243, 0.00045990943908691406, 0.0004955381155014038, 0.0005311667919158936, 0.0005667954683303833, 0.000602424144744873, 0.0006380528211593628, 0.0006736814975738525, 0.0007093101739883423, 0.000744938850402832, 0.0007805675268173218, 0.0008161962032318115, 0.0008518248796463013, 0.000887453556060791, 0.0009230822324752808, 0.0009587109088897705, 0.0009943395853042603, 0.00102996826171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 10.0, 10.0, 7.0, 15.0, 16.0, 23.0, 20.0, 37.0, 54.0, 110.0, 171.0, 244.0, 349.0, 581.0, 967.0, 1657.0, 3076.0, 6850.0, 16421.0, 48015.0, 173606.0, 626858.0, 111462.0, 34195.0, 12355.0, 5183.0, 2646.0, 1332.0, 811.0, 493.0, 322.0, 200.0, 139.0, 104.0, 61.0, 46.0, 30.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 16.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.507080078125, -2.43408203125, -2.361083984375, -2.2880859375, -2.215087890625, -2.14208984375, -2.069091796875, -1.99609375, -1.923095703125, -1.85009765625, -1.777099609375, -1.7041015625, -1.631103515625, -1.55810546875, -1.485107421875, -1.412109375, -1.339111328125, -1.26611328125, -1.193115234375, -1.1201171875, -1.047119140625, -0.97412109375, -0.901123046875, -0.828125, -0.755126953125, -0.68212890625, -0.609130859375, -0.5361328125, -0.463134765625, -0.39013671875, -0.317138671875, -0.244140625, -0.171142578125, -0.09814453125, -0.025146484375, 0.0478515625, 0.120849609375, 0.19384765625, 0.266845703125, 0.33984375, 0.412841796875, 0.48583984375, 0.558837890625, 0.6318359375, 0.704833984375, 0.77783203125, 0.850830078125, 0.923828125, 0.996826171875, 1.06982421875, 1.142822265625, 1.2158203125, 1.288818359375, 1.36181640625, 1.434814453125, 1.5078125, 1.580810546875, 1.65380859375, 1.726806640625, 1.7998046875, 1.872802734375, 1.94580078125, 2.018798828125, 2.091796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 5.0, 3.0, 9.0, 11.0, 13.0, 11.0, 12.0, 14.0, 22.0, 22.0, 20.0, 32.0, 28.0, 37.0, 57.0, 61.0, 60.0, 87.0, 88.0, 76.0, 61.0, 47.0, 39.0, 34.0, 26.0, 20.0, 15.0, 16.0, 10.0, 6.0, 9.0, 6.0, 9.0, 10.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.30780029296875, -2.2347412109375, -2.16168212890625, -2.088623046875, -2.01556396484375, -1.9425048828125, -1.86944580078125, -1.79638671875, -1.72332763671875, -1.6502685546875, -1.57720947265625, -1.504150390625, -1.43109130859375, -1.3580322265625, -1.28497314453125, -1.2119140625, -1.13885498046875, -1.0657958984375, -0.99273681640625, -0.919677734375, -0.84661865234375, -0.7735595703125, -0.70050048828125, -0.62744140625, -0.55438232421875, -0.4813232421875, -0.40826416015625, -0.335205078125, -0.26214599609375, -0.1890869140625, -0.11602783203125, -0.04296875, 0.03009033203125, 0.1031494140625, 0.17620849609375, 0.249267578125, 0.32232666015625, 0.3953857421875, 0.46844482421875, 0.54150390625, 0.61456298828125, 0.6876220703125, 0.76068115234375, 0.833740234375, 0.90679931640625, 0.9798583984375, 1.05291748046875, 1.1259765625, 1.19903564453125, 1.2720947265625, 1.34515380859375, 1.418212890625, 1.49127197265625, 1.5643310546875, 1.63739013671875, 1.71044921875, 1.78350830078125, 1.8565673828125, 1.92962646484375, 2.002685546875, 2.07574462890625, 2.1488037109375, 2.22186279296875, 2.294921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 8.0, 16.0, 38.0, 51.0, 93.0, 130.0, 234.0, 163.0, 93.0, 45.0, 39.0, 27.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.77720260620117, -56.64575958251953, -54.514320373535156, -52.382877349853516, -50.25143814086914, -48.1199951171875, -45.988555908203125, -43.857112884521484, -41.725669860839844, -39.5942268371582, -37.46278762817383, -35.33134460449219, -33.19990539550781, -31.068462371826172, -28.937021255493164, -26.805580139160156, -24.67414093017578, -22.542699813842773, -20.411258697509766, -18.279815673828125, -16.14837646484375, -14.016934394836426, -11.885492324829102, -9.754051208496094, -7.622610092163086, -5.491168975830078, -3.359727382659912, -1.228285789489746, 0.9031553268432617, 3.0345964431762695, 5.166038513183594, 7.297479629516602, 9.428916931152344, 11.560358047485352, 13.69179916381836, 15.823241233825684, 17.954681396484375, 20.086124420166016, 22.217565536499023, 24.34900665283203, 26.48044776916504, 28.611888885498047, 30.743330001831055, 32.87477111816406, 35.0062141418457, 37.13765335083008, 39.26909637451172, 41.400535583496094, 43.531978607177734, 45.663421630859375, 47.79486083984375, 49.92630386352539, 52.057743072509766, 54.189186096191406, 56.32062530517578, 58.45206832885742, 60.58351135253906, 62.7149543762207, 64.84639739990234, 66.97783660888672, 69.1092758178711, 71.24071502685547, 73.37216186523438, 75.50360107421875, 77.63504028320312]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 9.0, 7.0, 11.0, 10.0, 17.0, 26.0, 30.0, 24.0, 34.0, 38.0, 45.0, 63.0, 99.0, 130.0, 100.0, 70.0, 59.0, 40.0, 41.0, 32.0, 23.0, 23.0, 9.0, 13.0, 9.0, 12.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-107.55998229980469, -104.90193939208984, -102.243896484375, -99.58584594726562, -96.92780303955078, -94.26976013183594, -91.61170959472656, -88.95366668701172, -86.29562377929688, -83.63758087158203, -80.97953796386719, -78.32148742675781, -75.66344451904297, -73.00540161132812, -70.34735107421875, -67.6893081665039, -65.03126525878906, -62.37322235107422, -59.71517562866211, -57.05712890625, -54.399085998535156, -51.74104309082031, -49.0829963684082, -46.424949645996094, -43.76690673828125, -41.108863830566406, -38.4508171081543, -35.79277038574219, -33.134727478027344, -30.476682662963867, -27.81863784790039, -25.160593032836914, -22.502540588378906, -19.84449577331543, -17.186450958251953, -14.528406143188477, -11.870361328125, -9.212316513061523, -6.554271697998047, -3.8962268829345703, -1.2381820678710938, 1.4198627471923828, 4.077907562255859, 6.735952377319336, 9.393997192382812, 12.052042007446289, 14.710086822509766, 17.368131637573242, 20.02617645263672, 22.684221267700195, 25.342266082763672, 28.00031089782715, 30.658355712890625, 33.31639862060547, 35.97444534301758, 38.63249206542969, 41.29053497314453, 43.948577880859375, 46.606624603271484, 49.264671325683594, 51.92271423339844, 54.58075714111328, 57.23880386352539, 59.8968505859375, 62.554893493652344]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 5.0, 3.0, 11.0, 13.0, 16.0, 30.0, 32.0, 53.0, 72.0, 104.0, 172.0, 238.0, 456.0, 779.0, 1331.0, 2688.0, 5988.0, 16412.0, 63984.0, 385464.0, 2173948.0, 1301532.0, 186890.0, 34750.0, 10406.0, 4158.0, 2027.0, 1087.0, 556.0, 380.0, 230.0, 154.0, 86.0, 63.0, 38.0, 30.0, 29.0, 22.0, 17.0, 7.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.47076416015625, -6.2735595703125, -6.07635498046875, -5.879150390625, -5.68194580078125, -5.4847412109375, -5.28753662109375, -5.09033203125, -4.89312744140625, -4.6959228515625, -4.49871826171875, -4.301513671875, -4.10430908203125, -3.9071044921875, -3.70989990234375, -3.5126953125, -3.31549072265625, -3.1182861328125, -2.92108154296875, -2.723876953125, -2.52667236328125, -2.3294677734375, -2.13226318359375, -1.93505859375, -1.73785400390625, -1.5406494140625, -1.34344482421875, -1.146240234375, -0.94903564453125, -0.7518310546875, -0.55462646484375, -0.357421875, -0.16021728515625, 0.0369873046875, 0.23419189453125, 0.431396484375, 0.62860107421875, 0.8258056640625, 1.02301025390625, 1.22021484375, 1.41741943359375, 1.6146240234375, 1.81182861328125, 2.009033203125, 2.20623779296875, 2.4034423828125, 2.60064697265625, 2.7978515625, 2.99505615234375, 3.1922607421875, 3.38946533203125, 3.586669921875, 3.78387451171875, 3.9810791015625, 4.17828369140625, 4.37548828125, 4.57269287109375, 4.7698974609375, 4.96710205078125, 5.164306640625, 5.36151123046875, 5.5587158203125, 5.75592041015625, 5.953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 8.0, 8.0, 22.0, 20.0, 20.0, 31.0, 30.0, 40.0, 46.0, 60.0, 51.0, 67.0, 62.0, 63.0, 58.0, 65.0, 62.0, 56.0, 31.0, 37.0, 22.0, 32.0, 24.0, 23.0, 17.0, 11.0, 10.0, 6.0, 4.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.0697021484375, -3.889404296875, -3.7091064453125, -3.52880859375, -3.3485107421875, -3.168212890625, -2.9879150390625, -2.8076171875, -2.6273193359375, -2.447021484375, -2.2667236328125, -2.08642578125, -1.9061279296875, -1.725830078125, -1.5455322265625, -1.365234375, -1.1849365234375, -1.004638671875, -0.8243408203125, -0.64404296875, -0.4637451171875, -0.283447265625, -0.1031494140625, 0.0771484375, 0.2574462890625, 0.437744140625, 0.6180419921875, 0.79833984375, 0.9786376953125, 1.158935546875, 1.3392333984375, 1.51953125, 1.6998291015625, 1.880126953125, 2.0604248046875, 2.24072265625, 2.4210205078125, 2.601318359375, 2.7816162109375, 2.9619140625, 3.1422119140625, 3.322509765625, 3.5028076171875, 3.68310546875, 3.8634033203125, 4.043701171875, 4.2239990234375, 4.404296875, 4.5845947265625, 4.764892578125, 4.9451904296875, 5.12548828125, 5.3057861328125, 5.486083984375, 5.6663818359375, 5.8466796875, 6.0269775390625, 6.207275390625, 6.3875732421875, 6.56787109375, 6.7481689453125, 6.928466796875, 7.1087646484375, 7.2890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 21.0, 34.0, 50.0, 99.0, 179.0, 317.0, 832.0, 2916.0, 40003.0, 4038903.0, 104402.0, 4534.0, 1016.0, 445.0, 235.0, 123.0, 62.0, 31.0, 20.0, 18.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.640625, -28.7587890625, -27.876953125, -26.9951171875, -26.11328125, -25.2314453125, -24.349609375, -23.4677734375, -22.5859375, -21.7041015625, -20.822265625, -19.9404296875, -19.05859375, -18.1767578125, -17.294921875, -16.4130859375, -15.53125, -14.6494140625, -13.767578125, -12.8857421875, -12.00390625, -11.1220703125, -10.240234375, -9.3583984375, -8.4765625, -7.5947265625, -6.712890625, -5.8310546875, -4.94921875, -4.0673828125, -3.185546875, -2.3037109375, -1.421875, -0.5400390625, 0.341796875, 1.2236328125, 2.10546875, 2.9873046875, 3.869140625, 4.7509765625, 5.6328125, 6.5146484375, 7.396484375, 8.2783203125, 9.16015625, 10.0419921875, 10.923828125, 11.8056640625, 12.6875, 13.5693359375, 14.451171875, 15.3330078125, 16.21484375, 17.0966796875, 17.978515625, 18.8603515625, 19.7421875, 20.6240234375, 21.505859375, 22.3876953125, 23.26953125, 24.1513671875, 25.033203125, 25.9150390625, 26.796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 16.0, 31.0, 41.0, 71.0, 153.0, 431.0, 939.0, 1214.0, 637.0, 272.0, 126.0, 53.0, 26.0, 16.0, 11.0, 9.0, 10.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.9375, -19.338623046875, -18.73974609375, -18.140869140625, -17.5419921875, -16.943115234375, -16.34423828125, -15.745361328125, -15.146484375, -14.547607421875, -13.94873046875, -13.349853515625, -12.7509765625, -12.152099609375, -11.55322265625, -10.954345703125, -10.35546875, -9.756591796875, -9.15771484375, -8.558837890625, -7.9599609375, -7.361083984375, -6.76220703125, -6.163330078125, -5.564453125, -4.965576171875, -4.36669921875, -3.767822265625, -3.1689453125, -2.570068359375, -1.97119140625, -1.372314453125, -0.7734375, -0.174560546875, 0.42431640625, 1.023193359375, 1.6220703125, 2.220947265625, 2.81982421875, 3.418701171875, 4.017578125, 4.616455078125, 5.21533203125, 5.814208984375, 6.4130859375, 7.011962890625, 7.61083984375, 8.209716796875, 8.80859375, 9.407470703125, 10.00634765625, 10.605224609375, 11.2041015625, 11.802978515625, 12.40185546875, 13.000732421875, 13.599609375, 14.198486328125, 14.79736328125, 15.396240234375, 15.9951171875, 16.593994140625, 17.19287109375, 17.791748046875, 18.390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 10.0, 10.0, 37.0, 78.0, 169.0, 262.0, 234.0, 109.0, 53.0, 16.0, 10.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.4344940185547, -149.5614776611328, -144.68846130371094, -139.81544494628906, -134.9424285888672, -130.0694122314453, -125.19640350341797, -120.3233871459961, -115.45037078857422, -110.57735443115234, -105.70433807373047, -100.8313217163086, -95.95831298828125, -91.08529663085938, -86.2122802734375, -81.33926391601562, -76.46624755859375, -71.59323120117188, -66.72021484375, -61.84720230102539, -56.974185943603516, -52.10116958618164, -47.22815704345703, -42.355140686035156, -37.48212432861328, -32.609107971191406, -27.736093521118164, -22.863079071044922, -17.990062713623047, -13.117046356201172, -8.24403190612793, -3.3710174560546875, 1.50201416015625, 6.375029563903809, 11.248044967651367, 16.12105941772461, 20.994075775146484, 25.86709213256836, 30.7401065826416, 35.613121032714844, 40.48613739013672, 45.359153747558594, 50.23217010498047, 55.10518264770508, 59.97819900512695, 64.85121154785156, 69.72422790527344, 74.59724426269531, 79.47026062011719, 84.34327697753906, 89.21629333496094, 94.08930969238281, 98.96232604980469, 103.83534240722656, 108.7083511352539, 113.58136749267578, 118.45438385009766, 123.32740020751953, 128.20040893554688, 133.07342529296875, 137.94644165039062, 142.8194580078125, 147.69247436523438, 152.56549072265625, 157.43850708007812]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 8.0, 9.0, 12.0, 8.0, 14.0, 23.0, 15.0, 17.0, 12.0, 23.0, 24.0, 24.0, 28.0, 44.0, 42.0, 51.0, 47.0, 47.0, 48.0, 40.0, 35.0, 42.0, 51.0, 42.0, 27.0, 33.0, 27.0, 30.0, 24.0, 24.0, 13.0, 19.0, 8.0, 12.0, 13.0, 12.0, 7.0, 4.0, 8.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.855377197265625, -44.46354675292969, -43.071712493896484, -41.67987823486328, -40.288047790527344, -38.896217346191406, -37.5043830871582, -36.112548828125, -34.72071838378906, -33.328887939453125, -31.937053680419922, -30.54522132873535, -29.15338897705078, -27.76155662536621, -26.36972427368164, -24.97789192199707, -23.5860595703125, -22.19422721862793, -20.80239486694336, -19.41056251525879, -18.01873016357422, -16.62689781188965, -15.235065460205078, -13.843233108520508, -12.451400756835938, -11.059568405151367, -9.667736053466797, -8.275903701782227, -6.884071350097656, -5.492238998413086, -4.100406646728516, -2.7085742950439453, -1.3167381286621094, 0.07509422302246094, 1.4669265747070312, 2.8587589263916016, 4.250591278076172, 5.642423629760742, 7.0342559814453125, 8.426088333129883, 9.817920684814453, 11.209753036499023, 12.601585388183594, 13.993417739868164, 15.385250091552734, 16.777082443237305, 18.168914794921875, 19.560747146606445, 20.952579498291016, 22.344411849975586, 23.736244201660156, 25.128076553344727, 26.519908905029297, 27.911741256713867, 29.303573608398438, 30.695405960083008, 32.08723831176758, 33.47907257080078, 34.87090301513672, 36.262733459472656, 37.65456771850586, 39.04640197753906, 40.438232421875, 41.83006286621094, 43.22189712524414]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 10.0, 21.0, 19.0, 28.0, 47.0, 47.0, 84.0, 117.0, 207.0, 342.0, 601.0, 1119.0, 2016.0, 3958.0, 8105.0, 18228.0, 44034.0, 116403.0, 302669.0, 330459.0, 131433.0, 49698.0, 20584.0, 9044.0, 4273.0, 2216.0, 1142.0, 635.0, 395.0, 228.0, 139.0, 103.0, 50.0, 24.0, 20.0, 17.0, 12.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.49615478515625, -5.2852783203125, -5.07440185546875, -4.863525390625, -4.65264892578125, -4.4417724609375, -4.23089599609375, -4.02001953125, -3.80914306640625, -3.5982666015625, -3.38739013671875, -3.176513671875, -2.96563720703125, -2.7547607421875, -2.54388427734375, -2.3330078125, -2.12213134765625, -1.9112548828125, -1.70037841796875, -1.489501953125, -1.27862548828125, -1.0677490234375, -0.85687255859375, -0.64599609375, -0.43511962890625, -0.2242431640625, -0.01336669921875, 0.197509765625, 0.40838623046875, 0.6192626953125, 0.83013916015625, 1.041015625, 1.25189208984375, 1.4627685546875, 1.67364501953125, 1.884521484375, 2.09539794921875, 2.3062744140625, 2.51715087890625, 2.72802734375, 2.93890380859375, 3.1497802734375, 3.36065673828125, 3.571533203125, 3.78240966796875, 3.9932861328125, 4.20416259765625, 4.4150390625, 4.62591552734375, 4.8367919921875, 5.04766845703125, 5.258544921875, 5.46942138671875, 5.6802978515625, 5.89117431640625, 6.10205078125, 6.31292724609375, 6.5238037109375, 6.73468017578125, 6.945556640625, 7.15643310546875, 7.3673095703125, 7.57818603515625, 7.7890625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 5.0, 2.0, 7.0, 6.0, 13.0, 9.0, 17.0, 18.0, 23.0, 27.0, 33.0, 27.0, 30.0, 53.0, 54.0, 36.0, 67.0, 36.0, 62.0, 66.0, 53.0, 50.0, 29.0, 48.0, 40.0, 34.0, 34.0, 20.0, 25.0, 16.0, 15.0, 19.0, 11.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.564178466796875, -3.39202880859375, -3.219879150390625, -3.0477294921875, -2.875579833984375, -2.70343017578125, -2.531280517578125, -2.359130859375, -2.186981201171875, -2.01483154296875, -1.842681884765625, -1.6705322265625, -1.498382568359375, -1.32623291015625, -1.154083251953125, -0.98193359375, -0.809783935546875, -0.63763427734375, -0.465484619140625, -0.2933349609375, -0.121185302734375, 0.05096435546875, 0.223114013671875, 0.395263671875, 0.567413330078125, 0.73956298828125, 0.911712646484375, 1.0838623046875, 1.256011962890625, 1.42816162109375, 1.600311279296875, 1.7724609375, 1.944610595703125, 2.11676025390625, 2.288909912109375, 2.4610595703125, 2.633209228515625, 2.80535888671875, 2.977508544921875, 3.149658203125, 3.321807861328125, 3.49395751953125, 3.666107177734375, 3.8382568359375, 4.010406494140625, 4.18255615234375, 4.354705810546875, 4.52685546875, 4.699005126953125, 4.87115478515625, 5.043304443359375, 5.2154541015625, 5.387603759765625, 5.55975341796875, 5.731903076171875, 5.904052734375, 6.076202392578125, 6.24835205078125, 6.420501708984375, 6.5926513671875, 6.764801025390625, 6.93695068359375, 7.109100341796875, 7.28125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 13.0, 15.0, 22.0, 40.0, 43.0, 49.0, 76.0, 104.0, 167.0, 225.0, 333.0, 506.0, 813.0, 1433.0, 3047.0, 8825.0, 39702.0, 567602.0, 372852.0, 37637.0, 8285.0, 3057.0, 1386.0, 814.0, 477.0, 317.0, 198.0, 150.0, 106.0, 55.0, 53.0, 35.0, 25.0, 17.0, 19.0, 12.0, 8.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -11.963134765625, -11.53564453125, -11.108154296875, -10.6806640625, -10.253173828125, -9.82568359375, -9.398193359375, -8.970703125, -8.543212890625, -8.11572265625, -7.688232421875, -7.2607421875, -6.833251953125, -6.40576171875, -5.978271484375, -5.55078125, -5.123291015625, -4.69580078125, -4.268310546875, -3.8408203125, -3.413330078125, -2.98583984375, -2.558349609375, -2.130859375, -1.703369140625, -1.27587890625, -0.848388671875, -0.4208984375, 0.006591796875, 0.43408203125, 0.861572265625, 1.2890625, 1.716552734375, 2.14404296875, 2.571533203125, 2.9990234375, 3.426513671875, 3.85400390625, 4.281494140625, 4.708984375, 5.136474609375, 5.56396484375, 5.991455078125, 6.4189453125, 6.846435546875, 7.27392578125, 7.701416015625, 8.12890625, 8.556396484375, 8.98388671875, 9.411376953125, 9.8388671875, 10.266357421875, 10.69384765625, 11.121337890625, 11.548828125, 11.976318359375, 12.40380859375, 12.831298828125, 13.2587890625, 13.686279296875, 14.11376953125, 14.541259765625, 14.96875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 11.0, 5.0, 12.0, 12.0, 27.0, 26.0, 31.0, 45.0, 45.0, 48.0, 52.0, 57.0, 76.0, 66.0, 57.0, 57.0, 62.0, 47.0, 42.0, 40.0, 29.0, 33.0, 21.0, 17.0, 9.0, 8.0, 12.0, 13.0, 10.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.301025390625, -17.61767578125, -16.934326171875, -16.2509765625, -15.567626953125, -14.88427734375, -14.200927734375, -13.517578125, -12.834228515625, -12.15087890625, -11.467529296875, -10.7841796875, -10.100830078125, -9.41748046875, -8.734130859375, -8.05078125, -7.367431640625, -6.68408203125, -6.000732421875, -5.3173828125, -4.634033203125, -3.95068359375, -3.267333984375, -2.583984375, -1.900634765625, -1.21728515625, -0.533935546875, 0.1494140625, 0.832763671875, 1.51611328125, 2.199462890625, 2.8828125, 3.566162109375, 4.24951171875, 4.932861328125, 5.6162109375, 6.299560546875, 6.98291015625, 7.666259765625, 8.349609375, 9.032958984375, 9.71630859375, 10.399658203125, 11.0830078125, 11.766357421875, 12.44970703125, 13.133056640625, 13.81640625, 14.499755859375, 15.18310546875, 15.866455078125, 16.5498046875, 17.233154296875, 17.91650390625, 18.599853515625, 19.283203125, 19.966552734375, 20.64990234375, 21.333251953125, 22.0166015625, 22.699951171875, 23.38330078125, 24.066650390625, 24.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 19.0, 31.0, 52.0, 70.0, 131.0, 283.0, 606.0, 2123.0, 11576.0, 183989.0, 821315.0, 23349.0, 3341.0, 871.0, 341.0, 167.0, 88.0, 56.0, 43.0, 24.0, 21.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.06463623046875, -5.8870849609375, -5.70953369140625, -5.531982421875, -5.35443115234375, -5.1768798828125, -4.99932861328125, -4.82177734375, -4.64422607421875, -4.4666748046875, -4.28912353515625, -4.111572265625, -3.93402099609375, -3.7564697265625, -3.57891845703125, -3.4013671875, -3.22381591796875, -3.0462646484375, -2.86871337890625, -2.691162109375, -2.51361083984375, -2.3360595703125, -2.15850830078125, -1.98095703125, -1.80340576171875, -1.6258544921875, -1.44830322265625, -1.270751953125, -1.09320068359375, -0.9156494140625, -0.73809814453125, -0.560546875, -0.38299560546875, -0.2054443359375, -0.02789306640625, 0.149658203125, 0.32720947265625, 0.5047607421875, 0.68231201171875, 0.85986328125, 1.03741455078125, 1.2149658203125, 1.39251708984375, 1.570068359375, 1.74761962890625, 1.9251708984375, 2.10272216796875, 2.2802734375, 2.45782470703125, 2.6353759765625, 2.81292724609375, 2.990478515625, 3.16802978515625, 3.3455810546875, 3.52313232421875, 3.70068359375, 3.87823486328125, 4.0557861328125, 4.23333740234375, 4.410888671875, 4.58843994140625, 4.7659912109375, 4.94354248046875, 5.12109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 22.0, 45.0, 92.0, 355.0, 253.0, 82.0, 48.0, 24.0, 15.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002925872802734375, -0.0028340518474578857, -0.0027422308921813965, -0.0026504099369049072, -0.002558588981628418, -0.0024667680263519287, -0.0023749470710754395, -0.00228312611579895, -0.002191305160522461, -0.0020994842052459717, -0.0020076632499694824, -0.0019158422946929932, -0.001824021339416504, -0.0017322003841400146, -0.0016403794288635254, -0.0015485584735870361, -0.0014567375183105469, -0.0013649165630340576, -0.0012730956077575684, -0.001181274652481079, -0.0010894536972045898, -0.0009976327419281006, -0.0009058117866516113, -0.0008139908313751221, -0.0007221698760986328, -0.0006303489208221436, -0.0005385279655456543, -0.00044670701026916504, -0.0003548860549926758, -0.0002630650997161865, -0.00017124414443969727, -7.942318916320801e-05, 1.239776611328125e-05, 0.00010421872138977051, 0.00019603967666625977, 0.000287860631942749, 0.0003796815872192383, 0.00047150254249572754, 0.0005633234977722168, 0.0006551444530487061, 0.0007469654083251953, 0.0008387863636016846, 0.0009306073188781738, 0.001022428274154663, 0.0011142492294311523, 0.0012060701847076416, 0.0012978911399841309, 0.0013897120952606201, 0.0014815330505371094, 0.0015733540058135986, 0.0016651749610900879, 0.0017569959163665771, 0.0018488168716430664, 0.0019406378269195557, 0.002032458782196045, 0.002124279737472534, 0.0022161006927490234, 0.0023079216480255127, 0.002399742603302002, 0.002491563558578491, 0.0025833845138549805, 0.0026752054691314697, 0.002767026424407959, 0.0028588473796844482, 0.0029506683349609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 12.0, 34.0, 45.0, 48.0, 82.0, 108.0, 210.0, 312.0, 537.0, 1038.0, 2166.0, 5757.0, 18507.0, 86569.0, 742341.0, 149409.0, 27861.0, 7715.0, 2833.0, 1264.0, 669.0, 386.0, 250.0, 131.0, 91.0, 53.0, 43.0, 25.0, 12.0, 10.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.417938232421875, -3.31634521484375, -3.214752197265625, -3.1131591796875, -3.011566162109375, -2.90997314453125, -2.808380126953125, -2.706787109375, -2.605194091796875, -2.50360107421875, -2.402008056640625, -2.3004150390625, -2.198822021484375, -2.09722900390625, -1.995635986328125, -1.89404296875, -1.792449951171875, -1.69085693359375, -1.589263916015625, -1.4876708984375, -1.386077880859375, -1.28448486328125, -1.182891845703125, -1.081298828125, -0.979705810546875, -0.87811279296875, -0.776519775390625, -0.6749267578125, -0.573333740234375, -0.47174072265625, -0.370147705078125, -0.2685546875, -0.166961669921875, -0.06536865234375, 0.036224365234375, 0.1378173828125, 0.239410400390625, 0.34100341796875, 0.442596435546875, 0.544189453125, 0.645782470703125, 0.74737548828125, 0.848968505859375, 0.9505615234375, 1.052154541015625, 1.15374755859375, 1.255340576171875, 1.35693359375, 1.458526611328125, 1.56011962890625, 1.661712646484375, 1.7633056640625, 1.864898681640625, 1.96649169921875, 2.068084716796875, 2.169677734375, 2.271270751953125, 2.37286376953125, 2.474456787109375, 2.5760498046875, 2.677642822265625, 2.77923583984375, 2.880828857421875, 2.982421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 5.0, 11.0, 14.0, 20.0, 25.0, 46.0, 56.0, 68.0, 89.0, 132.0, 139.0, 113.0, 69.0, 50.0, 23.0, 32.0, 26.0, 15.0, 21.0, 11.0, 12.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.875335693359375, -4.75067138671875, -4.626007080078125, -4.5013427734375, -4.376678466796875, -4.25201416015625, -4.127349853515625, -4.002685546875, -3.878021240234375, -3.75335693359375, -3.628692626953125, -3.5040283203125, -3.379364013671875, -3.25469970703125, -3.130035400390625, -3.00537109375, -2.880706787109375, -2.75604248046875, -2.631378173828125, -2.5067138671875, -2.382049560546875, -2.25738525390625, -2.132720947265625, -2.008056640625, -1.883392333984375, -1.75872802734375, -1.634063720703125, -1.5093994140625, -1.384735107421875, -1.26007080078125, -1.135406494140625, -1.0107421875, -0.886077880859375, -0.76141357421875, -0.636749267578125, -0.5120849609375, -0.387420654296875, -0.26275634765625, -0.138092041015625, -0.013427734375, 0.111236572265625, 0.23590087890625, 0.360565185546875, 0.4852294921875, 0.609893798828125, 0.73455810546875, 0.859222412109375, 0.98388671875, 1.108551025390625, 1.23321533203125, 1.357879638671875, 1.4825439453125, 1.607208251953125, 1.73187255859375, 1.856536865234375, 1.981201171875, 2.105865478515625, 2.23052978515625, 2.355194091796875, 2.4798583984375, 2.604522705078125, 2.72918701171875, 2.853851318359375, 2.978515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 13.0, 36.0, 88.0, 422.0, 321.0, 79.0, 24.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.60452270507812, -99.35810852050781, -93.1116943359375, -86.86528015136719, -80.6188735961914, -74.3724594116211, -68.12604522705078, -61.879634857177734, -55.63322067260742, -49.38680648803711, -43.14039611816406, -36.89398193359375, -30.64756965637207, -24.40115737915039, -18.154743194580078, -11.908332824707031, -5.661918640136719, 0.5844941139221191, 6.830906867980957, 13.077320098876953, 19.323732376098633, 25.570144653320312, 31.816558837890625, 38.06296920776367, 44.309383392333984, 50.5557975769043, 56.802207946777344, 63.048622131347656, 69.29503631591797, 75.54144287109375, 81.78785705566406, 88.03427124023438, 94.28068542480469, 100.527099609375, 106.77351379394531, 113.01992797851562, 119.2663345336914, 125.51274871826172, 131.7591552734375, 138.0055694580078, 144.25198364257812, 150.49839782714844, 156.74481201171875, 162.99122619628906, 169.23764038085938, 175.48403930664062, 181.73046875, 187.97686767578125, 194.22329711914062, 200.46971130371094, 206.71612548828125, 212.96253967285156, 219.20895385742188, 225.45535278320312, 231.7017822265625, 237.94818115234375, 244.19459533691406, 250.44100952148438, 256.6874084472656, 262.933837890625, 269.18023681640625, 275.4266662597656, 281.6730651855469, 287.91949462890625, 294.1658935546875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 6.0, 13.0, 13.0, 12.0, 16.0, 17.0, 31.0, 24.0, 34.0, 34.0, 37.0, 41.0, 41.0, 112.0, 139.0, 80.0, 40.0, 35.0, 29.0, 20.0, 30.0, 20.0, 19.0, 28.0, 18.0, 14.0, 17.0, 10.0, 9.0, 10.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-90.8123550415039, -88.3792495727539, -85.94615173339844, -83.51304626464844, -81.07994842529297, -78.64684295654297, -76.2137451171875, -73.7806396484375, -71.3475341796875, -68.9144287109375, -66.48133087158203, -64.04822540283203, -61.61512756347656, -59.18202209472656, -56.74892044067383, -54.315818786621094, -51.882720947265625, -49.44961929321289, -47.016517639160156, -44.58341598510742, -42.15031433105469, -39.71720886230469, -37.28410720825195, -34.85100555419922, -32.417903900146484, -29.98480224609375, -27.551700592041016, -25.11859703063965, -22.685495376586914, -20.25239372253418, -17.819290161132812, -15.386188507080078, -12.953079223632812, -10.519977569580078, -8.086874961853027, -5.653772830963135, -3.220670700073242, -0.7875690460205078, 1.645533561706543, 4.078636169433594, 6.511737823486328, 8.944839477539062, 11.377942085266113, 13.811044692993164, 16.2441463470459, 18.677248001098633, 21.1103515625, 23.543453216552734, 25.97655487060547, 28.409656524658203, 30.842758178710938, 33.27585983276367, 35.708961486816406, 38.142066955566406, 40.57516860961914, 43.008270263671875, 45.44137191772461, 47.874473571777344, 50.30757522583008, 52.74067687988281, 55.17378234863281, 57.60688018798828, 60.03998565673828, 62.473087310791016, 64.90618896484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 9.0, 30.0, 30.0, 38.0, 66.0, 116.0, 196.0, 310.0, 463.0, 780.0, 1394.0, 2379.0, 5171.0, 10946.0, 29807.0, 123403.0, 683168.0, 2138630.0, 964113.0, 173154.0, 36361.0, 12033.0, 5245.0, 2577.0, 1480.0, 858.0, 555.0, 341.0, 225.0, 128.0, 87.0, 48.0, 45.0, 23.0, 20.0, 11.0, 8.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1796875, -5.955810546875, -5.73193359375, -5.508056640625, -5.2841796875, -5.060302734375, -4.83642578125, -4.612548828125, -4.388671875, -4.164794921875, -3.94091796875, -3.717041015625, -3.4931640625, -3.269287109375, -3.04541015625, -2.821533203125, -2.59765625, -2.373779296875, -2.14990234375, -1.926025390625, -1.7021484375, -1.478271484375, -1.25439453125, -1.030517578125, -0.806640625, -0.582763671875, -0.35888671875, -0.135009765625, 0.0888671875, 0.312744140625, 0.53662109375, 0.760498046875, 0.984375, 1.208251953125, 1.43212890625, 1.656005859375, 1.8798828125, 2.103759765625, 2.32763671875, 2.551513671875, 2.775390625, 2.999267578125, 3.22314453125, 3.447021484375, 3.6708984375, 3.894775390625, 4.11865234375, 4.342529296875, 4.56640625, 4.790283203125, 5.01416015625, 5.238037109375, 5.4619140625, 5.685791015625, 5.90966796875, 6.133544921875, 6.357421875, 6.581298828125, 6.80517578125, 7.029052734375, 7.2529296875, 7.476806640625, 7.70068359375, 7.924560546875, 8.1484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 9.0, 15.0, 20.0, 23.0, 29.0, 26.0, 29.0, 31.0, 54.0, 37.0, 56.0, 67.0, 65.0, 59.0, 63.0, 55.0, 50.0, 52.0, 47.0, 45.0, 28.0, 25.0, 14.0, 19.0, 14.0, 22.0, 8.0, 12.0, 3.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.548431396484375, -3.37615966796875, -3.203887939453125, -3.0316162109375, -2.859344482421875, -2.68707275390625, -2.514801025390625, -2.342529296875, -2.170257568359375, -1.99798583984375, -1.825714111328125, -1.6534423828125, -1.481170654296875, -1.30889892578125, -1.136627197265625, -0.96435546875, -0.792083740234375, -0.61981201171875, -0.447540283203125, -0.2752685546875, -0.102996826171875, 0.06927490234375, 0.241546630859375, 0.413818359375, 0.586090087890625, 0.75836181640625, 0.930633544921875, 1.1029052734375, 1.275177001953125, 1.44744873046875, 1.619720458984375, 1.7919921875, 1.964263916015625, 2.13653564453125, 2.308807373046875, 2.4810791015625, 2.653350830078125, 2.82562255859375, 2.997894287109375, 3.170166015625, 3.342437744140625, 3.51470947265625, 3.686981201171875, 3.8592529296875, 4.031524658203125, 4.20379638671875, 4.376068115234375, 4.54833984375, 4.720611572265625, 4.89288330078125, 5.065155029296875, 5.2374267578125, 5.409698486328125, 5.58197021484375, 5.754241943359375, 5.926513671875, 6.098785400390625, 6.27105712890625, 6.443328857421875, 6.6156005859375, 6.787872314453125, 6.96014404296875, 7.132415771484375, 7.3046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 18.0, 39.0, 58.0, 147.0, 308.0, 783.0, 6136.0, 4172055.0, 13003.0, 1059.0, 375.0, 157.0, 66.0, 31.0, 23.0, 11.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-96.75, -93.869140625, -90.98828125, -88.107421875, -85.2265625, -82.345703125, -79.46484375, -76.583984375, -73.703125, -70.822265625, -67.94140625, -65.060546875, -62.1796875, -59.298828125, -56.41796875, -53.537109375, -50.65625, -47.775390625, -44.89453125, -42.013671875, -39.1328125, -36.251953125, -33.37109375, -30.490234375, -27.609375, -24.728515625, -21.84765625, -18.966796875, -16.0859375, -13.205078125, -10.32421875, -7.443359375, -4.5625, -1.681640625, 1.19921875, 4.080078125, 6.9609375, 9.841796875, 12.72265625, 15.603515625, 18.484375, 21.365234375, 24.24609375, 27.126953125, 30.0078125, 32.888671875, 35.76953125, 38.650390625, 41.53125, 44.412109375, 47.29296875, 50.173828125, 53.0546875, 55.935546875, 58.81640625, 61.697265625, 64.578125, 67.458984375, 70.33984375, 73.220703125, 76.1015625, 78.982421875, 81.86328125, 84.744140625, 87.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 15.0, 22.0, 65.0, 154.0, 337.0, 1228.0, 1524.0, 441.0, 143.0, 72.0, 37.0, 23.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.578125, -15.314208984375, -14.05029296875, -12.786376953125, -11.5224609375, -10.258544921875, -8.99462890625, -7.730712890625, -6.466796875, -5.202880859375, -3.93896484375, -2.675048828125, -1.4111328125, -0.147216796875, 1.11669921875, 2.380615234375, 3.64453125, 4.908447265625, 6.17236328125, 7.436279296875, 8.7001953125, 9.964111328125, 11.22802734375, 12.491943359375, 13.755859375, 15.019775390625, 16.28369140625, 17.547607421875, 18.8115234375, 20.075439453125, 21.33935546875, 22.603271484375, 23.8671875, 25.131103515625, 26.39501953125, 27.658935546875, 28.9228515625, 30.186767578125, 31.45068359375, 32.714599609375, 33.978515625, 35.242431640625, 36.50634765625, 37.770263671875, 39.0341796875, 40.298095703125, 41.56201171875, 42.825927734375, 44.08984375, 45.353759765625, 46.61767578125, 47.881591796875, 49.1455078125, 50.409423828125, 51.67333984375, 52.937255859375, 54.201171875, 55.465087890625, 56.72900390625, 57.992919921875, 59.2568359375, 60.520751953125, 61.78466796875, 63.048583984375, 64.3125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 11.0, 12.0, 25.0, 56.0, 104.0, 253.0, 262.0, 142.0, 54.0, 31.0, 17.0, 7.0, 4.0, 5.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.2028503417969, -248.6716766357422, -239.1405029296875, -229.6093292236328, -220.07815551757812, -210.54698181152344, -201.01580810546875, -191.48463439941406, -181.95346069335938, -172.4222869873047, -162.89111328125, -153.3599395751953, -143.82876586914062, -134.29759216308594, -124.76641845703125, -115.23524475097656, -105.70407104492188, -96.17289733886719, -86.6417236328125, -77.11054992675781, -67.57937622070312, -58.04820251464844, -48.51702880859375, -38.98585510253906, -29.454681396484375, -19.923507690429688, -10.392333984375, -0.8611602783203125, 8.670013427734375, 18.201187133789062, 27.73236083984375, 37.26353454589844, 46.794677734375, 56.32585144042969, 65.85702514648438, 75.38819885253906, 84.91937255859375, 94.45054626464844, 103.98171997070312, 113.51289367675781, 123.0440673828125, 132.5752410888672, 142.10641479492188, 151.63758850097656, 161.16876220703125, 170.69993591308594, 180.23110961914062, 189.7622833251953, 199.29345703125, 208.8246307373047, 218.35580444335938, 227.88697814941406, 237.41815185546875, 246.94932556152344, 256.4804992675781, 266.01165771484375, 275.5428466796875, 285.07403564453125, 294.6051940917969, 304.1363525390625, 313.66754150390625, 323.19873046875, 332.7298889160156, 342.26104736328125, 351.792236328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 10.0, 15.0, 16.0, 26.0, 22.0, 35.0, 33.0, 36.0, 51.0, 49.0, 59.0, 57.0, 63.0, 70.0, 52.0, 55.0, 38.0, 41.0, 44.0, 27.0, 32.0, 31.0, 18.0, 8.0, 11.0, 16.0, 9.0, 6.0, 6.0, 7.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-110.79570007324219, -107.67374420166016, -104.5517807006836, -101.42982482910156, -98.30786895751953, -95.18590545654297, -92.06394958496094, -88.94198608398438, -85.82003021240234, -82.69807434082031, -79.57611083984375, -76.45415496826172, -73.33219909667969, -70.21023559570312, -67.0882797241211, -63.9663200378418, -60.844364166259766, -57.72240447998047, -54.60044860839844, -51.47848892211914, -48.356529235839844, -45.23457336425781, -42.112613677978516, -38.99065399169922, -35.86869812011719, -32.74673843383789, -29.624780654907227, -26.502822875976562, -23.380863189697266, -20.2589054107666, -17.136947631835938, -14.01498794555664, -10.893028259277344, -7.771069526672363, -4.649111270904541, -1.5271530151367188, 1.5948057174682617, 4.716764450073242, 7.838722229003906, 10.960681915283203, 14.082639694213867, 17.20459747314453, 20.326557159423828, 23.448514938354492, 26.570472717285156, 29.692432403564453, 32.81439208984375, 35.93634796142578, 39.05830764770508, 42.180267333984375, 45.302223205566406, 48.4241828918457, 51.546142578125, 54.66809844970703, 57.79005813598633, 60.912017822265625, 64.03397369384766, 67.15592956542969, 70.27789306640625, 73.39984893798828, 76.52180480957031, 79.64376831054688, 82.7657241821289, 85.88768005371094, 89.0096435546875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 20.0, 15.0, 36.0, 64.0, 115.0, 185.0, 314.0, 572.0, 1275.0, 2944.0, 7417.0, 23731.0, 97618.0, 518671.0, 309803.0, 60109.0, 16073.0, 5306.0, 2155.0, 1025.0, 470.0, 262.0, 151.0, 81.0, 56.0, 22.0, 26.0, 11.0, 8.0, 3.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.7010498046875, -9.386474609375, -9.0718994140625, -8.75732421875, -8.4427490234375, -8.128173828125, -7.8135986328125, -7.4990234375, -7.1844482421875, -6.869873046875, -6.5552978515625, -6.24072265625, -5.9261474609375, -5.611572265625, -5.2969970703125, -4.982421875, -4.6678466796875, -4.353271484375, -4.0386962890625, -3.72412109375, -3.4095458984375, -3.094970703125, -2.7803955078125, -2.4658203125, -2.1512451171875, -1.836669921875, -1.5220947265625, -1.20751953125, -0.8929443359375, -0.578369140625, -0.2637939453125, 0.05078125, 0.3653564453125, 0.679931640625, 0.9945068359375, 1.30908203125, 1.6236572265625, 1.938232421875, 2.2528076171875, 2.5673828125, 2.8819580078125, 3.196533203125, 3.5111083984375, 3.82568359375, 4.1402587890625, 4.454833984375, 4.7694091796875, 5.083984375, 5.3985595703125, 5.713134765625, 6.0277099609375, 6.34228515625, 6.6568603515625, 6.971435546875, 7.2860107421875, 7.6005859375, 7.9151611328125, 8.229736328125, 8.5443115234375, 8.85888671875, 9.1734619140625, 9.488037109375, 9.8026123046875, 10.1171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 8.0, 19.0, 16.0, 20.0, 32.0, 22.0, 28.0, 47.0, 42.0, 48.0, 56.0, 48.0, 54.0, 52.0, 44.0, 54.0, 48.0, 50.0, 40.0, 38.0, 38.0, 36.0, 20.0, 32.0, 23.0, 20.0, 8.0, 11.0, 4.0, 5.0, 5.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.5528564453125, -4.363525390625, -4.1741943359375, -3.98486328125, -3.7955322265625, -3.606201171875, -3.4168701171875, -3.2275390625, -3.0382080078125, -2.848876953125, -2.6595458984375, -2.47021484375, -2.2808837890625, -2.091552734375, -1.9022216796875, -1.712890625, -1.5235595703125, -1.334228515625, -1.1448974609375, -0.95556640625, -0.7662353515625, -0.576904296875, -0.3875732421875, -0.1982421875, -0.0089111328125, 0.180419921875, 0.3697509765625, 0.55908203125, 0.7484130859375, 0.937744140625, 1.1270751953125, 1.31640625, 1.5057373046875, 1.695068359375, 1.8843994140625, 2.07373046875, 2.2630615234375, 2.452392578125, 2.6417236328125, 2.8310546875, 3.0203857421875, 3.209716796875, 3.3990478515625, 3.58837890625, 3.7777099609375, 3.967041015625, 4.1563720703125, 4.345703125, 4.5350341796875, 4.724365234375, 4.9136962890625, 5.10302734375, 5.2923583984375, 5.481689453125, 5.6710205078125, 5.8603515625, 6.0496826171875, 6.239013671875, 6.4283447265625, 6.61767578125, 6.8070068359375, 6.996337890625, 7.1856689453125, 7.375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 15.0, 17.0, 27.0, 51.0, 92.0, 153.0, 301.0, 697.0, 2612.0, 31794.0, 976215.0, 32624.0, 2625.0, 702.0, 258.0, 142.0, 93.0, 51.0, 20.0, 19.0, 9.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.64599609375, -13.9951171875, -13.34423828125, -12.693359375, -12.04248046875, -11.3916015625, -10.74072265625, -10.08984375, -9.43896484375, -8.7880859375, -8.13720703125, -7.486328125, -6.83544921875, -6.1845703125, -5.53369140625, -4.8828125, -4.23193359375, -3.5810546875, -2.93017578125, -2.279296875, -1.62841796875, -0.9775390625, -0.32666015625, 0.32421875, 0.97509765625, 1.6259765625, 2.27685546875, 2.927734375, 3.57861328125, 4.2294921875, 4.88037109375, 5.53125, 6.18212890625, 6.8330078125, 7.48388671875, 8.134765625, 8.78564453125, 9.4365234375, 10.08740234375, 10.73828125, 11.38916015625, 12.0400390625, 12.69091796875, 13.341796875, 13.99267578125, 14.6435546875, 15.29443359375, 15.9453125, 16.59619140625, 17.2470703125, 17.89794921875, 18.548828125, 19.19970703125, 19.8505859375, 20.50146484375, 21.15234375, 21.80322265625, 22.4541015625, 23.10498046875, 23.755859375, 24.40673828125, 25.0576171875, 25.70849609375, 26.359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 16.0, 18.0, 13.0, 27.0, 34.0, 25.0, 45.0, 56.0, 48.0, 78.0, 81.0, 84.0, 75.0, 64.0, 59.0, 53.0, 39.0, 32.0, 26.0, 15.0, 22.0, 8.0, 8.0, 12.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.6005859375, -22.826171875, -22.0517578125, -21.27734375, -20.5029296875, -19.728515625, -18.9541015625, -18.1796875, -17.4052734375, -16.630859375, -15.8564453125, -15.08203125, -14.3076171875, -13.533203125, -12.7587890625, -11.984375, -11.2099609375, -10.435546875, -9.6611328125, -8.88671875, -8.1123046875, -7.337890625, -6.5634765625, -5.7890625, -5.0146484375, -4.240234375, -3.4658203125, -2.69140625, -1.9169921875, -1.142578125, -0.3681640625, 0.40625, 1.1806640625, 1.955078125, 2.7294921875, 3.50390625, 4.2783203125, 5.052734375, 5.8271484375, 6.6015625, 7.3759765625, 8.150390625, 8.9248046875, 9.69921875, 10.4736328125, 11.248046875, 12.0224609375, 12.796875, 13.5712890625, 14.345703125, 15.1201171875, 15.89453125, 16.6689453125, 17.443359375, 18.2177734375, 18.9921875, 19.7666015625, 20.541015625, 21.3154296875, 22.08984375, 22.8642578125, 23.638671875, 24.4130859375, 25.1875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 8.0, 9.0, 31.0, 32.0, 39.0, 93.0, 164.0, 365.0, 1178.0, 4209.0, 43470.0, 975733.0, 18897.0, 2793.0, 807.0, 328.0, 163.0, 69.0, 44.0, 26.0, 18.0, 11.0, 8.0, 6.0, 12.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.798828125, -3.677703857421875, -3.55657958984375, -3.435455322265625, -3.3143310546875, -3.193206787109375, -3.07208251953125, -2.950958251953125, -2.829833984375, -2.708709716796875, -2.58758544921875, -2.466461181640625, -2.3453369140625, -2.224212646484375, -2.10308837890625, -1.981964111328125, -1.86083984375, -1.739715576171875, -1.61859130859375, -1.497467041015625, -1.3763427734375, -1.255218505859375, -1.13409423828125, -1.012969970703125, -0.891845703125, -0.770721435546875, -0.64959716796875, -0.528472900390625, -0.4073486328125, -0.286224365234375, -0.16510009765625, -0.043975830078125, 0.0771484375, 0.198272705078125, 0.31939697265625, 0.440521240234375, 0.5616455078125, 0.682769775390625, 0.80389404296875, 0.925018310546875, 1.046142578125, 1.167266845703125, 1.28839111328125, 1.409515380859375, 1.5306396484375, 1.651763916015625, 1.77288818359375, 1.894012451171875, 2.01513671875, 2.136260986328125, 2.25738525390625, 2.378509521484375, 2.4996337890625, 2.620758056640625, 2.74188232421875, 2.863006591796875, 2.984130859375, 3.105255126953125, 3.22637939453125, 3.347503662109375, 3.4686279296875, 3.589752197265625, 3.71087646484375, 3.832000732421875, 3.953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 9.0, 14.0, 20.0, 35.0, 55.0, 100.0, 214.0, 235.0, 126.0, 69.0, 35.0, 23.0, 19.0, 8.0, 2.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013141632080078125, -0.0012768208980560303, -0.001239478588104248, -0.0012021362781524658, -0.0011647939682006836, -0.0011274516582489014, -0.0010901093482971191, -0.001052767038345337, -0.0010154247283935547, -0.0009780824184417725, -0.0009407401084899902, -0.000903397798538208, -0.0008660554885864258, -0.0008287131786346436, -0.0007913708686828613, -0.0007540285587310791, -0.0007166862487792969, -0.0006793439388275146, -0.0006420016288757324, -0.0006046593189239502, -0.000567317008972168, -0.0005299746990203857, -0.0004926323890686035, -0.0004552900791168213, -0.00041794776916503906, -0.00038060545921325684, -0.0003432631492614746, -0.0003059208393096924, -0.00026857852935791016, -0.00023123621940612793, -0.0001938939094543457, -0.00015655159950256348, -0.00011920928955078125, -8.186697959899902e-05, -4.45246696472168e-05, -7.18235969543457e-06, 3.0159950256347656e-05, 6.750226020812988e-05, 0.00010484457015991211, 0.00014218688011169434, 0.00017952919006347656, 0.0002168715000152588, 0.000254213809967041, 0.00029155611991882324, 0.00032889842987060547, 0.0003662407398223877, 0.0004035830497741699, 0.00044092535972595215, 0.0004782676696777344, 0.0005156099796295166, 0.0005529522895812988, 0.0005902945995330811, 0.0006276369094848633, 0.0006649792194366455, 0.0007023215293884277, 0.00073966383934021, 0.0007770061492919922, 0.0008143484592437744, 0.0008516907691955566, 0.0008890330791473389, 0.0009263753890991211, 0.0009637176990509033, 0.0010010600090026855, 0.0010384023189544678, 0.00107574462890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 8.0, 7.0, 10.0, 10.0, 25.0, 37.0, 73.0, 117.0, 208.0, 348.0, 656.0, 1277.0, 2940.0, 8088.0, 35104.0, 828042.0, 145253.0, 17263.0, 5012.0, 1929.0, 974.0, 513.0, 259.0, 165.0, 86.0, 45.0, 35.0, 19.0, 13.0, 11.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.3984375, -2.32745361328125, -2.2564697265625, -2.18548583984375, -2.114501953125, -2.04351806640625, -1.9725341796875, -1.90155029296875, -1.83056640625, -1.75958251953125, -1.6885986328125, -1.61761474609375, -1.546630859375, -1.47564697265625, -1.4046630859375, -1.33367919921875, -1.2626953125, -1.19171142578125, -1.1207275390625, -1.04974365234375, -0.978759765625, -0.90777587890625, -0.8367919921875, -0.76580810546875, -0.69482421875, -0.62384033203125, -0.5528564453125, -0.48187255859375, -0.410888671875, -0.33990478515625, -0.2689208984375, -0.19793701171875, -0.126953125, -0.05596923828125, 0.0150146484375, 0.08599853515625, 0.156982421875, 0.22796630859375, 0.2989501953125, 0.36993408203125, 0.44091796875, 0.51190185546875, 0.5828857421875, 0.65386962890625, 0.724853515625, 0.79583740234375, 0.8668212890625, 0.93780517578125, 1.0087890625, 1.07977294921875, 1.1507568359375, 1.22174072265625, 1.292724609375, 1.36370849609375, 1.4346923828125, 1.50567626953125, 1.57666015625, 1.64764404296875, 1.7186279296875, 1.78961181640625, 1.860595703125, 1.93157958984375, 2.0025634765625, 2.07354736328125, 2.14453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 12.0, 15.0, 16.0, 15.0, 30.0, 43.0, 66.0, 80.0, 102.0, 121.0, 92.0, 100.0, 80.0, 59.0, 24.0, 19.0, 22.0, 15.0, 15.0, 2.0, 8.0, 5.0, 2.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.005859375, -1.9481201171875, -1.890380859375, -1.8326416015625, -1.77490234375, -1.7171630859375, -1.659423828125, -1.6016845703125, -1.5439453125, -1.4862060546875, -1.428466796875, -1.3707275390625, -1.31298828125, -1.2552490234375, -1.197509765625, -1.1397705078125, -1.08203125, -1.0242919921875, -0.966552734375, -0.9088134765625, -0.85107421875, -0.7933349609375, -0.735595703125, -0.6778564453125, -0.6201171875, -0.5623779296875, -0.504638671875, -0.4468994140625, -0.38916015625, -0.3314208984375, -0.273681640625, -0.2159423828125, -0.158203125, -0.1004638671875, -0.042724609375, 0.0150146484375, 0.07275390625, 0.1304931640625, 0.188232421875, 0.2459716796875, 0.3037109375, 0.3614501953125, 0.419189453125, 0.4769287109375, 0.53466796875, 0.5924072265625, 0.650146484375, 0.7078857421875, 0.765625, 0.8233642578125, 0.881103515625, 0.9388427734375, 0.99658203125, 1.0543212890625, 1.112060546875, 1.1697998046875, 1.2275390625, 1.2852783203125, 1.343017578125, 1.4007568359375, 1.45849609375, 1.5162353515625, 1.573974609375, 1.6317138671875, 1.689453125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 32.0, 127.0, 701.0, 105.0, 25.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.4772186279297, -197.0380401611328, -189.59886169433594, -182.15968322753906, -174.7205047607422, -167.2813262939453, -159.84214782714844, -152.40296936035156, -144.9637908935547, -137.5246124267578, -130.08543395996094, -122.64625549316406, -115.20707702636719, -107.76789855957031, -100.32872009277344, -92.88954162597656, -85.45036315917969, -78.01118469238281, -70.57200622558594, -63.13282775878906, -55.69364929199219, -48.25447082519531, -40.81529235839844, -33.37611389160156, -25.936935424804688, -18.497756958007812, -11.058578491210938, -3.6194000244140625, 3.8197784423828125, 11.258956909179688, 18.698135375976562, 26.137313842773438, 33.57647705078125, 41.015655517578125, 48.454833984375, 55.894012451171875, 63.33319091796875, 70.77236938476562, 78.2115478515625, 85.65072631835938, 93.08990478515625, 100.52908325195312, 107.96826171875, 115.40744018554688, 122.84661865234375, 130.28579711914062, 137.7249755859375, 145.16415405273438, 152.60333251953125, 160.04251098632812, 167.481689453125, 174.92086791992188, 182.36004638671875, 189.79922485351562, 197.2384033203125, 204.67758178710938, 212.11676025390625, 219.55593872070312, 226.9951171875, 234.43429565429688, 241.87347412109375, 249.31265258789062, 256.7518310546875, 264.1910095214844, 271.63018798828125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 10.0, 13.0, 10.0, 22.0, 28.0, 24.0, 30.0, 32.0, 59.0, 117.0, 299.0, 109.0, 36.0, 49.0, 23.0, 31.0, 12.0, 15.0, 19.0, 11.0, 10.0, 6.0, 2.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.204261779785156, -53.45351791381836, -50.7027702331543, -47.9520263671875, -45.2012825012207, -42.450538635253906, -39.699790954589844, -36.94904708862305, -34.19830322265625, -31.44755744934082, -28.696813583374023, -25.946067810058594, -23.195323944091797, -20.444578170776367, -17.693832397460938, -14.94308853149414, -12.192340850830078, -9.441596031188965, -6.690850734710693, -3.940105438232422, -1.1893606185913086, 1.5613842010498047, 4.312129974365234, 7.062873840332031, 9.813619613647461, 12.564364433288574, 15.315109252929688, 18.065855026245117, 20.816600799560547, 23.567344665527344, 26.318090438842773, 29.06883430480957, 31.819580078125, 34.5703239440918, 37.32107162475586, 40.071815490722656, 42.82255935668945, 45.57330322265625, 48.32405090332031, 51.07479476928711, 53.825538635253906, 56.5762825012207, 59.327030181884766, 62.07777404785156, 64.82852172851562, 67.57926177978516, 70.33000946044922, 73.08074951171875, 75.83149719238281, 78.58224487304688, 81.3329849243164, 84.08373260498047, 86.83448028564453, 89.58522033691406, 92.33596801757812, 95.08671569824219, 97.83746337890625, 100.58821105957031, 103.33895111083984, 106.0896987915039, 108.84044647216797, 111.5911865234375, 114.34193420410156, 117.09268188476562, 119.84342193603516]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 22.0, 38.0, 50.0, 56.0, 73.0, 390.0, 148.0, 77.0, 49.0, 26.0, 24.0, 14.0, 11.0, 9.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -5.841552734375, -5.38623046875, -4.930908203125, -4.4755859375, -4.020263671875, -3.56494140625, -3.109619140625, -2.654296875, -2.198974609375, -1.74365234375, -1.288330078125, -0.8330078125, -0.377685546875, 0.07763671875, 0.532958984375, 0.98828125, 1.443603515625, 1.89892578125, 2.354248046875, 2.8095703125, 3.264892578125, 3.72021484375, 4.175537109375, 4.630859375, 5.086181640625, 5.54150390625, 5.996826171875, 6.4521484375, 6.907470703125, 7.36279296875, 7.818115234375, 8.2734375, 8.728759765625, 9.18408203125, 9.639404296875, 10.0947265625, 10.550048828125, 11.00537109375, 11.460693359375, 11.916015625, 12.371337890625, 12.82666015625, 13.281982421875, 13.7373046875, 14.192626953125, 14.64794921875, 15.103271484375, 15.55859375, 16.013916015625, 16.46923828125, 16.924560546875, 17.3798828125, 17.835205078125, 18.29052734375, 18.745849609375, 19.201171875, 19.656494140625, 20.11181640625, 20.567138671875, 21.0224609375, 21.477783203125, 21.93310546875, 22.388427734375, 22.84375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 7.0, 7.0, 10.0, 19.0, 12.0, 12.0, 23.0, 31.0, 66.0, 85.0, 141.0, 260.0, 472.0, 1196.0, 3937.0, 26785.0, 8332886.0, 17267.0, 3247.0, 1051.0, 476.0, 221.0, 117.0, 68.0, 38.0, 36.0, 28.0, 23.0, 5.0, 10.0, 8.0, 4.0, 3.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.35891723632812, -72.37186431884766, -70.38480377197266, -68.39775085449219, -66.41069793701172, -64.42364501953125, -62.436588287353516, -60.44953155517578, -58.46247863769531, -56.47542190551758, -54.48836898803711, -52.501312255859375, -50.514259338378906, -48.52720260620117, -46.5401496887207, -44.55309295654297, -42.5660400390625, -40.578983306884766, -38.5919303894043, -36.60487365722656, -34.617820739746094, -32.63076400756836, -30.64371109008789, -28.656654357910156, -26.669597625732422, -24.68254280090332, -22.69548797607422, -20.708433151245117, -18.721378326416016, -16.73432159423828, -14.747267723083496, -12.760212898254395, -10.77315902709961, -8.786104202270508, -6.799049377441406, -4.8119940757751465, -2.824939250946045, -0.8378839492797852, 1.1491708755493164, 3.136225700378418, 5.1232805252075195, 7.110335350036621, 9.097390174865723, 11.08444595336914, 13.071500778198242, 15.058555603027344, 17.045610427856445, 19.032665252685547, 21.01972007751465, 23.00677490234375, 24.99382972717285, 26.980884552001953, 28.967939376831055, 30.954994201660156, 32.94205093383789, 34.92910385131836, 36.916160583496094, 38.90321731567383, 40.8902702331543, 42.87732696533203, 44.8643798828125, 46.851436614990234, 48.8384895324707, 50.82554626464844, 52.812599182128906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 7.0, 2.0, 12.0, 6.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.6932601928711, -101.4347915649414, -98.17632293701172, -94.9178466796875, -91.65937805175781, -88.40090942382812, -85.14244079589844, -81.88397216796875, -78.62550354003906, -75.36703491210938, -72.10856628417969, -68.85009765625, -65.59162139892578, -62.333152770996094, -59.074684143066406, -55.81621551513672, -52.5577392578125, -49.29927062988281, -46.04079818725586, -42.78232955932617, -39.52385711669922, -36.26538848876953, -33.006919860839844, -29.748449325561523, -26.489978790283203, -23.231508255004883, -19.973037719726562, -16.714569091796875, -13.456098556518555, -10.197628021240234, -6.939159393310547, -3.6806888580322266, -0.42221832275390625, 2.836251735687256, 6.094721794128418, 9.353191375732422, 12.611661911010742, 15.870132446289062, 19.12860107421875, 22.38707160949707, 25.64554214477539, 28.90401268005371, 32.16248321533203, 35.42095184326172, 38.679420471191406, 41.93789291381836, 45.19636154174805, 48.454833984375, 51.71330261230469, 54.971771240234375, 58.23024368286133, 61.488712310791016, 64.74718475341797, 68.00565338134766, 71.26412200927734, 74.52259063720703, 77.78106689453125, 81.03953552246094, 84.29800415039062, 87.55647277832031, 90.81494903564453, 94.07341766357422, 97.3318862915039, 100.5903549194336, 103.84882354736328]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 14.0, 14.0, 12.0, 25.0, 23.0, 30.0, 51.0, 61.0, 100.0, 157.0, 247.0, 389.0, 687.0, 1285.0, 2881.0, 6931.0, 20415.0, 70636.0, 216126.0, 142807.0, 40175.0, 12340.0, 4569.0, 2020.0, 951.0, 511.0, 298.0, 170.0, 108.0, 74.0, 47.0, 27.0, 23.0, 13.0, 8.0, 10.0, 5.0, 3.0, 2.0], "bins": [-84.125, -82.203125, -80.28125, -78.359375, -76.4375, -74.515625, -72.59375, -70.671875, -68.75, -66.828125, -64.90625, -62.984375, -61.0625, -59.140625, -57.21875, -55.296875, -53.375, -51.453125, -49.53125, -47.609375, -45.6875, -43.765625, -41.84375, -39.921875, -38.0, -36.078125, -34.15625, -32.234375, -30.3125, -28.390625, -26.46875, -24.546875, -22.625, -20.703125, -18.78125, -16.859375, -14.9375, -13.015625, -11.09375, -9.171875, -7.25, -5.328125, -3.40625, -1.484375, 0.4375, 2.359375, 4.28125, 6.203125, 8.125, 10.046875, 11.96875, 13.890625, 15.8125, 17.734375, 19.65625, 21.578125, 23.5, 25.421875, 27.34375, 29.265625, 31.1875, 33.109375, 35.03125, 36.953125, 38.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 13.0, 14.0, 22.0, 26.0, 45.0, 59.0, 72.0, 101.0, 112.0, 110.0, 110.0, 113.0, 72.0, 41.0, 47.0, 19.0, 15.0, 5.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -16.0570068359375, -15.676513671875, -15.2960205078125, -14.91552734375, -14.5350341796875, -14.154541015625, -13.7740478515625, -13.3935546875, -13.0130615234375, -12.632568359375, -12.2520751953125, -11.87158203125, -11.4910888671875, -11.110595703125, -10.7301025390625, -10.349609375, -9.9691162109375, -9.588623046875, -9.2081298828125, -8.82763671875, -8.4471435546875, -8.066650390625, -7.6861572265625, -7.3056640625, -6.9251708984375, -6.544677734375, -6.1641845703125, -5.78369140625, -5.4031982421875, -5.022705078125, -4.6422119140625, -4.26171875, -3.8812255859375, -3.500732421875, -3.1202392578125, -2.73974609375, -2.3592529296875, -1.978759765625, -1.5982666015625, -1.2177734375, -0.8372802734375, -0.456787109375, -0.0762939453125, 0.30419921875, 0.6846923828125, 1.065185546875, 1.4456787109375, 1.826171875, 2.2066650390625, 2.587158203125, 2.9676513671875, 3.34814453125, 3.7286376953125, 4.109130859375, 4.4896240234375, 4.8701171875, 5.2506103515625, 5.631103515625, 6.0115966796875, 6.39208984375, 6.7725830078125, 7.153076171875, 7.5335693359375, 7.9140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 14.0, 13.0, 20.0, 18.0, 38.0, 55.0, 78.0, 77.0, 54.0, 35.0, 14.0, 13.0, 16.0, 7.0, 4.0, 1.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.44195556640625, -64.41422271728516, -62.3864860534668, -60.3587532043457, -58.33102035522461, -56.30328369140625, -54.275550842285156, -52.24781799316406, -50.22008514404297, -48.192352294921875, -46.164615631103516, -44.13688278198242, -42.10914993286133, -40.08141326904297, -38.053680419921875, -36.02594757080078, -33.99821090698242, -31.970476150512695, -29.9427433013916, -27.915008544921875, -25.88727569580078, -23.859540939331055, -21.831806182861328, -19.804073333740234, -17.776338577270508, -15.748604774475098, -13.720870971679688, -11.693136215209961, -9.66540241241455, -7.637668609619141, -5.609933853149414, -3.582200050354004, -1.5544700622558594, 0.4732639789581299, 2.500998020172119, 4.5287322998046875, 6.556466102600098, 8.584199905395508, 10.611934661865234, 12.639668464660645, 14.667402267456055, 16.69513702392578, 18.722869873046875, 20.7506046295166, 22.778339385986328, 24.806072235107422, 26.83380699157715, 28.861541748046875, 30.88927459716797, 32.91700744628906, 34.94474411010742, 36.972476959228516, 39.00020980834961, 41.02794647216797, 43.05567932128906, 45.083412170410156, 47.11114501953125, 49.138877868652344, 51.1666145324707, 53.1943473815918, 55.22208023071289, 57.24981689453125, 59.277549743652344, 61.30528259277344, 63.3330192565918]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 14.0, 15.0, 25.0, 34.0, 39.0, 54.0, 60.0, 75.0, 54.0, 34.0, 17.0, 13.0, 5.0, 5.0, 1.0, 4.0, 0.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.305160522460938, -28.190046310424805, -27.074932098388672, -25.959819793701172, -24.84470558166504, -23.729591369628906, -22.614479064941406, -21.499364852905273, -20.38425064086914, -19.269136428833008, -18.154022216796875, -17.038909912109375, -15.923795700073242, -14.80868148803711, -13.693568229675293, -12.578454971313477, -11.463340759277344, -10.348226547241211, -9.233113288879395, -8.118000030517578, -7.002885818481445, -5.887772083282471, -4.772658348083496, -3.6575446128845215, -2.542430877685547, -1.4273171424865723, -0.31220340728759766, 0.802910327911377, 1.9180240631103516, 3.033137798309326, 4.148251533508301, 5.263365268707275, 6.378482818603516, 7.49359655380249, 8.608710289001465, 9.723823547363281, 10.838937759399414, 11.954051971435547, 13.069165229797363, 14.18427848815918, 15.299392700195312, 16.414506912231445, 17.529621124267578, 18.644733428955078, 19.75984764099121, 20.874961853027344, 21.990074157714844, 23.105188369750977, 24.22030258178711, 25.335416793823242, 26.450531005859375, 27.565643310546875, 28.680757522583008, 29.79587173461914, 30.91098403930664, 32.026100158691406, 33.141212463378906, 34.256324768066406, 35.37144088745117, 36.48655319213867, 37.60166931152344, 38.71678161621094, 39.83189392089844, 40.9470100402832, 42.0621223449707]}, "eval/loss": 0.8383785486221313, "eval/wer": 0.1366748020715519, "eval/runtime": 1219.9567, "eval/samples_per_second": 2.166, "eval/steps_per_second": 0.271, "train/train_runtime": 122857.9097, "train/train_samples_per_second": 4.646, "train/train_steps_per_second": 0.145, "train/total_flos": 0.0, "train/train_loss": 2.2609593777487165} \ No newline at end of file +{"train/loss": 0.2499, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 124597, "_timestamp": 1647498874, "_step": 17852, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 14.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 5.0, 4.0, 9.0, 18.0, 29525.0, 875.0, 16.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-172.125, -168.603515625, -165.08203125, -161.560546875, -158.0390625, -154.517578125, -150.99609375, -147.474609375, -143.953125, -140.431640625, -136.91015625, -133.388671875, -129.8671875, -126.345703125, -122.82421875, -119.302734375, -115.78125, -112.259765625, -108.73828125, -105.216796875, -101.6953125, -98.173828125, -94.65234375, -91.130859375, -87.609375, -84.087890625, -80.56640625, -77.044921875, -73.5234375, -70.001953125, -66.48046875, -62.958984375, -59.4375, -55.916015625, -52.39453125, -48.873046875, -45.3515625, -41.830078125, -38.30859375, -34.787109375, -31.265625, -27.744140625, -24.22265625, -20.701171875, -17.1796875, -13.658203125, -10.13671875, -6.615234375, -3.09375, 0.427734375, 3.94921875, 7.470703125, 10.9921875, 14.513671875, 18.03515625, 21.556640625, 25.078125, 28.599609375, 32.12109375, 35.642578125, 39.1640625, 42.685546875, 46.20703125, 49.728515625, 53.25]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 3.0, 3.0, 6.0, 8.0, 6.0, 5.0, 13.0, 13.0, 17.0, 19.0, 24.0, 24.0, 22.0, 21.0, 35.0, 37.0, 47.0, 27.0, 39.0, 42.0, 41.0, 58.0, 41.0, 38.0, 43.0, 42.0, 39.0, 39.0, 38.0, 29.0, 20.0, 24.0, 26.0, 15.0, 15.0, 13.0, 6.0, 10.0, 10.0, 4.0, 7.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-37.44131088256836, -36.594993591308594, -35.74867630004883, -34.90236282348633, -34.05604553222656, -33.2097282409668, -32.36341094970703, -31.5170955657959, -30.670780181884766, -29.824462890625, -28.978147506713867, -28.1318302154541, -27.28551483154297, -26.439197540283203, -25.592880249023438, -24.746564865112305, -23.90024757385254, -23.053930282592773, -22.20761489868164, -21.361297607421875, -20.514982223510742, -19.668664932250977, -18.822349548339844, -17.976032257080078, -17.129714965820312, -16.283397674560547, -15.437082290649414, -14.590764999389648, -13.744449615478516, -12.89813232421875, -12.0518159866333, -11.205499649047852, -10.359186172485352, -9.512869834899902, -8.666553497314453, -7.820236682891846, -6.9739203453063965, -6.127604007720947, -5.28128719329834, -4.434970855712891, -3.5886545181274414, -2.742338180541992, -1.8960216045379639, -1.0497050285339355, -0.20338869094848633, 0.6429276466369629, 1.4892444610595703, 2.3355607986450195, 3.1818771362304688, 4.028193473815918, 4.874509811401367, 5.720826625823975, 6.567142963409424, 7.413459300994873, 8.25977611541748, 9.10609245300293, 9.952408790588379, 10.798725128173828, 11.645041465759277, 12.491357803344727, 13.337675094604492, 14.183990478515625, 15.03030776977539, 15.87662410736084, 16.72294044494629]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 8.0, 6.0, 9.0, 6.0, 11.0, 9.0, 17.0, 14.0, 31.0, 26.0, 29.0, 23.0, 36.0, 51.0, 43.0, 34.0, 44.0, 50.0, 42.0, 32.0, 52.0, 35.0, 40.0, 48.0, 33.0, 29.0, 20.0, 31.0, 30.0, 16.0, 24.0, 27.0, 13.0, 17.0, 17.0, 10.0, 9.0, 4.0, 4.0, 8.0, 8.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.865875244140625, -26.000263214111328, -25.13465118408203, -24.269039154052734, -23.403425216674805, -22.537813186645508, -21.67220115661621, -20.806589126586914, -19.940975189208984, -19.075363159179688, -18.20975112915039, -17.344139099121094, -16.478525161743164, -15.612913131713867, -14.74730110168457, -13.881689071655273, -13.016077041625977, -12.15046501159668, -11.284852027893066, -10.41923999786377, -9.553627014160156, -8.68801498413086, -7.8224029541015625, -6.956790447235107, -6.091177940368652, -5.225565433502197, -4.359952926635742, -3.4943408966064453, -2.6287283897399902, -1.7631158828735352, -0.8975038528442383, -0.0318913459777832, 0.8337230682373047, 1.6993354558944702, 2.5649478435516357, 3.4305601119995117, 4.296172618865967, 5.161785125732422, 6.027397155761719, 6.893009662628174, 7.758622169494629, 8.624234199523926, 9.489847183227539, 10.355459213256836, 11.221071243286133, 12.086684226989746, 12.952296257019043, 13.817909240722656, 14.683521270751953, 15.54913330078125, 16.414745330810547, 17.280357360839844, 18.145971298217773, 19.01158332824707, 19.877195358276367, 20.742807388305664, 21.608421325683594, 22.47403335571289, 23.339645385742188, 24.205257415771484, 25.070871353149414, 25.93648338317871, 26.802095413208008, 27.667707443237305, 28.5333194732666]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 13.0, 11.0, 18.0, 35.0, 61.0, 87.0, 144.0, 236.0, 381.0, 558.0, 930.0, 1512.0, 2314.0, 3589.0, 5697.0, 8750.0, 12940.0, 19432.0, 27520.0, 38987.0, 51489.0, 67133.0, 81702.0, 94353.0, 120262.0, 107531.0, 91995.0, 79255.0, 64688.0, 50098.0, 37011.0, 26422.0, 18287.0, 12305.0, 8119.0, 5403.0, 3480.0, 2149.0, 1360.0, 858.0, 533.0, 316.0, 200.0, 140.0, 90.0, 56.0, 41.0, 28.0, 18.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.25, -85.396484375, -82.54296875, -79.689453125, -76.8359375, -73.982421875, -71.12890625, -68.275390625, -65.421875, -62.568359375, -59.71484375, -56.861328125, -54.0078125, -51.154296875, -48.30078125, -45.447265625, -42.59375, -39.740234375, -36.88671875, -34.033203125, -31.1796875, -28.326171875, -25.47265625, -22.619140625, -19.765625, -16.912109375, -14.05859375, -11.205078125, -8.3515625, -5.498046875, -2.64453125, 0.208984375, 3.0625, 5.916015625, 8.76953125, 11.623046875, 14.4765625, 17.330078125, 20.18359375, 23.037109375, 25.890625, 28.744140625, 31.59765625, 34.451171875, 37.3046875, 40.158203125, 43.01171875, 45.865234375, 48.71875, 51.572265625, 54.42578125, 57.279296875, 60.1328125, 62.986328125, 65.83984375, 68.693359375, 71.546875, 74.400390625, 77.25390625, 80.107421875, 82.9609375, 85.814453125, 88.66796875, 91.521484375, 94.375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 11.0, 6.0, 13.0, 20.0, 24.0, 14.0, 25.0, 33.0, 35.0, 52.0, 42.0, 43.0, 50.0, 43.0, 73.0, 84.0, 53.0, 57.0, 36.0, 45.0, 46.0, 32.0, 39.0, 16.0, 15.0, 17.0, 18.0, 13.0, 9.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5, -52.84619140625, -51.1923828125, -49.53857421875, -47.884765625, -46.23095703125, -44.5771484375, -42.92333984375, -41.26953125, -39.61572265625, -37.9619140625, -36.30810546875, -34.654296875, -33.00048828125, -31.3466796875, -29.69287109375, -28.0390625, -26.38525390625, -24.7314453125, -23.07763671875, -21.423828125, -19.77001953125, -18.1162109375, -16.46240234375, -14.80859375, -13.15478515625, -11.5009765625, -9.84716796875, -8.193359375, -6.53955078125, -4.8857421875, -3.23193359375, -1.578125, 0.07568359375, 1.7294921875, 3.38330078125, 5.037109375, 6.69091796875, 8.3447265625, 9.99853515625, 11.65234375, 13.30615234375, 14.9599609375, 16.61376953125, 18.267578125, 19.92138671875, 21.5751953125, 23.22900390625, 24.8828125, 26.53662109375, 28.1904296875, 29.84423828125, 31.498046875, 33.15185546875, 34.8056640625, 36.45947265625, 38.11328125, 39.76708984375, 41.4208984375, 43.07470703125, 44.728515625, 46.38232421875, 48.0361328125, 49.68994140625, 51.34375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 12.0, 5.0, 7.0, 4.0, 18.0, 19.0, 24.0, 31.0, 37.0, 40.0, 42.0, 53.0, 33.0, 37.0, 45.0, 41.0, 56.0, 48.0, 60.0, 46.0, 43.0, 32.0, 37.0, 29.0, 25.0, 29.0, 25.0, 17.0, 12.0, 21.0, 17.0, 12.0, 5.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.385425567626953, -25.43740463256836, -24.489383697509766, -23.541362762451172, -22.59334373474121, -21.645322799682617, -20.697301864624023, -19.74928092956543, -18.80126190185547, -17.853240966796875, -16.90522003173828, -15.957200050354004, -15.009180068969727, -14.061159133911133, -13.113138198852539, -12.165117263793945, -11.217096328735352, -10.269075393676758, -9.32105541229248, -8.373034477233887, -7.425014019012451, -6.476993560791016, -5.528972625732422, -4.580952167510986, -3.632931709289551, -2.6849112510681152, -1.7368905544281006, -0.7888698577880859, 0.1591506004333496, 1.1071710586547852, 2.055191993713379, 3.0032124519348145, 3.95123291015625, 4.8992533683776855, 5.847273826599121, 6.795294761657715, 7.74331521987915, 8.691335678100586, 9.63935661315918, 10.587377548217773, 11.53539752960205, 12.483418464660645, 13.431438446044922, 14.379459381103516, 15.32748031616211, 16.275501251220703, 17.223522186279297, 18.171541213989258, 19.11956214904785, 20.067583084106445, 21.01560401916504, 21.963623046875, 22.911643981933594, 23.859664916992188, 24.80768585205078, 25.755706787109375, 26.70372772216797, 27.651748657226562, 28.599769592285156, 29.54779052734375, 30.49580955505371, 31.443830490112305, 32.39185333251953, 33.33987045288086, 34.28789138793945]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 8.0, 10.0, 13.0, 15.0, 18.0, 18.0, 13.0, 19.0, 24.0, 17.0, 28.0, 28.0, 27.0, 33.0, 37.0, 38.0, 38.0, 34.0, 37.0, 29.0, 32.0, 34.0, 50.0, 35.0, 29.0, 39.0, 29.0, 23.0, 26.0, 23.0, 22.0, 25.0, 22.0, 16.0, 13.0, 16.0, 13.0, 13.0, 7.0, 3.0, 11.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.41060447692871, -23.645917892456055, -22.881229400634766, -22.11654281616211, -21.351856231689453, -20.587169647216797, -19.822481155395508, -19.05779457092285, -18.293106079101562, -17.528419494628906, -16.763731002807617, -15.999044418334961, -15.234357833862305, -14.469670295715332, -13.70498275756836, -12.940296173095703, -12.175609588623047, -11.410922050476074, -10.646235466003418, -9.881547927856445, -9.116861343383789, -8.352173805236816, -7.587486267089844, -6.822799205780029, -6.058112144470215, -5.2934250831604, -4.528738021850586, -3.7640504837036133, -2.999363422393799, -2.2346763610839844, -1.4699888229370117, -0.7053017616271973, 0.059383392333984375, 0.8240705728530884, 1.5887577533721924, 2.353445053100586, 3.1181321144104004, 3.882819175720215, 4.6475067138671875, 5.412193775177002, 6.176880836486816, 6.941567897796631, 7.706254959106445, 8.470942497253418, 9.23563003540039, 10.000316619873047, 10.76500415802002, 11.529691696166992, 12.294378280639648, 13.059065818786621, 13.823752403259277, 14.58843994140625, 15.353126525878906, 16.117813110351562, 16.88250160217285, 17.647188186645508, 18.411876678466797, 19.176563262939453, 19.941251754760742, 20.7059383392334, 21.470624923706055, 22.235313415527344, 23.0, 23.764686584472656, 24.529373168945312]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 3.0, 8.0, 18.0, 32.0, 34.0, 52.0, 100.0, 157.0, 221.0, 375.0, 630.0, 1037.0, 1504.0, 2432.0, 3798.0, 5961.0, 9766.0, 15600.0, 24875.0, 39892.0, 65460.0, 105003.0, 171497.0, 273961.0, 430752.0, 634959.0, 751476.0, 601193.0, 398115.0, 250380.0, 154641.0, 95080.0, 58549.0, 35874.0, 22552.0, 13783.0, 8724.0, 5604.0, 3651.0, 2317.0, 1469.0, 901.0, 638.0, 386.0, 280.0, 207.0, 125.0, 71.0, 59.0, 37.0, 16.0, 16.0, 6.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-41.5, -40.1357421875, -38.771484375, -37.4072265625, -36.04296875, -34.6787109375, -33.314453125, -31.9501953125, -30.5859375, -29.2216796875, -27.857421875, -26.4931640625, -25.12890625, -23.7646484375, -22.400390625, -21.0361328125, -19.671875, -18.3076171875, -16.943359375, -15.5791015625, -14.21484375, -12.8505859375, -11.486328125, -10.1220703125, -8.7578125, -7.3935546875, -6.029296875, -4.6650390625, -3.30078125, -1.9365234375, -0.572265625, 0.7919921875, 2.15625, 3.5205078125, 4.884765625, 6.2490234375, 7.61328125, 8.9775390625, 10.341796875, 11.7060546875, 13.0703125, 14.4345703125, 15.798828125, 17.1630859375, 18.52734375, 19.8916015625, 21.255859375, 22.6201171875, 23.984375, 25.3486328125, 26.712890625, 28.0771484375, 29.44140625, 30.8056640625, 32.169921875, 33.5341796875, 34.8984375, 36.2626953125, 37.626953125, 38.9912109375, 40.35546875, 41.7197265625, 43.083984375, 44.4482421875, 45.8125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 12.0, 10.0, 22.0, 13.0, 16.0, 19.0, 23.0, 22.0, 19.0, 30.0, 23.0, 24.0, 40.0, 30.0, 45.0, 34.0, 31.0, 31.0, 27.0, 42.0, 40.0, 39.0, 26.0, 39.0, 27.0, 32.0, 27.0, 14.0, 31.0, 22.0, 26.0, 12.0, 21.0, 16.0, 16.0, 12.0, 18.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.96875, -20.309326171875, -19.64990234375, -18.990478515625, -18.3310546875, -17.671630859375, -17.01220703125, -16.352783203125, -15.693359375, -15.033935546875, -14.37451171875, -13.715087890625, -13.0556640625, -12.396240234375, -11.73681640625, -11.077392578125, -10.41796875, -9.758544921875, -9.09912109375, -8.439697265625, -7.7802734375, -7.120849609375, -6.46142578125, -5.802001953125, -5.142578125, -4.483154296875, -3.82373046875, -3.164306640625, -2.5048828125, -1.845458984375, -1.18603515625, -0.526611328125, 0.1328125, 0.792236328125, 1.45166015625, 2.111083984375, 2.7705078125, 3.429931640625, 4.08935546875, 4.748779296875, 5.408203125, 6.067626953125, 6.72705078125, 7.386474609375, 8.0458984375, 8.705322265625, 9.36474609375, 10.024169921875, 10.68359375, 11.343017578125, 12.00244140625, 12.661865234375, 13.3212890625, 13.980712890625, 14.64013671875, 15.299560546875, 15.958984375, 16.618408203125, 17.27783203125, 17.937255859375, 18.5966796875, 19.256103515625, 19.91552734375, 20.574951171875, 21.234375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 11.0, 13.0, 5.0, 29.0, 44.0, 67.0, 103.0, 168.0, 251.0, 365.0, 604.0, 976.0, 1532.0, 2343.0, 3750.0, 5927.0, 9563.0, 14926.0, 23821.0, 37469.0, 59351.0, 92981.0, 144844.0, 219601.0, 324507.0, 455309.0, 581203.0, 610101.0, 505410.0, 370667.0, 255806.0, 169993.0, 110137.0, 70691.0, 45003.0, 28529.0, 17916.0, 11100.0, 7026.0, 4359.0, 2848.0, 1764.0, 1187.0, 706.0, 465.0, 323.0, 183.0, 115.0, 74.0, 50.0, 25.0, 18.0, 14.0, 14.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-27.90625, -27.039306640625, -26.17236328125, -25.305419921875, -24.4384765625, -23.571533203125, -22.70458984375, -21.837646484375, -20.970703125, -20.103759765625, -19.23681640625, -18.369873046875, -17.5029296875, -16.635986328125, -15.76904296875, -14.902099609375, -14.03515625, -13.168212890625, -12.30126953125, -11.434326171875, -10.5673828125, -9.700439453125, -8.83349609375, -7.966552734375, -7.099609375, -6.232666015625, -5.36572265625, -4.498779296875, -3.6318359375, -2.764892578125, -1.89794921875, -1.031005859375, -0.1640625, 0.702880859375, 1.56982421875, 2.436767578125, 3.3037109375, 4.170654296875, 5.03759765625, 5.904541015625, 6.771484375, 7.638427734375, 8.50537109375, 9.372314453125, 10.2392578125, 11.106201171875, 11.97314453125, 12.840087890625, 13.70703125, 14.573974609375, 15.44091796875, 16.307861328125, 17.1748046875, 18.041748046875, 18.90869140625, 19.775634765625, 20.642578125, 21.509521484375, 22.37646484375, 23.243408203125, 24.1103515625, 24.977294921875, 25.84423828125, 26.711181640625, 27.578125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 9.0, 10.0, 17.0, 17.0, 27.0, 30.0, 41.0, 40.0, 49.0, 75.0, 94.0, 122.0, 135.0, 163.0, 175.0, 177.0, 235.0, 248.0, 258.0, 237.0, 241.0, 216.0, 218.0, 181.0, 191.0, 135.0, 127.0, 99.0, 92.0, 64.0, 71.0, 49.0, 40.0, 40.0, 27.0, 22.0, 16.0, 26.0, 15.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.9765625, -11.58203125, -11.1875, -10.79296875, -10.3984375, -10.00390625, -9.609375, -9.21484375, -8.8203125, -8.42578125, -8.03125, -7.63671875, -7.2421875, -6.84765625, -6.453125, -6.05859375, -5.6640625, -5.26953125, -4.875, -4.48046875, -4.0859375, -3.69140625, -3.296875, -2.90234375, -2.5078125, -2.11328125, -1.71875, -1.32421875, -0.9296875, -0.53515625, -0.140625, 0.25390625, 0.6484375, 1.04296875, 1.4375, 1.83203125, 2.2265625, 2.62109375, 3.015625, 3.41015625, 3.8046875, 4.19921875, 4.59375, 4.98828125, 5.3828125, 5.77734375, 6.171875, 6.56640625, 6.9609375, 7.35546875, 7.75, 8.14453125, 8.5390625, 8.93359375, 9.328125, 9.72265625, 10.1171875, 10.51171875, 10.90625, 11.30078125, 11.6953125, 12.08984375, 12.484375, 12.87890625, 13.2734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 18.0, 21.0, 17.0, 31.0, 19.0, 31.0, 17.0, 35.0, 53.0, 36.0, 50.0, 47.0, 61.0, 61.0, 54.0, 60.0, 58.0, 47.0, 56.0, 32.0, 30.0, 31.0, 27.0, 18.0, 13.0, 15.0, 16.0, 11.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.50990104675293, -29.452804565429688, -28.395709991455078, -27.338613510131836, -26.281517028808594, -25.224422454833984, -24.167325973510742, -23.1102294921875, -22.05313491821289, -20.99603843688965, -19.93894386291504, -18.881847381591797, -17.824750900268555, -16.767654418945312, -15.710559844970703, -14.653463363647461, -13.596366882324219, -12.539271354675293, -11.48217487335205, -10.425079345703125, -9.367982864379883, -8.310887336730957, -7.253791809082031, -6.196695804595947, -5.139599800109863, -4.082503795623779, -3.0254080295562744, -1.9683122634887695, -0.9112162590026855, 0.14587974548339844, 1.2029752731323242, 2.260071277618408, 3.317169189453125, 4.374265193939209, 5.431361198425293, 6.488456726074219, 7.545552730560303, 8.602648735046387, 9.659744262695312, 10.716840744018555, 11.77393627166748, 12.831031799316406, 13.888128280639648, 14.945223808288574, 16.0023193359375, 17.059415817260742, 18.116512298583984, 19.173606872558594, 20.230703353881836, 21.287799835205078, 22.344894409179688, 23.40199089050293, 24.459087371826172, 25.51618194580078, 26.573278427124023, 27.630374908447266, 28.687469482421875, 29.744565963745117, 30.801660537719727, 31.85875701904297, 32.91585159301758, 33.97294998168945, 35.03004455566406, 36.08713912963867, 37.14423751831055]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 13.0, 7.0, 18.0, 20.0, 21.0, 21.0, 28.0, 26.0, 34.0, 36.0, 38.0, 40.0, 37.0, 38.0, 36.0, 39.0, 50.0, 46.0, 43.0, 31.0, 37.0, 35.0, 25.0, 25.0, 32.0, 29.0, 25.0, 31.0, 19.0, 22.0, 8.0, 17.0, 11.0, 7.0, 11.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.82933235168457, -25.998638153076172, -25.16794204711914, -24.337247848510742, -23.50655174255371, -22.675857543945312, -21.84516143798828, -21.014467239379883, -20.183773040771484, -19.353078842163086, -18.522382736206055, -17.691688537597656, -16.860992431640625, -16.030298233032227, -15.199603080749512, -14.368907928466797, -13.538211822509766, -12.70751667022705, -11.876821517944336, -11.046127319335938, -10.215431213378906, -9.384737014770508, -8.554041862487793, -7.723346710205078, -6.892651557922363, -6.061956405639648, -5.231261253356934, -4.400566577911377, -3.569871425628662, -2.7391762733459473, -1.9084815979003906, -1.0777864456176758, -0.24708938598632812, 0.5836056470870972, 1.4143006801605225, 2.244995594024658, 3.075690746307373, 3.906385898590088, 4.7370805740356445, 5.567775726318359, 6.398470878601074, 7.229166030883789, 8.059861183166504, 8.890556335449219, 9.721250534057617, 10.551946640014648, 11.382640838623047, 12.213335990905762, 13.044031143188477, 13.874726295471191, 14.705421447753906, 15.536115646362305, 16.366811752319336, 17.197505950927734, 18.028202056884766, 18.858896255493164, 19.689590454101562, 20.52028465270996, 21.350980758666992, 22.18167495727539, 23.012371063232422, 23.84306526184082, 24.67375946044922, 25.50445556640625, 26.33515167236328]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 17.0, 19.0, 31.0, 43.0, 77.0, 87.0, 147.0, 224.0, 339.0, 516.0, 854.0, 1359.0, 1890.0, 3049.0, 4505.0, 6896.0, 10347.0, 15084.0, 22622.0, 33123.0, 47921.0, 67835.0, 91363.0, 115509.0, 131494.0, 125950.0, 105654.0, 79613.0, 57718.0, 40394.0, 27504.0, 18776.0, 12876.0, 8414.0, 5651.0, 3673.0, 2466.0, 1545.0, 1020.0, 697.0, 445.0, 323.0, 165.0, 103.0, 83.0, 52.0, 31.0, 23.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-14.734375, -14.28466796875, -13.8349609375, -13.38525390625, -12.935546875, -12.48583984375, -12.0361328125, -11.58642578125, -11.13671875, -10.68701171875, -10.2373046875, -9.78759765625, -9.337890625, -8.88818359375, -8.4384765625, -7.98876953125, -7.5390625, -7.08935546875, -6.6396484375, -6.18994140625, -5.740234375, -5.29052734375, -4.8408203125, -4.39111328125, -3.94140625, -3.49169921875, -3.0419921875, -2.59228515625, -2.142578125, -1.69287109375, -1.2431640625, -0.79345703125, -0.34375, 0.10595703125, 0.5556640625, 1.00537109375, 1.455078125, 1.90478515625, 2.3544921875, 2.80419921875, 3.25390625, 3.70361328125, 4.1533203125, 4.60302734375, 5.052734375, 5.50244140625, 5.9521484375, 6.40185546875, 6.8515625, 7.30126953125, 7.7509765625, 8.20068359375, 8.650390625, 9.10009765625, 9.5498046875, 9.99951171875, 10.44921875, 10.89892578125, 11.3486328125, 11.79833984375, 12.248046875, 12.69775390625, 13.1474609375, 13.59716796875, 14.046875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 6.0, 6.0, 8.0, 10.0, 17.0, 17.0, 16.0, 17.0, 16.0, 29.0, 34.0, 41.0, 37.0, 37.0, 45.0, 36.0, 46.0, 47.0, 38.0, 53.0, 43.0, 36.0, 27.0, 32.0, 38.0, 27.0, 34.0, 34.0, 25.0, 23.0, 20.0, 27.0, 19.0, 12.0, 13.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.796875, -23.990478515625, -23.18408203125, -22.377685546875, -21.5712890625, -20.764892578125, -19.95849609375, -19.152099609375, -18.345703125, -17.539306640625, -16.73291015625, -15.926513671875, -15.1201171875, -14.313720703125, -13.50732421875, -12.700927734375, -11.89453125, -11.088134765625, -10.28173828125, -9.475341796875, -8.6689453125, -7.862548828125, -7.05615234375, -6.249755859375, -5.443359375, -4.636962890625, -3.83056640625, -3.024169921875, -2.2177734375, -1.411376953125, -0.60498046875, 0.201416015625, 1.0078125, 1.814208984375, 2.62060546875, 3.427001953125, 4.2333984375, 5.039794921875, 5.84619140625, 6.652587890625, 7.458984375, 8.265380859375, 9.07177734375, 9.878173828125, 10.6845703125, 11.490966796875, 12.29736328125, 13.103759765625, 13.91015625, 14.716552734375, 15.52294921875, 16.329345703125, 17.1357421875, 17.942138671875, 18.74853515625, 19.554931640625, 20.361328125, 21.167724609375, 21.97412109375, 22.780517578125, 23.5869140625, 24.393310546875, 25.19970703125, 26.006103515625, 26.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 9.0, 13.0, 11.0, 25.0, 23.0, 42.0, 65.0, 63.0, 132.0, 151.0, 209.0, 301.0, 444.0, 662.0, 951.0, 1321.0, 2091.0, 3223.0, 5351.0, 8662.0, 15274.0, 32503.0, 724323.0, 193773.0, 24985.0, 13108.0, 7510.0, 4683.0, 2910.0, 1873.0, 1240.0, 817.0, 555.0, 355.0, 261.0, 191.0, 125.0, 89.0, 66.0, 57.0, 39.0, 18.0, 19.0, 7.0, 8.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.0, -33.86572265625, -32.7314453125, -31.59716796875, -30.462890625, -29.32861328125, -28.1943359375, -27.06005859375, -25.92578125, -24.79150390625, -23.6572265625, -22.52294921875, -21.388671875, -20.25439453125, -19.1201171875, -17.98583984375, -16.8515625, -15.71728515625, -14.5830078125, -13.44873046875, -12.314453125, -11.18017578125, -10.0458984375, -8.91162109375, -7.77734375, -6.64306640625, -5.5087890625, -4.37451171875, -3.240234375, -2.10595703125, -0.9716796875, 0.16259765625, 1.296875, 2.43115234375, 3.5654296875, 4.69970703125, 5.833984375, 6.96826171875, 8.1025390625, 9.23681640625, 10.37109375, 11.50537109375, 12.6396484375, 13.77392578125, 14.908203125, 16.04248046875, 17.1767578125, 18.31103515625, 19.4453125, 20.57958984375, 21.7138671875, 22.84814453125, 23.982421875, 25.11669921875, 26.2509765625, 27.38525390625, 28.51953125, 29.65380859375, 30.7880859375, 31.92236328125, 33.056640625, 34.19091796875, 35.3251953125, 36.45947265625, 37.59375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 11.0, 8.0, 8.0, 12.0, 8.0, 18.0, 14.0, 27.0, 20.0, 30.0, 29.0, 36.0, 42.0, 52.0, 47.0, 54.0, 56.0, 60.0, 59.0, 48.0, 49.0, 39.0, 47.0, 37.0, 35.0, 26.0, 20.0, 24.0, 19.0, 14.0, 11.0, 7.0, 9.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.546630859375, -22.68701171875, -21.827392578125, -20.9677734375, -20.108154296875, -19.24853515625, -18.388916015625, -17.529296875, -16.669677734375, -15.81005859375, -14.950439453125, -14.0908203125, -13.231201171875, -12.37158203125, -11.511962890625, -10.65234375, -9.792724609375, -8.93310546875, -8.073486328125, -7.2138671875, -6.354248046875, -5.49462890625, -4.635009765625, -3.775390625, -2.915771484375, -2.05615234375, -1.196533203125, -0.3369140625, 0.522705078125, 1.38232421875, 2.241943359375, 3.1015625, 3.961181640625, 4.82080078125, 5.680419921875, 6.5400390625, 7.399658203125, 8.25927734375, 9.118896484375, 9.978515625, 10.838134765625, 11.69775390625, 12.557373046875, 13.4169921875, 14.276611328125, 15.13623046875, 15.995849609375, 16.85546875, 17.715087890625, 18.57470703125, 19.434326171875, 20.2939453125, 21.153564453125, 22.01318359375, 22.872802734375, 23.732421875, 24.592041015625, 25.45166015625, 26.311279296875, 27.1708984375, 28.030517578125, 28.89013671875, 29.749755859375, 30.609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 11.0, 4.0, 8.0, 6.0, 15.0, 19.0, 27.0, 33.0, 33.0, 78.0, 105.0, 175.0, 242.0, 429.0, 600.0, 998.0, 1839.0, 3163.0, 5787.0, 10821.0, 23013.0, 101112.0, 823349.0, 40568.0, 16720.0, 8463.0, 4579.0, 2451.0, 1461.0, 892.0, 486.0, 365.0, 230.0, 138.0, 95.0, 68.0, 54.0, 36.0, 29.0, 16.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4921875, -7.26019287109375, -7.0281982421875, -6.79620361328125, -6.564208984375, -6.33221435546875, -6.1002197265625, -5.86822509765625, -5.63623046875, -5.40423583984375, -5.1722412109375, -4.94024658203125, -4.708251953125, -4.47625732421875, -4.2442626953125, -4.01226806640625, -3.7802734375, -3.54827880859375, -3.3162841796875, -3.08428955078125, -2.852294921875, -2.62030029296875, -2.3883056640625, -2.15631103515625, -1.92431640625, -1.69232177734375, -1.4603271484375, -1.22833251953125, -0.996337890625, -0.76434326171875, -0.5323486328125, -0.30035400390625, -0.068359375, 0.16363525390625, 0.3956298828125, 0.62762451171875, 0.859619140625, 1.09161376953125, 1.3236083984375, 1.55560302734375, 1.78759765625, 2.01959228515625, 2.2515869140625, 2.48358154296875, 2.715576171875, 2.94757080078125, 3.1795654296875, 3.41156005859375, 3.6435546875, 3.87554931640625, 4.1075439453125, 4.33953857421875, 4.571533203125, 4.80352783203125, 5.0355224609375, 5.26751708984375, 5.49951171875, 5.73150634765625, 5.9635009765625, 6.19549560546875, 6.427490234375, 6.65948486328125, 6.8914794921875, 7.12347412109375, 7.35546875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 9.0, 9.0, 21.0, 21.0, 28.0, 38.0, 41.0, 59.0, 64.0, 75.0, 77.0, 91.0, 79.0, 68.0, 51.0, 39.0, 25.0, 30.0, 19.0, 18.0, 13.0, 17.0, 16.0, 9.0, 8.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009946823120117188, -0.0009636133909225464, -0.000932544469833374, -0.0009014755487442017, -0.0008704066276550293, -0.0008393377065658569, -0.0008082687854766846, -0.0007771998643875122, -0.0007461309432983398, -0.0007150620222091675, -0.0006839931011199951, -0.0006529241800308228, -0.0006218552589416504, -0.000590786337852478, -0.0005597174167633057, -0.0005286484956741333, -0.0004975795745849609, -0.0004665106534957886, -0.0004354417324066162, -0.00040437281131744385, -0.0003733038902282715, -0.0003422349691390991, -0.00031116604804992676, -0.0002800971269607544, -0.00024902820587158203, -0.00021795928478240967, -0.0001868903636932373, -0.00015582144260406494, -0.00012475252151489258, -9.368360042572021e-05, -6.261467933654785e-05, -3.154575824737549e-05, -4.76837158203125e-07, 3.059208393096924e-05, 6.16610050201416e-05, 9.272992610931396e-05, 0.00012379884719848633, 0.0001548677682876587, 0.00018593668937683105, 0.00021700561046600342, 0.0002480745315551758, 0.00027914345264434814, 0.0003102123737335205, 0.00034128129482269287, 0.00037235021591186523, 0.0004034191370010376, 0.00043448805809020996, 0.0004655569791793823, 0.0004966259002685547, 0.000527694821357727, 0.0005587637424468994, 0.0005898326635360718, 0.0006209015846252441, 0.0006519705057144165, 0.0006830394268035889, 0.0007141083478927612, 0.0007451772689819336, 0.000776246190071106, 0.0008073151111602783, 0.0008383840322494507, 0.000869452953338623, 0.0009005218744277954, 0.0009315907955169678, 0.0009626597166061401, 0.0009937286376953125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 15.0, 12.0, 25.0, 33.0, 47.0, 65.0, 79.0, 154.0, 198.0, 290.0, 414.0, 638.0, 1054.0, 1535.0, 2600.0, 4377.0, 7614.0, 13250.0, 24151.0, 43480.0, 76554.0, 126405.0, 180612.0, 194406.0, 149415.0, 94911.0, 55291.0, 30497.0, 16927.0, 9409.0, 5391.0, 3200.0, 1925.0, 1267.0, 785.0, 463.0, 332.0, 212.0, 143.0, 103.0, 76.0, 58.0, 33.0, 46.0, 26.0, 10.0, 5.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.77734375, -3.666900634765625, -3.55645751953125, -3.446014404296875, -3.3355712890625, -3.225128173828125, -3.11468505859375, -3.004241943359375, -2.893798828125, -2.783355712890625, -2.67291259765625, -2.562469482421875, -2.4520263671875, -2.341583251953125, -2.23114013671875, -2.120697021484375, -2.01025390625, -1.899810791015625, -1.78936767578125, -1.678924560546875, -1.5684814453125, -1.458038330078125, -1.34759521484375, -1.237152099609375, -1.126708984375, -1.016265869140625, -0.90582275390625, -0.795379638671875, -0.6849365234375, -0.574493408203125, -0.46405029296875, -0.353607177734375, -0.2431640625, -0.132720947265625, -0.02227783203125, 0.088165283203125, 0.1986083984375, 0.309051513671875, 0.41949462890625, 0.529937744140625, 0.640380859375, 0.750823974609375, 0.86126708984375, 0.971710205078125, 1.0821533203125, 1.192596435546875, 1.30303955078125, 1.413482666015625, 1.52392578125, 1.634368896484375, 1.74481201171875, 1.855255126953125, 1.9656982421875, 2.076141357421875, 2.18658447265625, 2.297027587890625, 2.407470703125, 2.517913818359375, 2.62835693359375, 2.738800048828125, 2.8492431640625, 2.959686279296875, 3.07012939453125, 3.180572509765625, 3.291015625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 7.0, 11.0, 12.0, 11.0, 9.0, 15.0, 25.0, 22.0, 25.0, 45.0, 58.0, 43.0, 64.0, 60.0, 53.0, 80.0, 55.0, 57.0, 61.0, 42.0, 40.0, 37.0, 35.0, 28.0, 24.0, 13.0, 10.0, 6.0, 6.0, 8.0, 13.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.41015625, -1.371368408203125, -1.33258056640625, -1.293792724609375, -1.2550048828125, -1.216217041015625, -1.17742919921875, -1.138641357421875, -1.099853515625, -1.061065673828125, -1.02227783203125, -0.983489990234375, -0.9447021484375, -0.905914306640625, -0.86712646484375, -0.828338623046875, -0.78955078125, -0.750762939453125, -0.71197509765625, -0.673187255859375, -0.6343994140625, -0.595611572265625, -0.55682373046875, -0.518035888671875, -0.479248046875, -0.440460205078125, -0.40167236328125, -0.362884521484375, -0.3240966796875, -0.285308837890625, -0.24652099609375, -0.207733154296875, -0.1689453125, -0.130157470703125, -0.09136962890625, -0.052581787109375, -0.0137939453125, 0.024993896484375, 0.06378173828125, 0.102569580078125, 0.141357421875, 0.180145263671875, 0.21893310546875, 0.257720947265625, 0.2965087890625, 0.335296630859375, 0.37408447265625, 0.412872314453125, 0.45166015625, 0.490447998046875, 0.52923583984375, 0.568023681640625, 0.6068115234375, 0.645599365234375, 0.68438720703125, 0.723175048828125, 0.761962890625, 0.800750732421875, 0.83953857421875, 0.878326416015625, 0.9171142578125, 0.955902099609375, 0.99468994140625, 1.033477783203125, 1.072265625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 13.0, 12.0, 23.0, 22.0, 21.0, 23.0, 31.0, 33.0, 35.0, 47.0, 45.0, 41.0, 44.0, 55.0, 58.0, 58.0, 50.0, 57.0, 52.0, 48.0, 33.0, 35.0, 25.0, 28.0, 28.0, 14.0, 11.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.869583129882812, -23.966888427734375, -23.064193725585938, -22.1614990234375, -21.258804321289062, -20.356109619140625, -19.453414916992188, -18.55072021484375, -17.648025512695312, -16.745330810546875, -15.842636108398438, -14.93994140625, -14.037246704101562, -13.134552001953125, -12.231856346130371, -11.329161643981934, -10.42646598815918, -9.523771286010742, -8.621076583862305, -7.718381404876709, -6.8156867027282715, -5.912992000579834, -5.010296821594238, -4.107602119445801, -3.2049074172973633, -2.302212715148926, -1.3995177745819092, -0.4968228340148926, 0.4058718681335449, 1.3085665702819824, 2.211261749267578, 3.1139564514160156, 4.016651153564453, 4.919345855712891, 5.822040557861328, 6.724735736846924, 7.627430438995361, 8.53012466430664, 9.432820320129395, 10.335515022277832, 11.23820972442627, 12.140904426574707, 13.043599128723145, 13.946294784545898, 14.848989486694336, 15.751684188842773, 16.65437889099121, 17.55707359313965, 18.459768295288086, 19.362462997436523, 20.26515769958496, 21.1678524017334, 22.070547103881836, 22.973241806030273, 23.875938415527344, 24.77863311767578, 25.68132781982422, 26.584022521972656, 27.486717224121094, 28.38941192626953, 29.29210662841797, 30.194801330566406, 31.097496032714844, 32.00019073486328, 32.90288543701172]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 16.0, 9.0, 16.0, 19.0, 20.0, 17.0, 25.0, 26.0, 28.0, 37.0, 38.0, 37.0, 38.0, 51.0, 28.0, 45.0, 54.0, 42.0, 35.0, 42.0, 28.0, 34.0, 30.0, 32.0, 30.0, 27.0, 28.0, 31.0, 20.0, 13.0, 15.0, 27.0, 9.0, 6.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.204423904418945, -22.469974517822266, -21.735523223876953, -21.001073837280273, -20.26662254333496, -19.53217315673828, -18.79772186279297, -18.06327247619629, -17.32882308959961, -16.59437370300293, -15.859922409057617, -15.125473022460938, -14.391021728515625, -13.656572341918945, -12.92212200164795, -12.187671661376953, -11.45322036743164, -10.718770027160645, -9.984319686889648, -9.249870300292969, -8.515419006347656, -7.780969142913818, -7.0465192794799805, -6.312068939208984, -5.577618598937988, -4.843168258666992, -4.108717918395996, -3.374268054962158, -2.639817714691162, -1.905367374420166, -1.1709175109863281, -0.43646717071533203, 0.29798126220703125, 1.0324314832687378, 1.7668817043304443, 2.5013318061828613, 3.2357821464538574, 3.9702324867248535, 4.704682350158691, 5.4391326904296875, 6.173583030700684, 6.90803337097168, 7.642483711242676, 8.376934051513672, 9.111383438110352, 9.845834732055664, 10.580284118652344, 11.31473445892334, 12.049184799194336, 12.783635139465332, 13.518085479736328, 14.252534866333008, 14.98698616027832, 15.721435546875, 16.455886840820312, 17.190336227416992, 17.924785614013672, 18.65923500061035, 19.393686294555664, 20.128135681152344, 20.862586975097656, 21.597036361694336, 22.331485748291016, 23.065937042236328, 23.80038833618164]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 29.0, 37.0, 55.0, 95.0, 143.0, 237.0, 337.0, 530.0, 878.0, 1337.0, 1948.0, 3210.0, 4837.0, 7632.0, 11890.0, 18504.0, 27989.0, 41775.0, 59828.0, 82951.0, 106070.0, 122432.0, 126501.0, 115354.0, 94807.0, 70614.0, 50169.0, 33781.0, 22892.0, 14855.0, 9762.0, 5968.0, 3870.0, 2534.0, 1672.0, 1084.0, 669.0, 425.0, 291.0, 188.0, 118.0, 74.0, 49.0, 37.0, 29.0, 10.0, 9.0, 4.0, 8.0, 4.0, 1.0, 3.0, 3.0], "bins": [-28.765625, -27.900390625, -27.03515625, -26.169921875, -25.3046875, -24.439453125, -23.57421875, -22.708984375, -21.84375, -20.978515625, -20.11328125, -19.248046875, -18.3828125, -17.517578125, -16.65234375, -15.787109375, -14.921875, -14.056640625, -13.19140625, -12.326171875, -11.4609375, -10.595703125, -9.73046875, -8.865234375, -8.0, -7.134765625, -6.26953125, -5.404296875, -4.5390625, -3.673828125, -2.80859375, -1.943359375, -1.078125, -0.212890625, 0.65234375, 1.517578125, 2.3828125, 3.248046875, 4.11328125, 4.978515625, 5.84375, 6.708984375, 7.57421875, 8.439453125, 9.3046875, 10.169921875, 11.03515625, 11.900390625, 12.765625, 13.630859375, 14.49609375, 15.361328125, 16.2265625, 17.091796875, 17.95703125, 18.822265625, 19.6875, 20.552734375, 21.41796875, 22.283203125, 23.1484375, 24.013671875, 24.87890625, 25.744140625, 26.609375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 8.0, 10.0, 18.0, 7.0, 14.0, 19.0, 24.0, 20.0, 20.0, 38.0, 31.0, 33.0, 28.0, 38.0, 33.0, 46.0, 50.0, 28.0, 47.0, 31.0, 32.0, 43.0, 42.0, 43.0, 36.0, 27.0, 32.0, 19.0, 23.0, 27.0, 21.0, 15.0, 20.0, 17.0, 9.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.098876953125, -20.40087890625, -19.702880859375, -19.0048828125, -18.306884765625, -17.60888671875, -16.910888671875, -16.212890625, -15.514892578125, -14.81689453125, -14.118896484375, -13.4208984375, -12.722900390625, -12.02490234375, -11.326904296875, -10.62890625, -9.930908203125, -9.23291015625, -8.534912109375, -7.8369140625, -7.138916015625, -6.44091796875, -5.742919921875, -5.044921875, -4.346923828125, -3.64892578125, -2.950927734375, -2.2529296875, -1.554931640625, -0.85693359375, -0.158935546875, 0.5390625, 1.237060546875, 1.93505859375, 2.633056640625, 3.3310546875, 4.029052734375, 4.72705078125, 5.425048828125, 6.123046875, 6.821044921875, 7.51904296875, 8.217041015625, 8.9150390625, 9.613037109375, 10.31103515625, 11.009033203125, 11.70703125, 12.405029296875, 13.10302734375, 13.801025390625, 14.4990234375, 15.197021484375, 15.89501953125, 16.593017578125, 17.291015625, 17.989013671875, 18.68701171875, 19.385009765625, 20.0830078125, 20.781005859375, 21.47900390625, 22.177001953125, 22.875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 20.0, 14.0, 23.0, 28.0, 53.0, 82.0, 136.0, 217.0, 325.0, 487.0, 781.0, 1177.0, 1777.0, 2847.0, 4137.0, 6166.0, 9528.0, 13520.0, 19323.0, 27671.0, 38352.0, 50891.0, 65814.0, 80844.0, 93688.0, 101429.0, 102982.0, 94082.0, 82344.0, 66949.0, 52426.0, 39184.0, 28400.0, 20232.0, 14013.0, 9541.0, 6513.0, 4295.0, 2852.0, 1847.0, 1222.0, 848.0, 544.0, 329.0, 211.0, 149.0, 81.0, 76.0, 42.0, 29.0, 17.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-22.859375, -22.14599609375, -21.4326171875, -20.71923828125, -20.005859375, -19.29248046875, -18.5791015625, -17.86572265625, -17.15234375, -16.43896484375, -15.7255859375, -15.01220703125, -14.298828125, -13.58544921875, -12.8720703125, -12.15869140625, -11.4453125, -10.73193359375, -10.0185546875, -9.30517578125, -8.591796875, -7.87841796875, -7.1650390625, -6.45166015625, -5.73828125, -5.02490234375, -4.3115234375, -3.59814453125, -2.884765625, -2.17138671875, -1.4580078125, -0.74462890625, -0.03125, 0.68212890625, 1.3955078125, 2.10888671875, 2.822265625, 3.53564453125, 4.2490234375, 4.96240234375, 5.67578125, 6.38916015625, 7.1025390625, 7.81591796875, 8.529296875, 9.24267578125, 9.9560546875, 10.66943359375, 11.3828125, 12.09619140625, 12.8095703125, 13.52294921875, 14.236328125, 14.94970703125, 15.6630859375, 16.37646484375, 17.08984375, 17.80322265625, 18.5166015625, 19.22998046875, 19.943359375, 20.65673828125, 21.3701171875, 22.08349609375, 22.796875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 16.0, 13.0, 17.0, 19.0, 25.0, 26.0, 22.0, 32.0, 31.0, 30.0, 33.0, 31.0, 35.0, 37.0, 47.0, 47.0, 30.0, 43.0, 41.0, 31.0, 35.0, 45.0, 32.0, 32.0, 34.0, 37.0, 32.0, 30.0, 16.0, 9.0, 16.0, 15.0, 9.0, 7.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.593505859375, -16.12451171875, -15.655517578125, -15.1865234375, -14.717529296875, -14.24853515625, -13.779541015625, -13.310546875, -12.841552734375, -12.37255859375, -11.903564453125, -11.4345703125, -10.965576171875, -10.49658203125, -10.027587890625, -9.55859375, -9.089599609375, -8.62060546875, -8.151611328125, -7.6826171875, -7.213623046875, -6.74462890625, -6.275634765625, -5.806640625, -5.337646484375, -4.86865234375, -4.399658203125, -3.9306640625, -3.461669921875, -2.99267578125, -2.523681640625, -2.0546875, -1.585693359375, -1.11669921875, -0.647705078125, -0.1787109375, 0.290283203125, 0.75927734375, 1.228271484375, 1.697265625, 2.166259765625, 2.63525390625, 3.104248046875, 3.5732421875, 4.042236328125, 4.51123046875, 4.980224609375, 5.44921875, 5.918212890625, 6.38720703125, 6.856201171875, 7.3251953125, 7.794189453125, 8.26318359375, 8.732177734375, 9.201171875, 9.670166015625, 10.13916015625, 10.608154296875, 11.0771484375, 11.546142578125, 12.01513671875, 12.484130859375, 12.953125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 18.0, 20.0, 35.0, 53.0, 81.0, 109.0, 199.0, 256.0, 436.0, 651.0, 1161.0, 2046.0, 3313.0, 5582.0, 9923.0, 17664.0, 31659.0, 56208.0, 95968.0, 149091.0, 189343.0, 176799.0, 127086.0, 77757.0, 44498.0, 25192.0, 14065.0, 7982.0, 4674.0, 2666.0, 1576.0, 896.0, 547.0, 373.0, 204.0, 133.0, 87.0, 56.0, 35.0, 35.0, 19.0, 17.0, 11.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.640625, -13.2247314453125, -12.808837890625, -12.3929443359375, -11.97705078125, -11.5611572265625, -11.145263671875, -10.7293701171875, -10.3134765625, -9.8975830078125, -9.481689453125, -9.0657958984375, -8.64990234375, -8.2340087890625, -7.818115234375, -7.4022216796875, -6.986328125, -6.5704345703125, -6.154541015625, -5.7386474609375, -5.32275390625, -4.9068603515625, -4.490966796875, -4.0750732421875, -3.6591796875, -3.2432861328125, -2.827392578125, -2.4114990234375, -1.99560546875, -1.5797119140625, -1.163818359375, -0.7479248046875, -0.33203125, 0.0838623046875, 0.499755859375, 0.9156494140625, 1.33154296875, 1.7474365234375, 2.163330078125, 2.5792236328125, 2.9951171875, 3.4110107421875, 3.826904296875, 4.2427978515625, 4.65869140625, 5.0745849609375, 5.490478515625, 5.9063720703125, 6.322265625, 6.7381591796875, 7.154052734375, 7.5699462890625, 7.98583984375, 8.4017333984375, 8.817626953125, 9.2335205078125, 9.6494140625, 10.0653076171875, 10.481201171875, 10.8970947265625, 11.31298828125, 11.7288818359375, 12.144775390625, 12.5606689453125, 12.9765625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 8.0, 12.0, 10.0, 22.0, 25.0, 18.0, 43.0, 42.0, 48.0, 58.0, 71.0, 82.0, 87.0, 63.0, 80.0, 60.0, 62.0, 34.0, 39.0, 21.0, 31.0, 15.0, 10.0, 9.0, 7.0, 8.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00180816650390625, -0.0017583668231964111, -0.0017085671424865723, -0.0016587674617767334, -0.0016089677810668945, -0.0015591681003570557, -0.0015093684196472168, -0.001459568738937378, -0.001409769058227539, -0.0013599693775177002, -0.0013101696968078613, -0.0012603700160980225, -0.0012105703353881836, -0.0011607706546783447, -0.0011109709739685059, -0.001061171293258667, -0.0010113716125488281, -0.0009615719318389893, -0.0009117722511291504, -0.0008619725704193115, -0.0008121728897094727, -0.0007623732089996338, -0.0007125735282897949, -0.0006627738475799561, -0.0006129741668701172, -0.0005631744861602783, -0.0005133748054504395, -0.0004635751247406006, -0.0004137754440307617, -0.00036397576332092285, -0.000314176082611084, -0.0002643764019012451, -0.00021457672119140625, -0.00016477704048156738, -0.00011497735977172852, -6.517767906188965e-05, -1.537799835205078e-05, 3.4421682357788086e-05, 8.422136306762695e-05, 0.00013402104377746582, 0.0001838207244873047, 0.00023362040519714355, 0.0002834200859069824, 0.0003332197666168213, 0.00038301944732666016, 0.000432819128036499, 0.0004826188087463379, 0.0005324184894561768, 0.0005822181701660156, 0.0006320178508758545, 0.0006818175315856934, 0.0007316172122955322, 0.0007814168930053711, 0.00083121657371521, 0.0008810162544250488, 0.0009308159351348877, 0.0009806156158447266, 0.0010304152965545654, 0.0010802149772644043, 0.0011300146579742432, 0.001179814338684082, 0.001229614019393921, 0.0012794137001037598, 0.0013292133808135986, 0.0013790130615234375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 11.0, 22.0, 19.0, 38.0, 54.0, 88.0, 121.0, 197.0, 305.0, 521.0, 856.0, 1473.0, 2468.0, 4160.0, 7301.0, 12294.0, 21399.0, 36063.0, 59802.0, 94490.0, 133180.0, 161283.0, 158612.0, 127981.0, 88716.0, 56004.0, 33810.0, 19544.0, 11599.0, 6604.0, 3877.0, 2228.0, 1337.0, 824.0, 477.0, 269.0, 183.0, 125.0, 60.0, 39.0, 32.0, 26.0, 13.0, 17.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.2578125, -9.9365234375, -9.615234375, -9.2939453125, -8.97265625, -8.6513671875, -8.330078125, -8.0087890625, -7.6875, -7.3662109375, -7.044921875, -6.7236328125, -6.40234375, -6.0810546875, -5.759765625, -5.4384765625, -5.1171875, -4.7958984375, -4.474609375, -4.1533203125, -3.83203125, -3.5107421875, -3.189453125, -2.8681640625, -2.546875, -2.2255859375, -1.904296875, -1.5830078125, -1.26171875, -0.9404296875, -0.619140625, -0.2978515625, 0.0234375, 0.3447265625, 0.666015625, 0.9873046875, 1.30859375, 1.6298828125, 1.951171875, 2.2724609375, 2.59375, 2.9150390625, 3.236328125, 3.5576171875, 3.87890625, 4.2001953125, 4.521484375, 4.8427734375, 5.1640625, 5.4853515625, 5.806640625, 6.1279296875, 6.44921875, 6.7705078125, 7.091796875, 7.4130859375, 7.734375, 8.0556640625, 8.376953125, 8.6982421875, 9.01953125, 9.3408203125, 9.662109375, 9.9833984375, 10.3046875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 12.0, 9.0, 11.0, 17.0, 18.0, 26.0, 18.0, 41.0, 45.0, 52.0, 66.0, 63.0, 75.0, 57.0, 65.0, 56.0, 74.0, 63.0, 44.0, 32.0, 35.0, 22.0, 24.0, 13.0, 16.0, 14.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8828125, -3.74700927734375, -3.6112060546875, -3.47540283203125, -3.339599609375, -3.20379638671875, -3.0679931640625, -2.93218994140625, -2.79638671875, -2.66058349609375, -2.5247802734375, -2.38897705078125, -2.253173828125, -2.11737060546875, -1.9815673828125, -1.84576416015625, -1.7099609375, -1.57415771484375, -1.4383544921875, -1.30255126953125, -1.166748046875, -1.03094482421875, -0.8951416015625, -0.75933837890625, -0.62353515625, -0.48773193359375, -0.3519287109375, -0.21612548828125, -0.080322265625, 0.05548095703125, 0.1912841796875, 0.32708740234375, 0.462890625, 0.59869384765625, 0.7344970703125, 0.87030029296875, 1.006103515625, 1.14190673828125, 1.2777099609375, 1.41351318359375, 1.54931640625, 1.68511962890625, 1.8209228515625, 1.95672607421875, 2.092529296875, 2.22833251953125, 2.3641357421875, 2.49993896484375, 2.6357421875, 2.77154541015625, 2.9073486328125, 3.04315185546875, 3.178955078125, 3.31475830078125, 3.4505615234375, 3.58636474609375, 3.72216796875, 3.85797119140625, 3.9937744140625, 4.12957763671875, 4.265380859375, 4.40118408203125, 4.5369873046875, 4.67279052734375, 4.80859375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 7.0, 13.0, 3.0, 12.0, 16.0, 29.0, 30.0, 30.0, 37.0, 56.0, 44.0, 39.0, 63.0, 57.0, 67.0, 43.0, 37.0, 50.0, 53.0, 44.0, 45.0, 40.0, 38.0, 39.0, 23.0, 12.0, 16.0, 14.0, 5.0, 4.0, 8.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.73617935180664, -25.854040145874023, -24.971899032592773, -24.089759826660156, -23.20762062072754, -22.325481414794922, -21.443340301513672, -20.561201095581055, -19.679061889648438, -18.79692268371582, -17.91478157043457, -17.032642364501953, -16.150503158569336, -15.268362998962402, -14.386222839355469, -13.504083633422852, -12.621942520141602, -11.739802360534668, -10.85766315460205, -9.975522994995117, -9.0933837890625, -8.211243629455566, -7.329103469848633, -6.446963787078857, -5.564824104309082, -4.682684421539307, -3.800544500350952, -2.9184045791625977, -2.0362648963928223, -1.1541252136230469, -0.2719850540161133, 0.6101546287536621, 1.4922924041748047, 2.37443208694458, 3.2565720081329346, 4.138711929321289, 5.0208516120910645, 5.90299129486084, 6.785131454467773, 7.667271137237549, 8.549410820007324, 9.431550979614258, 10.313690185546875, 11.195830345153809, 12.077970504760742, 12.96010971069336, 13.842249870300293, 14.724390029907227, 15.606529235839844, 16.48866844177246, 17.37080955505371, 18.252948760986328, 19.135087966918945, 20.017227172851562, 20.899368286132812, 21.78150749206543, 22.663646697998047, 23.545785903930664, 24.427927017211914, 25.31006622314453, 26.19220542907715, 27.074344635009766, 27.956485748291016, 28.838624954223633, 29.720766067504883]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 2.0, 11.0, 8.0, 8.0, 11.0, 10.0, 14.0, 7.0, 17.0, 18.0, 25.0, 19.0, 31.0, 22.0, 38.0, 36.0, 40.0, 38.0, 32.0, 51.0, 37.0, 34.0, 38.0, 48.0, 42.0, 32.0, 35.0, 33.0, 21.0, 32.0, 29.0, 23.0, 16.0, 23.0, 14.0, 15.0, 12.0, 13.0, 8.0, 15.0, 11.0, 5.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-24.233980178833008, -23.551773071289062, -22.869565963745117, -22.187358856201172, -21.505151748657227, -20.82294464111328, -20.14073944091797, -19.45853042602539, -18.776325225830078, -18.094118118286133, -17.411911010742188, -16.729703903198242, -16.047496795654297, -15.365289688110352, -14.683083534240723, -14.000876426696777, -13.318668365478516, -12.63646125793457, -11.954254150390625, -11.27204704284668, -10.589839935302734, -9.907632827758789, -9.22542667388916, -8.543219566345215, -7.8610124588012695, -7.178805351257324, -6.496598243713379, -5.814391613006592, -5.1321845054626465, -4.449977397918701, -3.767770767211914, -3.0855636596679688, -2.4033584594726562, -1.7211514711380005, -1.0389444828033447, -0.3567376136779785, 0.3254694938659668, 1.007676601409912, 1.6898832321166992, 2.3720903396606445, 3.05429744720459, 3.736504554748535, 4.4187116622924805, 5.100918292999268, 5.783125400543213, 6.465332508087158, 7.147539138793945, 7.829746246337891, 8.511953353881836, 9.194160461425781, 9.876367568969727, 10.558574676513672, 11.240781784057617, 11.922988891601562, 12.605195045471191, 13.287402153015137, 13.969609260559082, 14.651816368103027, 15.334023475646973, 16.0162296295166, 16.698436737060547, 17.380643844604492, 18.062850952148438, 18.745058059692383, 19.427265167236328]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 16.0, 20.0, 39.0, 60.0, 95.0, 133.0, 200.0, 294.0, 509.0, 811.0, 1348.0, 2261.0, 3855.0, 6811.0, 11720.0, 21053.0, 39053.0, 73023.0, 141012.0, 273685.0, 518285.0, 843565.0, 919731.0, 625401.0, 338054.0, 174321.0, 91071.0, 47567.0, 25884.0, 14245.0, 8200.0, 4815.0, 2782.0, 1713.0, 1011.0, 617.0, 371.0, 243.0, 140.0, 107.0, 58.0, 35.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.390625, -26.482421875, -25.57421875, -24.666015625, -23.7578125, -22.849609375, -21.94140625, -21.033203125, -20.125, -19.216796875, -18.30859375, -17.400390625, -16.4921875, -15.583984375, -14.67578125, -13.767578125, -12.859375, -11.951171875, -11.04296875, -10.134765625, -9.2265625, -8.318359375, -7.41015625, -6.501953125, -5.59375, -4.685546875, -3.77734375, -2.869140625, -1.9609375, -1.052734375, -0.14453125, 0.763671875, 1.671875, 2.580078125, 3.48828125, 4.396484375, 5.3046875, 6.212890625, 7.12109375, 8.029296875, 8.9375, 9.845703125, 10.75390625, 11.662109375, 12.5703125, 13.478515625, 14.38671875, 15.294921875, 16.203125, 17.111328125, 18.01953125, 18.927734375, 19.8359375, 20.744140625, 21.65234375, 22.560546875, 23.46875, 24.376953125, 25.28515625, 26.193359375, 27.1015625, 28.009765625, 28.91796875, 29.826171875, 30.734375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 9.0, 7.0, 9.0, 10.0, 9.0, 13.0, 11.0, 14.0, 17.0, 21.0, 21.0, 28.0, 37.0, 42.0, 32.0, 21.0, 35.0, 46.0, 41.0, 42.0, 35.0, 44.0, 39.0, 38.0, 36.0, 42.0, 31.0, 26.0, 26.0, 32.0, 24.0, 23.0, 12.0, 13.0, 15.0, 21.0, 11.0, 11.0, 10.0, 6.0, 6.0, 12.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.984375, -16.462158203125, -15.93994140625, -15.417724609375, -14.8955078125, -14.373291015625, -13.85107421875, -13.328857421875, -12.806640625, -12.284423828125, -11.76220703125, -11.239990234375, -10.7177734375, -10.195556640625, -9.67333984375, -9.151123046875, -8.62890625, -8.106689453125, -7.58447265625, -7.062255859375, -6.5400390625, -6.017822265625, -5.49560546875, -4.973388671875, -4.451171875, -3.928955078125, -3.40673828125, -2.884521484375, -2.3623046875, -1.840087890625, -1.31787109375, -0.795654296875, -0.2734375, 0.248779296875, 0.77099609375, 1.293212890625, 1.8154296875, 2.337646484375, 2.85986328125, 3.382080078125, 3.904296875, 4.426513671875, 4.94873046875, 5.470947265625, 5.9931640625, 6.515380859375, 7.03759765625, 7.559814453125, 8.08203125, 8.604248046875, 9.12646484375, 9.648681640625, 10.1708984375, 10.693115234375, 11.21533203125, 11.737548828125, 12.259765625, 12.781982421875, 13.30419921875, 13.826416015625, 14.3486328125, 14.870849609375, 15.39306640625, 15.915283203125, 16.4375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 9.0, 22.0, 35.0, 63.0, 99.0, 146.0, 227.0, 345.0, 562.0, 889.0, 1380.0, 2238.0, 3472.0, 5520.0, 8517.0, 13684.0, 21011.0, 33408.0, 52339.0, 82529.0, 127678.0, 196691.0, 295586.0, 423378.0, 556947.0, 618748.0, 542010.0, 405500.0, 280182.0, 186211.0, 121175.0, 78030.0, 49481.0, 31531.0, 20051.0, 12467.0, 7966.0, 4983.0, 3329.0, 2165.0, 1281.0, 878.0, 566.0, 349.0, 225.0, 137.0, 88.0, 62.0, 29.0, 30.0, 16.0, 11.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-18.046875, -17.490478515625, -16.93408203125, -16.377685546875, -15.8212890625, -15.264892578125, -14.70849609375, -14.152099609375, -13.595703125, -13.039306640625, -12.48291015625, -11.926513671875, -11.3701171875, -10.813720703125, -10.25732421875, -9.700927734375, -9.14453125, -8.588134765625, -8.03173828125, -7.475341796875, -6.9189453125, -6.362548828125, -5.80615234375, -5.249755859375, -4.693359375, -4.136962890625, -3.58056640625, -3.024169921875, -2.4677734375, -1.911376953125, -1.35498046875, -0.798583984375, -0.2421875, 0.314208984375, 0.87060546875, 1.427001953125, 1.9833984375, 2.539794921875, 3.09619140625, 3.652587890625, 4.208984375, 4.765380859375, 5.32177734375, 5.878173828125, 6.4345703125, 6.990966796875, 7.54736328125, 8.103759765625, 8.66015625, 9.216552734375, 9.77294921875, 10.329345703125, 10.8857421875, 11.442138671875, 11.99853515625, 12.554931640625, 13.111328125, 13.667724609375, 14.22412109375, 14.780517578125, 15.3369140625, 15.893310546875, 16.44970703125, 17.006103515625, 17.5625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 11.0, 5.0, 13.0, 5.0, 18.0, 19.0, 22.0, 33.0, 39.0, 34.0, 55.0, 69.0, 69.0, 110.0, 133.0, 157.0, 158.0, 207.0, 238.0, 240.0, 277.0, 263.0, 258.0, 241.0, 224.0, 222.0, 150.0, 138.0, 114.0, 93.0, 89.0, 86.0, 65.0, 58.0, 40.0, 31.0, 25.0, 17.0, 8.0, 16.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.078125, -8.80615234375, -8.5341796875, -8.26220703125, -7.990234375, -7.71826171875, -7.4462890625, -7.17431640625, -6.90234375, -6.63037109375, -6.3583984375, -6.08642578125, -5.814453125, -5.54248046875, -5.2705078125, -4.99853515625, -4.7265625, -4.45458984375, -4.1826171875, -3.91064453125, -3.638671875, -3.36669921875, -3.0947265625, -2.82275390625, -2.55078125, -2.27880859375, -2.0068359375, -1.73486328125, -1.462890625, -1.19091796875, -0.9189453125, -0.64697265625, -0.375, -0.10302734375, 0.1689453125, 0.44091796875, 0.712890625, 0.98486328125, 1.2568359375, 1.52880859375, 1.80078125, 2.07275390625, 2.3447265625, 2.61669921875, 2.888671875, 3.16064453125, 3.4326171875, 3.70458984375, 3.9765625, 4.24853515625, 4.5205078125, 4.79248046875, 5.064453125, 5.33642578125, 5.6083984375, 5.88037109375, 6.15234375, 6.42431640625, 6.6962890625, 6.96826171875, 7.240234375, 7.51220703125, 7.7841796875, 8.05615234375, 8.328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 10.0, 9.0, 17.0, 10.0, 13.0, 17.0, 24.0, 32.0, 38.0, 36.0, 46.0, 36.0, 50.0, 44.0, 63.0, 46.0, 45.0, 55.0, 54.0, 59.0, 42.0, 26.0, 40.0, 29.0, 35.0, 19.0, 14.0, 16.0, 15.0, 13.0, 7.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.473526000976562, -24.72777557373047, -23.982027053833008, -23.236276626586914, -22.490528106689453, -21.74477767944336, -20.999027252197266, -20.253278732299805, -19.50752830505371, -18.761777877807617, -18.016029357910156, -17.270278930664062, -16.5245304107666, -15.778779983520508, -15.03303050994873, -14.287281036376953, -13.541531562805176, -12.795782089233398, -12.050032615661621, -11.304283142089844, -10.55853271484375, -9.812783241271973, -9.067033767700195, -8.321283340454102, -7.575534343719482, -6.829784870147705, -6.0840349197387695, -5.338285446166992, -4.592535972595215, -3.8467860221862793, -3.101036548614502, -2.3552865982055664, -1.609537124633789, -0.8637874722480774, -0.11803781986236572, 0.6277117729187012, 1.3734614849090576, 2.119211196899414, 2.8649606704711914, 3.610710620880127, 4.356460094451904, 5.102209568023682, 5.847959518432617, 6.5937089920043945, 7.339458465576172, 8.085208892822266, 8.830957412719727, 9.57670783996582, 10.322457313537598, 11.068206787109375, 11.813956260681152, 12.55970573425293, 13.305456161499023, 14.0512056350708, 14.796955108642578, 15.542705535888672, 16.288454055786133, 17.034204483032227, 17.779953002929688, 18.52570343017578, 19.271451950073242, 20.017202377319336, 20.762950897216797, 21.50870132446289, 22.254451751708984]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 7.0, 3.0, 10.0, 4.0, 6.0, 9.0, 8.0, 10.0, 13.0, 20.0, 18.0, 20.0, 28.0, 30.0, 41.0, 25.0, 39.0, 31.0, 37.0, 48.0, 46.0, 34.0, 37.0, 43.0, 35.0, 35.0, 48.0, 20.0, 42.0, 31.0, 29.0, 32.0, 20.0, 21.0, 25.0, 18.0, 19.0, 18.0, 13.0, 5.0, 4.0, 5.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.582006454467773, -20.952877044677734, -20.323745727539062, -19.694616317749023, -19.065486907958984, -18.436357498168945, -17.807228088378906, -17.178096771240234, -16.548967361450195, -15.919837951660156, -15.2907075881958, -14.661577224731445, -14.032447814941406, -13.403318405151367, -12.774188041687012, -12.145057678222656, -11.515928268432617, -10.886798858642578, -10.257668495178223, -9.628538131713867, -8.999408721923828, -8.370279312133789, -7.741148948669434, -7.112019062042236, -6.482889175415039, -5.853759288787842, -5.2246294021606445, -4.595499515533447, -3.96636962890625, -3.3372397422790527, -2.7081098556518555, -2.078979969024658, -1.449850082397461, -0.8207201957702637, -0.1915903091430664, 0.43753957748413086, 1.0666694641113281, 1.6957993507385254, 2.3249292373657227, 2.95405912399292, 3.583189010620117, 4.2123188972473145, 4.841448783874512, 5.470578670501709, 6.099708557128906, 6.7288384437561035, 7.357968330383301, 7.987098217010498, 8.616228103637695, 9.245357513427734, 9.87448787689209, 10.503618240356445, 11.132747650146484, 11.761877059936523, 12.391007423400879, 13.020137786865234, 13.649267196655273, 14.278396606445312, 14.907526969909668, 15.536657333374023, 16.165786743164062, 16.7949161529541, 17.42404556274414, 18.053176879882812, 18.68230628967285]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 11.0, 15.0, 21.0, 37.0, 55.0, 88.0, 157.0, 234.0, 379.0, 650.0, 999.0, 1725.0, 2692.0, 4180.0, 6711.0, 10472.0, 15782.0, 23705.0, 34523.0, 48728.0, 65560.0, 84325.0, 101317.0, 112252.0, 112471.0, 103065.0, 87416.0, 69400.0, 51491.0, 36936.0, 25459.0, 17051.0, 11179.0, 7119.0, 4619.0, 2935.0, 1861.0, 1104.0, 682.0, 405.0, 265.0, 180.0, 131.0, 64.0, 47.0, 25.0, 12.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-13.0546875, -12.6717529296875, -12.288818359375, -11.9058837890625, -11.52294921875, -11.1400146484375, -10.757080078125, -10.3741455078125, -9.9912109375, -9.6082763671875, -9.225341796875, -8.8424072265625, -8.45947265625, -8.0765380859375, -7.693603515625, -7.3106689453125, -6.927734375, -6.5447998046875, -6.161865234375, -5.7789306640625, -5.39599609375, -5.0130615234375, -4.630126953125, -4.2471923828125, -3.8642578125, -3.4813232421875, -3.098388671875, -2.7154541015625, -2.33251953125, -1.9495849609375, -1.566650390625, -1.1837158203125, -0.80078125, -0.4178466796875, -0.034912109375, 0.3480224609375, 0.73095703125, 1.1138916015625, 1.496826171875, 1.8797607421875, 2.2626953125, 2.6456298828125, 3.028564453125, 3.4114990234375, 3.79443359375, 4.1773681640625, 4.560302734375, 4.9432373046875, 5.326171875, 5.7091064453125, 6.092041015625, 6.4749755859375, 6.85791015625, 7.2408447265625, 7.623779296875, 8.0067138671875, 8.3896484375, 8.7725830078125, 9.155517578125, 9.5384521484375, 9.92138671875, 10.3043212890625, 10.687255859375, 11.0701904296875, 11.453125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 5.0, 3.0, 11.0, 10.0, 14.0, 15.0, 11.0, 24.0, 24.0, 35.0, 18.0, 32.0, 37.0, 32.0, 60.0, 41.0, 37.0, 41.0, 41.0, 44.0, 42.0, 41.0, 32.0, 36.0, 38.0, 30.0, 27.0, 27.0, 28.0, 33.0, 27.0, 16.0, 13.0, 17.0, 11.0, 10.0, 7.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.09375, -17.55517578125, -17.0166015625, -16.47802734375, -15.939453125, -15.40087890625, -14.8623046875, -14.32373046875, -13.78515625, -13.24658203125, -12.7080078125, -12.16943359375, -11.630859375, -11.09228515625, -10.5537109375, -10.01513671875, -9.4765625, -8.93798828125, -8.3994140625, -7.86083984375, -7.322265625, -6.78369140625, -6.2451171875, -5.70654296875, -5.16796875, -4.62939453125, -4.0908203125, -3.55224609375, -3.013671875, -2.47509765625, -1.9365234375, -1.39794921875, -0.859375, -0.32080078125, 0.2177734375, 0.75634765625, 1.294921875, 1.83349609375, 2.3720703125, 2.91064453125, 3.44921875, 3.98779296875, 4.5263671875, 5.06494140625, 5.603515625, 6.14208984375, 6.6806640625, 7.21923828125, 7.7578125, 8.29638671875, 8.8349609375, 9.37353515625, 9.912109375, 10.45068359375, 10.9892578125, 11.52783203125, 12.06640625, 12.60498046875, 13.1435546875, 13.68212890625, 14.220703125, 14.75927734375, 15.2978515625, 15.83642578125, 16.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 6.0, 9.0, 17.0, 15.0, 22.0, 41.0, 47.0, 50.0, 81.0, 120.0, 178.0, 205.0, 302.0, 413.0, 627.0, 833.0, 1233.0, 1712.0, 2520.0, 3452.0, 5218.0, 7937.0, 12790.0, 21520.0, 63395.0, 808992.0, 58145.0, 20983.0, 12579.0, 7964.0, 5200.0, 3692.0, 2421.0, 1728.0, 1133.0, 819.0, 619.0, 440.0, 287.0, 211.0, 161.0, 115.0, 81.0, 61.0, 46.0, 37.0, 27.0, 14.0, 17.0, 12.0, 5.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0], "bins": [-36.75, -35.61865234375, -34.4873046875, -33.35595703125, -32.224609375, -31.09326171875, -29.9619140625, -28.83056640625, -27.69921875, -26.56787109375, -25.4365234375, -24.30517578125, -23.173828125, -22.04248046875, -20.9111328125, -19.77978515625, -18.6484375, -17.51708984375, -16.3857421875, -15.25439453125, -14.123046875, -12.99169921875, -11.8603515625, -10.72900390625, -9.59765625, -8.46630859375, -7.3349609375, -6.20361328125, -5.072265625, -3.94091796875, -2.8095703125, -1.67822265625, -0.546875, 0.58447265625, 1.7158203125, 2.84716796875, 3.978515625, 5.10986328125, 6.2412109375, 7.37255859375, 8.50390625, 9.63525390625, 10.7666015625, 11.89794921875, 13.029296875, 14.16064453125, 15.2919921875, 16.42333984375, 17.5546875, 18.68603515625, 19.8173828125, 20.94873046875, 22.080078125, 23.21142578125, 24.3427734375, 25.47412109375, 26.60546875, 27.73681640625, 28.8681640625, 29.99951171875, 31.130859375, 32.26220703125, 33.3935546875, 34.52490234375, 35.65625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 10.0, 7.0, 8.0, 15.0, 17.0, 14.0, 20.0, 30.0, 29.0, 35.0, 37.0, 30.0, 39.0, 48.0, 40.0, 66.0, 42.0, 51.0, 46.0, 36.0, 39.0, 41.0, 30.0, 30.0, 30.0, 39.0, 15.0, 19.0, 13.0, 17.0, 15.0, 16.0, 11.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-26.359375, -25.589599609375, -24.81982421875, -24.050048828125, -23.2802734375, -22.510498046875, -21.74072265625, -20.970947265625, -20.201171875, -19.431396484375, -18.66162109375, -17.891845703125, -17.1220703125, -16.352294921875, -15.58251953125, -14.812744140625, -14.04296875, -13.273193359375, -12.50341796875, -11.733642578125, -10.9638671875, -10.194091796875, -9.42431640625, -8.654541015625, -7.884765625, -7.114990234375, -6.34521484375, -5.575439453125, -4.8056640625, -4.035888671875, -3.26611328125, -2.496337890625, -1.7265625, -0.956787109375, -0.18701171875, 0.582763671875, 1.3525390625, 2.122314453125, 2.89208984375, 3.661865234375, 4.431640625, 5.201416015625, 5.97119140625, 6.740966796875, 7.5107421875, 8.280517578125, 9.05029296875, 9.820068359375, 10.58984375, 11.359619140625, 12.12939453125, 12.899169921875, 13.6689453125, 14.438720703125, 15.20849609375, 15.978271484375, 16.748046875, 17.517822265625, 18.28759765625, 19.057373046875, 19.8271484375, 20.596923828125, 21.36669921875, 22.136474609375, 22.90625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 8.0, 15.0, 13.0, 20.0, 34.0, 51.0, 64.0, 92.0, 129.0, 190.0, 324.0, 454.0, 732.0, 1098.0, 1798.0, 2981.0, 5001.0, 8918.0, 17335.0, 48044.0, 801814.0, 110534.0, 22512.0, 11001.0, 5982.0, 3533.0, 2141.0, 1307.0, 831.0, 540.0, 314.0, 220.0, 140.0, 119.0, 83.0, 37.0, 31.0, 35.0, 15.0, 19.0, 12.0, 10.0, 5.0, 4.0, 7.0, 3.0, 3.0, 4.0], "bins": [-14.96875, -14.560546875, -14.15234375, -13.744140625, -13.3359375, -12.927734375, -12.51953125, -12.111328125, -11.703125, -11.294921875, -10.88671875, -10.478515625, -10.0703125, -9.662109375, -9.25390625, -8.845703125, -8.4375, -8.029296875, -7.62109375, -7.212890625, -6.8046875, -6.396484375, -5.98828125, -5.580078125, -5.171875, -4.763671875, -4.35546875, -3.947265625, -3.5390625, -3.130859375, -2.72265625, -2.314453125, -1.90625, -1.498046875, -1.08984375, -0.681640625, -0.2734375, 0.134765625, 0.54296875, 0.951171875, 1.359375, 1.767578125, 2.17578125, 2.583984375, 2.9921875, 3.400390625, 3.80859375, 4.216796875, 4.625, 5.033203125, 5.44140625, 5.849609375, 6.2578125, 6.666015625, 7.07421875, 7.482421875, 7.890625, 8.298828125, 8.70703125, 9.115234375, 9.5234375, 9.931640625, 10.33984375, 10.748046875, 11.15625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 6.0, 7.0, 21.0, 18.0, 19.0, 28.0, 38.0, 49.0, 58.0, 79.0, 91.0, 126.0, 95.0, 88.0, 63.0, 43.0, 28.0, 30.0, 15.0, 19.0, 17.0, 14.0, 9.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039005279541015625, -0.0037538111209869385, -0.0036070942878723145, -0.0034603774547576904, -0.0033136606216430664, -0.0031669437885284424, -0.0030202269554138184, -0.0028735101222991943, -0.0027267932891845703, -0.0025800764560699463, -0.0024333596229553223, -0.0022866427898406982, -0.0021399259567260742, -0.00199320912361145, -0.0018464922904968262, -0.0016997754573822021, -0.0015530586242675781, -0.001406341791152954, -0.00125962495803833, -0.001112908124923706, -0.000966191291809082, -0.000819474458694458, -0.000672757625579834, -0.00052604079246521, -0.00037932395935058594, -0.00023260712623596191, -8.589029312133789e-05, 6.082653999328613e-05, 0.00020754337310791016, 0.0003542602062225342, 0.0005009770393371582, 0.0006476938724517822, 0.0007944107055664062, 0.0009411275386810303, 0.0010878443717956543, 0.0012345612049102783, 0.0013812780380249023, 0.0015279948711395264, 0.0016747117042541504, 0.0018214285373687744, 0.0019681453704833984, 0.0021148622035980225, 0.0022615790367126465, 0.0024082958698272705, 0.0025550127029418945, 0.0027017295360565186, 0.0028484463691711426, 0.0029951632022857666, 0.0031418800354003906, 0.0032885968685150146, 0.0034353137016296387, 0.0035820305347442627, 0.0037287473678588867, 0.0038754642009735107, 0.004022181034088135, 0.004168897867202759, 0.004315614700317383, 0.004462331533432007, 0.004609048366546631, 0.004755765199661255, 0.004902482032775879, 0.005049198865890503, 0.005195915699005127, 0.005342632532119751, 0.005489349365234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 8.0, 6.0, 22.0, 27.0, 36.0, 49.0, 67.0, 101.0, 126.0, 189.0, 300.0, 416.0, 616.0, 863.0, 1360.0, 2110.0, 3421.0, 5813.0, 10800.0, 21068.0, 42745.0, 89204.0, 181858.0, 274714.0, 205526.0, 104385.0, 49360.0, 23876.0, 12290.0, 6516.0, 3879.0, 2318.0, 1422.0, 873.0, 640.0, 477.0, 311.0, 239.0, 170.0, 101.0, 82.0, 53.0, 36.0, 30.0, 18.0, 12.0, 5.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.8203125, -3.70989990234375, -3.5994873046875, -3.48907470703125, -3.378662109375, -3.26824951171875, -3.1578369140625, -3.04742431640625, -2.93701171875, -2.82659912109375, -2.7161865234375, -2.60577392578125, -2.495361328125, -2.38494873046875, -2.2745361328125, -2.16412353515625, -2.0537109375, -1.94329833984375, -1.8328857421875, -1.72247314453125, -1.612060546875, -1.50164794921875, -1.3912353515625, -1.28082275390625, -1.17041015625, -1.05999755859375, -0.9495849609375, -0.83917236328125, -0.728759765625, -0.61834716796875, -0.5079345703125, -0.39752197265625, -0.287109375, -0.17669677734375, -0.0662841796875, 0.04412841796875, 0.154541015625, 0.26495361328125, 0.3753662109375, 0.48577880859375, 0.59619140625, 0.70660400390625, 0.8170166015625, 0.92742919921875, 1.037841796875, 1.14825439453125, 1.2586669921875, 1.36907958984375, 1.4794921875, 1.58990478515625, 1.7003173828125, 1.81072998046875, 1.921142578125, 2.03155517578125, 2.1419677734375, 2.25238037109375, 2.36279296875, 2.47320556640625, 2.5836181640625, 2.69403076171875, 2.804443359375, 2.91485595703125, 3.0252685546875, 3.13568115234375, 3.24609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 6.0, 12.0, 8.0, 13.0, 17.0, 25.0, 27.0, 27.0, 45.0, 50.0, 59.0, 61.0, 72.0, 79.0, 69.0, 72.0, 73.0, 55.0, 46.0, 36.0, 23.0, 20.0, 22.0, 8.0, 10.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.079315185546875, -1.04534912109375, -1.011383056640625, -0.9774169921875, -0.943450927734375, -0.90948486328125, -0.875518798828125, -0.841552734375, -0.807586669921875, -0.77362060546875, -0.739654541015625, -0.7056884765625, -0.671722412109375, -0.63775634765625, -0.603790283203125, -0.56982421875, -0.535858154296875, -0.50189208984375, -0.467926025390625, -0.4339599609375, -0.399993896484375, -0.36602783203125, -0.332061767578125, -0.298095703125, -0.264129638671875, -0.23016357421875, -0.196197509765625, -0.1622314453125, -0.128265380859375, -0.09429931640625, -0.060333251953125, -0.0263671875, 0.007598876953125, 0.04156494140625, 0.075531005859375, 0.1094970703125, 0.143463134765625, 0.17742919921875, 0.211395263671875, 0.245361328125, 0.279327392578125, 0.31329345703125, 0.347259521484375, 0.3812255859375, 0.415191650390625, 0.44915771484375, 0.483123779296875, 0.51708984375, 0.551055908203125, 0.58502197265625, 0.618988037109375, 0.6529541015625, 0.686920166015625, 0.72088623046875, 0.754852294921875, 0.788818359375, 0.822784423828125, 0.85675048828125, 0.890716552734375, 0.9246826171875, 0.958648681640625, 0.99261474609375, 1.026580810546875, 1.060546875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 2.0, 5.0, 6.0, 16.0, 9.0, 16.0, 19.0, 29.0, 24.0, 32.0, 33.0, 39.0, 32.0, 52.0, 51.0, 50.0, 41.0, 45.0, 55.0, 54.0, 46.0, 48.0, 33.0, 43.0, 33.0, 12.0, 21.0, 31.0, 19.0, 17.0, 19.0, 16.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.877809524536133, -16.325790405273438, -15.773771286010742, -15.221752166748047, -14.669733047485352, -14.117713928222656, -13.565695762634277, -13.013676643371582, -12.461657524108887, -11.909638404846191, -11.357619285583496, -10.8056001663208, -10.253582000732422, -9.701562881469727, -9.149543762207031, -8.597524642944336, -8.04550552368164, -7.493486404418945, -6.94146728515625, -6.389448642730713, -5.837429523468018, -5.285410404205322, -4.733391761779785, -4.18137264251709, -3.6293535232543945, -3.077334403991699, -2.525315523147583, -1.9732965230941772, -1.4212775230407715, -0.8692584037780762, -0.31723952293395996, 0.23477935791015625, 0.7867965698242188, 1.3388155698776245, 1.8908345699310303, 2.4428534507751465, 2.994872570037842, 3.546891689300537, 4.098910331726074, 4.6509294509887695, 5.202948570251465, 5.75496768951416, 6.3069868087768555, 6.859005451202393, 7.411024570465088, 7.963043689727783, 8.51506233215332, 9.067081451416016, 9.619100570678711, 10.171119689941406, 10.723138809204102, 11.275157928466797, 11.827177047729492, 12.379196166992188, 12.931214332580566, 13.483233451843262, 14.035252571105957, 14.587271690368652, 15.139290809631348, 15.691309928894043, 16.243328094482422, 16.795347213745117, 17.347366333007812, 17.899385452270508, 18.451404571533203]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 5.0, 7.0, 12.0, 12.0, 10.0, 22.0, 11.0, 30.0, 24.0, 34.0, 34.0, 34.0, 28.0, 32.0, 49.0, 43.0, 37.0, 39.0, 38.0, 42.0, 33.0, 31.0, 41.0, 42.0, 26.0, 32.0, 26.0, 32.0, 25.0, 26.0, 21.0, 22.0, 17.0, 17.0, 15.0, 3.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.759028434753418, -15.257232666015625, -14.755436897277832, -14.253641128540039, -13.751845359802246, -13.250049591064453, -12.748252868652344, -12.246458053588867, -11.744661331176758, -11.242865562438965, -10.741069793701172, -10.239274024963379, -9.737478256225586, -9.235682487487793, -8.73388671875, -8.23208999633789, -7.730295181274414, -7.228499412536621, -6.726703643798828, -6.224907875061035, -5.723112106323242, -5.221316337585449, -4.719520092010498, -4.217724323272705, -3.715928554534912, -3.214132785797119, -2.712337017059326, -2.210541009902954, -1.7087452411651611, -1.2069494724273682, -0.7051534652709961, -0.20335769653320312, 0.29843711853027344, 0.8002329468727112, 1.302028775215149, 1.8038246631622314, 2.3056204319000244, 2.8074162006378174, 3.3092122077941895, 3.8110079765319824, 4.312803745269775, 4.814599514007568, 5.316395282745361, 5.8181915283203125, 6.3199872970581055, 6.821783065795898, 7.323578834533691, 7.825374603271484, 8.327170372009277, 8.82896614074707, 9.330761909484863, 9.832557678222656, 10.33435344696045, 10.836149215698242, 11.337945938110352, 11.839740753173828, 12.341537475585938, 12.84333324432373, 13.345129013061523, 13.846924781799316, 14.34872055053711, 14.850516319274902, 15.352312088012695, 15.854108810424805, 16.35590362548828]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 17.0, 27.0, 26.0, 42.0, 59.0, 86.0, 119.0, 146.0, 223.0, 364.0, 520.0, 770.0, 1149.0, 1731.0, 2532.0, 3850.0, 5555.0, 8478.0, 12935.0, 19579.0, 29929.0, 44356.0, 64463.0, 89643.0, 114716.0, 131570.0, 129702.0, 111891.0, 86845.0, 61476.0, 42058.0, 28344.0, 18646.0, 12229.0, 8184.0, 5334.0, 3569.0, 2355.0, 1603.0, 1098.0, 743.0, 516.0, 315.0, 229.0, 145.0, 113.0, 74.0, 53.0, 45.0, 32.0, 21.0, 15.0, 11.0, 7.0, 4.0, 2.0, 4.0, 3.0], "bins": [-13.7890625, -13.3572998046875, -12.925537109375, -12.4937744140625, -12.06201171875, -11.6302490234375, -11.198486328125, -10.7667236328125, -10.3349609375, -9.9031982421875, -9.471435546875, -9.0396728515625, -8.60791015625, -8.1761474609375, -7.744384765625, -7.3126220703125, -6.880859375, -6.4490966796875, -6.017333984375, -5.5855712890625, -5.15380859375, -4.7220458984375, -4.290283203125, -3.8585205078125, -3.4267578125, -2.9949951171875, -2.563232421875, -2.1314697265625, -1.69970703125, -1.2679443359375, -0.836181640625, -0.4044189453125, 0.02734375, 0.4591064453125, 0.890869140625, 1.3226318359375, 1.75439453125, 2.1861572265625, 2.617919921875, 3.0496826171875, 3.4814453125, 3.9132080078125, 4.344970703125, 4.7767333984375, 5.20849609375, 5.6402587890625, 6.072021484375, 6.5037841796875, 6.935546875, 7.3673095703125, 7.799072265625, 8.2308349609375, 8.66259765625, 9.0943603515625, 9.526123046875, 9.9578857421875, 10.3896484375, 10.8214111328125, 11.253173828125, 11.6849365234375, 12.11669921875, 12.5484619140625, 12.980224609375, 13.4119873046875, 13.84375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 4.0, 2.0, 6.0, 11.0, 9.0, 8.0, 15.0, 14.0, 28.0, 19.0, 20.0, 28.0, 27.0, 31.0, 40.0, 32.0, 36.0, 45.0, 41.0, 34.0, 38.0, 31.0, 44.0, 30.0, 36.0, 30.0, 35.0, 23.0, 24.0, 26.0, 41.0, 28.0, 25.0, 19.0, 22.0, 21.0, 6.0, 11.0, 14.0, 7.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.203125, -12.791259765625, -12.37939453125, -11.967529296875, -11.5556640625, -11.143798828125, -10.73193359375, -10.320068359375, -9.908203125, -9.496337890625, -9.08447265625, -8.672607421875, -8.2607421875, -7.848876953125, -7.43701171875, -7.025146484375, -6.61328125, -6.201416015625, -5.78955078125, -5.377685546875, -4.9658203125, -4.553955078125, -4.14208984375, -3.730224609375, -3.318359375, -2.906494140625, -2.49462890625, -2.082763671875, -1.6708984375, -1.259033203125, -0.84716796875, -0.435302734375, -0.0234375, 0.388427734375, 0.80029296875, 1.212158203125, 1.6240234375, 2.035888671875, 2.44775390625, 2.859619140625, 3.271484375, 3.683349609375, 4.09521484375, 4.507080078125, 4.9189453125, 5.330810546875, 5.74267578125, 6.154541015625, 6.56640625, 6.978271484375, 7.39013671875, 7.802001953125, 8.2138671875, 8.625732421875, 9.03759765625, 9.449462890625, 9.861328125, 10.273193359375, 10.68505859375, 11.096923828125, 11.5087890625, 11.920654296875, 12.33251953125, 12.744384765625, 13.15625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 14.0, 24.0, 34.0, 60.0, 65.0, 118.0, 151.0, 235.0, 353.0, 520.0, 880.0, 1317.0, 1979.0, 2983.0, 4770.0, 7389.0, 11925.0, 19533.0, 30922.0, 48142.0, 74336.0, 105223.0, 134385.0, 147656.0, 135934.0, 108035.0, 75723.0, 49742.0, 32398.0, 19807.0, 12305.0, 7850.0, 4939.0, 3029.0, 2016.0, 1275.0, 824.0, 559.0, 380.0, 234.0, 138.0, 98.0, 73.0, 56.0, 45.0, 32.0, 17.0, 8.0, 7.0, 1.0, 7.0, 3.0, 0.0, 1.0], "bins": [-15.8046875, -15.3333740234375, -14.862060546875, -14.3907470703125, -13.91943359375, -13.4481201171875, -12.976806640625, -12.5054931640625, -12.0341796875, -11.5628662109375, -11.091552734375, -10.6202392578125, -10.14892578125, -9.6776123046875, -9.206298828125, -8.7349853515625, -8.263671875, -7.7923583984375, -7.321044921875, -6.8497314453125, -6.37841796875, -5.9071044921875, -5.435791015625, -4.9644775390625, -4.4931640625, -4.0218505859375, -3.550537109375, -3.0792236328125, -2.60791015625, -2.1365966796875, -1.665283203125, -1.1939697265625, -0.72265625, -0.2513427734375, 0.219970703125, 0.6912841796875, 1.16259765625, 1.6339111328125, 2.105224609375, 2.5765380859375, 3.0478515625, 3.5191650390625, 3.990478515625, 4.4617919921875, 4.93310546875, 5.4044189453125, 5.875732421875, 6.3470458984375, 6.818359375, 7.2896728515625, 7.760986328125, 8.2322998046875, 8.70361328125, 9.1749267578125, 9.646240234375, 10.1175537109375, 10.5888671875, 11.0601806640625, 11.531494140625, 12.0028076171875, 12.47412109375, 12.9454345703125, 13.416748046875, 13.8880615234375, 14.359375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 15.0, 18.0, 16.0, 27.0, 28.0, 42.0, 32.0, 37.0, 37.0, 43.0, 33.0, 43.0, 35.0, 31.0, 40.0, 42.0, 45.0, 27.0, 44.0, 27.0, 44.0, 30.0, 27.0, 27.0, 14.0, 20.0, 12.0, 18.0, 12.0, 6.0, 11.0, 7.0, 11.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.59539794921875, -7.3275146484375, -7.05963134765625, -6.791748046875, -6.52386474609375, -6.2559814453125, -5.98809814453125, -5.72021484375, -5.45233154296875, -5.1844482421875, -4.91656494140625, -4.648681640625, -4.38079833984375, -4.1129150390625, -3.84503173828125, -3.5771484375, -3.30926513671875, -3.0413818359375, -2.77349853515625, -2.505615234375, -2.23773193359375, -1.9698486328125, -1.70196533203125, -1.43408203125, -1.16619873046875, -0.8983154296875, -0.63043212890625, -0.362548828125, -0.09466552734375, 0.1732177734375, 0.44110107421875, 0.708984375, 0.97686767578125, 1.2447509765625, 1.51263427734375, 1.780517578125, 2.04840087890625, 2.3162841796875, 2.58416748046875, 2.85205078125, 3.11993408203125, 3.3878173828125, 3.65570068359375, 3.923583984375, 4.19146728515625, 4.4593505859375, 4.72723388671875, 4.9951171875, 5.26300048828125, 5.5308837890625, 5.79876708984375, 6.066650390625, 6.33453369140625, 6.6024169921875, 6.87030029296875, 7.13818359375, 7.40606689453125, 7.6739501953125, 7.94183349609375, 8.209716796875, 8.47760009765625, 8.7454833984375, 9.01336669921875, 9.28125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 9.0, 4.0, 18.0, 24.0, 42.0, 60.0, 83.0, 111.0, 160.0, 233.0, 370.0, 561.0, 812.0, 1238.0, 1915.0, 3074.0, 4732.0, 7811.0, 12400.0, 20174.0, 33030.0, 53879.0, 84073.0, 124766.0, 158954.0, 163212.0, 131269.0, 91133.0, 58864.0, 36226.0, 22419.0, 13711.0, 8408.0, 5330.0, 3386.0, 2091.0, 1362.0, 826.0, 592.0, 394.0, 259.0, 184.0, 110.0, 83.0, 54.0, 39.0, 25.0, 19.0, 5.0, 6.0, 11.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.953125, -7.705322265625, -7.45751953125, -7.209716796875, -6.9619140625, -6.714111328125, -6.46630859375, -6.218505859375, -5.970703125, -5.722900390625, -5.47509765625, -5.227294921875, -4.9794921875, -4.731689453125, -4.48388671875, -4.236083984375, -3.98828125, -3.740478515625, -3.49267578125, -3.244873046875, -2.9970703125, -2.749267578125, -2.50146484375, -2.253662109375, -2.005859375, -1.758056640625, -1.51025390625, -1.262451171875, -1.0146484375, -0.766845703125, -0.51904296875, -0.271240234375, -0.0234375, 0.224365234375, 0.47216796875, 0.719970703125, 0.9677734375, 1.215576171875, 1.46337890625, 1.711181640625, 1.958984375, 2.206787109375, 2.45458984375, 2.702392578125, 2.9501953125, 3.197998046875, 3.44580078125, 3.693603515625, 3.94140625, 4.189208984375, 4.43701171875, 4.684814453125, 4.9326171875, 5.180419921875, 5.42822265625, 5.676025390625, 5.923828125, 6.171630859375, 6.41943359375, 6.667236328125, 6.9150390625, 7.162841796875, 7.41064453125, 7.658447265625, 7.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 9.0, 10.0, 14.0, 20.0, 29.0, 39.0, 55.0, 74.0, 94.0, 98.0, 101.0, 108.0, 103.0, 58.0, 51.0, 36.0, 27.0, 23.0, 17.0, 10.0, 6.0, 6.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00140380859375, -0.0013559907674789429, -0.0013081729412078857, -0.0012603551149368286, -0.0012125372886657715, -0.0011647194623947144, -0.0011169016361236572, -0.0010690838098526, -0.001021265983581543, -0.0009734481573104858, -0.0009256303310394287, -0.0008778125047683716, -0.0008299946784973145, -0.0007821768522262573, -0.0007343590259552002, -0.0006865411996841431, -0.0006387233734130859, -0.0005909055471420288, -0.0005430877208709717, -0.0004952698945999146, -0.0004474520683288574, -0.0003996342420578003, -0.00035181641578674316, -0.00030399858951568604, -0.0002561807632446289, -0.00020836293697357178, -0.00016054511070251465, -0.00011272728443145752, -6.490945816040039e-05, -1.7091631889343262e-05, 3.072619438171387e-05, 7.8544020652771e-05, 0.00012636184692382812, 0.00017417967319488525, 0.00022199749946594238, 0.0002698153257369995, 0.00031763315200805664, 0.00036545097827911377, 0.0004132688045501709, 0.00046108663082122803, 0.0005089044570922852, 0.0005567222833633423, 0.0006045401096343994, 0.0006523579359054565, 0.0007001757621765137, 0.0007479935884475708, 0.0007958114147186279, 0.0008436292409896851, 0.0008914470672607422, 0.0009392648935317993, 0.0009870827198028564, 0.0010349005460739136, 0.0010827183723449707, 0.0011305361986160278, 0.001178354024887085, 0.001226171851158142, 0.0012739896774291992, 0.0013218075037002563, 0.0013696253299713135, 0.0014174431562423706, 0.0014652609825134277, 0.0015130788087844849, 0.001560896635055542, 0.0016087144613265991, 0.0016565322875976562]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 11.0, 17.0, 36.0, 32.0, 69.0, 86.0, 153.0, 210.0, 297.0, 442.0, 694.0, 1053.0, 1673.0, 2687.0, 4275.0, 6731.0, 10606.0, 17240.0, 27443.0, 44538.0, 68329.0, 101748.0, 137975.0, 156612.0, 144188.0, 111441.0, 76816.0, 49277.0, 31262.0, 19679.0, 12131.0, 7588.0, 4834.0, 2981.0, 1903.0, 1170.0, 776.0, 525.0, 339.0, 214.0, 155.0, 127.0, 64.0, 45.0, 28.0, 17.0, 10.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.0234375, -7.791748046875, -7.56005859375, -7.328369140625, -7.0966796875, -6.864990234375, -6.63330078125, -6.401611328125, -6.169921875, -5.938232421875, -5.70654296875, -5.474853515625, -5.2431640625, -5.011474609375, -4.77978515625, -4.548095703125, -4.31640625, -4.084716796875, -3.85302734375, -3.621337890625, -3.3896484375, -3.157958984375, -2.92626953125, -2.694580078125, -2.462890625, -2.231201171875, -1.99951171875, -1.767822265625, -1.5361328125, -1.304443359375, -1.07275390625, -0.841064453125, -0.609375, -0.377685546875, -0.14599609375, 0.085693359375, 0.3173828125, 0.549072265625, 0.78076171875, 1.012451171875, 1.244140625, 1.475830078125, 1.70751953125, 1.939208984375, 2.1708984375, 2.402587890625, 2.63427734375, 2.865966796875, 3.09765625, 3.329345703125, 3.56103515625, 3.792724609375, 4.0244140625, 4.256103515625, 4.48779296875, 4.719482421875, 4.951171875, 5.182861328125, 5.41455078125, 5.646240234375, 5.8779296875, 6.109619140625, 6.34130859375, 6.572998046875, 6.8046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 14.0, 13.0, 20.0, 19.0, 32.0, 42.0, 40.0, 48.0, 60.0, 61.0, 54.0, 64.0, 58.0, 61.0, 48.0, 53.0, 50.0, 33.0, 39.0, 26.0, 28.0, 21.0, 17.0, 13.0, 20.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1484375, -3.058135986328125, -2.96783447265625, -2.877532958984375, -2.7872314453125, -2.696929931640625, -2.60662841796875, -2.516326904296875, -2.426025390625, -2.335723876953125, -2.24542236328125, -2.155120849609375, -2.0648193359375, -1.974517822265625, -1.88421630859375, -1.793914794921875, -1.70361328125, -1.613311767578125, -1.52301025390625, -1.432708740234375, -1.3424072265625, -1.252105712890625, -1.16180419921875, -1.071502685546875, -0.981201171875, -0.890899658203125, -0.80059814453125, -0.710296630859375, -0.6199951171875, -0.529693603515625, -0.43939208984375, -0.349090576171875, -0.2587890625, -0.168487548828125, -0.07818603515625, 0.012115478515625, 0.1024169921875, 0.192718505859375, 0.28302001953125, 0.373321533203125, 0.463623046875, 0.553924560546875, 0.64422607421875, 0.734527587890625, 0.8248291015625, 0.915130615234375, 1.00543212890625, 1.095733642578125, 1.18603515625, 1.276336669921875, 1.36663818359375, 1.456939697265625, 1.5472412109375, 1.637542724609375, 1.72784423828125, 1.818145751953125, 1.908447265625, 1.998748779296875, 2.08905029296875, 2.179351806640625, 2.2696533203125, 2.359954833984375, 2.45025634765625, 2.540557861328125, 2.630859375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 8.0, 16.0, 7.0, 19.0, 24.0, 26.0, 27.0, 36.0, 36.0, 29.0, 47.0, 46.0, 42.0, 51.0, 49.0, 47.0, 49.0, 45.0, 50.0, 39.0, 41.0, 44.0, 21.0, 22.0, 33.0, 24.0, 18.0, 18.0, 8.0, 12.0, 7.0, 14.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.070353507995605, -12.58980941772461, -12.10926628112793, -11.62872314453125, -11.148179054260254, -10.667634963989258, -10.187091827392578, -9.706548690795898, -9.226004600524902, -8.745460510253906, -8.264917373657227, -7.784373760223389, -7.303830146789551, -6.823286533355713, -6.342742919921875, -5.862199306488037, -5.381655693054199, -4.901112079620361, -4.420568466186523, -3.9400248527526855, -3.4594812393188477, -2.9789376258850098, -2.498394012451172, -2.017850399017334, -1.537306785583496, -1.0567631721496582, -0.5762195587158203, -0.09567594528198242, 0.38486766815185547, 0.8654112815856934, 1.3459548950195312, 1.8264985084533691, 2.3070430755615234, 2.7875866889953613, 3.268130302429199, 3.748673915863037, 4.229217529296875, 4.709761142730713, 5.190304756164551, 5.670848369598389, 6.151391983032227, 6.6319355964660645, 7.112479209899902, 7.59302282333374, 8.073566436767578, 8.554109573364258, 9.034653663635254, 9.51519775390625, 9.99574089050293, 10.47628402709961, 10.956828117370605, 11.437372207641602, 11.917915344238281, 12.398458480834961, 12.879002571105957, 13.359546661376953, 13.840089797973633, 14.320632934570312, 14.801177024841309, 15.281721115112305, 15.762264251708984, 16.242807388305664, 16.723350524902344, 17.203895568847656, 17.684438705444336]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 3.0, 8.0, 10.0, 7.0, 11.0, 15.0, 12.0, 14.0, 15.0, 24.0, 20.0, 23.0, 30.0, 34.0, 37.0, 33.0, 38.0, 41.0, 30.0, 46.0, 42.0, 35.0, 36.0, 39.0, 35.0, 41.0, 22.0, 38.0, 25.0, 33.0, 25.0, 30.0, 21.0, 20.0, 13.0, 15.0, 17.0, 9.0, 4.0, 13.0, 4.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.401455879211426, -12.971198081970215, -12.54094123840332, -12.11068344116211, -11.680426597595215, -11.250168800354004, -10.81991195678711, -10.389654159545898, -9.959396362304688, -9.529138565063477, -9.098881721496582, -8.668623924255371, -8.238367080688477, -7.808109283447266, -7.377851963043213, -6.94759464263916, -6.517337799072266, -6.087080478668213, -5.65682315826416, -5.226565361022949, -4.796308517456055, -4.366050720214844, -3.935793399810791, -3.5055360794067383, -3.0752787590026855, -2.645021438598633, -2.21476411819458, -1.7845065593719482, -1.3542492389678955, -0.9239919185638428, -0.49373435974121094, -0.0634770393371582, 0.3667793273925781, 0.7970367074012756, 1.2272940874099731, 1.6575515270233154, 2.087808847427368, 2.518066167831421, 2.9483237266540527, 3.3785810470581055, 3.808838367462158, 4.239095687866211, 4.669353008270264, 5.099610328674316, 5.529868125915527, 5.960124969482422, 6.390382766723633, 6.8206400871276855, 7.250897407531738, 7.681154727935791, 8.111412048339844, 8.541669845581055, 8.97192668914795, 9.40218448638916, 9.832441329956055, 10.262699127197266, 10.692956924438477, 11.123214721679688, 11.553471565246582, 11.983729362487793, 12.413986206054688, 12.844244003295898, 13.27450180053711, 13.704758644104004, 14.135015487670898]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 12.0, 30.0, 21.0, 36.0, 69.0, 87.0, 151.0, 228.0, 365.0, 568.0, 823.0, 1370.0, 2249.0, 3897.0, 6593.0, 11070.0, 19241.0, 33479.0, 58808.0, 106326.0, 195172.0, 353077.0, 578851.0, 763508.0, 754805.0, 555891.0, 332187.0, 182270.0, 99563.0, 55394.0, 31746.0, 18627.0, 10909.0, 6605.0, 3929.0, 2335.0, 1459.0, 903.0, 542.0, 378.0, 239.0, 142.0, 103.0, 69.0, 45.0, 34.0, 24.0, 15.0, 12.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.3515625, -10.0059814453125, -9.660400390625, -9.3148193359375, -8.96923828125, -8.6236572265625, -8.278076171875, -7.9324951171875, -7.5869140625, -7.2413330078125, -6.895751953125, -6.5501708984375, -6.20458984375, -5.8590087890625, -5.513427734375, -5.1678466796875, -4.822265625, -4.4766845703125, -4.131103515625, -3.7855224609375, -3.43994140625, -3.0943603515625, -2.748779296875, -2.4031982421875, -2.0576171875, -1.7120361328125, -1.366455078125, -1.0208740234375, -0.67529296875, -0.3297119140625, 0.015869140625, 0.3614501953125, 0.70703125, 1.0526123046875, 1.398193359375, 1.7437744140625, 2.08935546875, 2.4349365234375, 2.780517578125, 3.1260986328125, 3.4716796875, 3.8172607421875, 4.162841796875, 4.5084228515625, 4.85400390625, 5.1995849609375, 5.545166015625, 5.8907470703125, 6.236328125, 6.5819091796875, 6.927490234375, 7.2730712890625, 7.61865234375, 7.9642333984375, 8.309814453125, 8.6553955078125, 9.0009765625, 9.3465576171875, 9.692138671875, 10.0377197265625, 10.38330078125, 10.7288818359375, 11.074462890625, 11.4200439453125, 11.765625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 14.0, 14.0, 9.0, 9.0, 24.0, 18.0, 26.0, 16.0, 16.0, 29.0, 29.0, 29.0, 25.0, 29.0, 33.0, 49.0, 35.0, 43.0, 37.0, 36.0, 36.0, 26.0, 31.0, 36.0, 31.0, 25.0, 33.0, 24.0, 31.0, 19.0, 18.0, 28.0, 24.0, 11.0, 16.0, 14.0, 9.0, 7.0, 10.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-9.484375, -9.186279296875, -8.88818359375, -8.590087890625, -8.2919921875, -7.993896484375, -7.69580078125, -7.397705078125, -7.099609375, -6.801513671875, -6.50341796875, -6.205322265625, -5.9072265625, -5.609130859375, -5.31103515625, -5.012939453125, -4.71484375, -4.416748046875, -4.11865234375, -3.820556640625, -3.5224609375, -3.224365234375, -2.92626953125, -2.628173828125, -2.330078125, -2.031982421875, -1.73388671875, -1.435791015625, -1.1376953125, -0.839599609375, -0.54150390625, -0.243408203125, 0.0546875, 0.352783203125, 0.65087890625, 0.948974609375, 1.2470703125, 1.545166015625, 1.84326171875, 2.141357421875, 2.439453125, 2.737548828125, 3.03564453125, 3.333740234375, 3.6318359375, 3.929931640625, 4.22802734375, 4.526123046875, 4.82421875, 5.122314453125, 5.42041015625, 5.718505859375, 6.0166015625, 6.314697265625, 6.61279296875, 6.910888671875, 7.208984375, 7.507080078125, 7.80517578125, 8.103271484375, 8.4013671875, 8.699462890625, 8.99755859375, 9.295654296875, 9.59375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 15.0, 25.0, 42.0, 72.0, 95.0, 156.0, 228.0, 366.0, 586.0, 988.0, 1595.0, 2553.0, 3923.0, 6484.0, 10316.0, 17017.0, 27505.0, 45216.0, 72991.0, 117722.0, 187316.0, 290765.0, 427893.0, 573515.0, 640538.0, 568463.0, 422230.0, 287066.0, 184353.0, 115971.0, 72278.0, 44714.0, 27241.0, 16885.0, 10286.0, 6394.0, 3946.0, 2416.0, 1538.0, 941.0, 623.0, 360.0, 231.0, 159.0, 96.0, 54.0, 42.0, 23.0, 20.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0], "bins": [-10.8359375, -10.5123291015625, -10.188720703125, -9.8651123046875, -9.54150390625, -9.2178955078125, -8.894287109375, -8.5706787109375, -8.2470703125, -7.9234619140625, -7.599853515625, -7.2762451171875, -6.95263671875, -6.6290283203125, -6.305419921875, -5.9818115234375, -5.658203125, -5.3345947265625, -5.010986328125, -4.6873779296875, -4.36376953125, -4.0401611328125, -3.716552734375, -3.3929443359375, -3.0693359375, -2.7457275390625, -2.422119140625, -2.0985107421875, -1.77490234375, -1.4512939453125, -1.127685546875, -0.8040771484375, -0.48046875, -0.1568603515625, 0.166748046875, 0.4903564453125, 0.81396484375, 1.1375732421875, 1.461181640625, 1.7847900390625, 2.1083984375, 2.4320068359375, 2.755615234375, 3.0792236328125, 3.40283203125, 3.7264404296875, 4.050048828125, 4.3736572265625, 4.697265625, 5.0208740234375, 5.344482421875, 5.6680908203125, 5.99169921875, 6.3153076171875, 6.638916015625, 6.9625244140625, 7.2861328125, 7.6097412109375, 7.933349609375, 8.2569580078125, 8.58056640625, 8.9041748046875, 9.227783203125, 9.5513916015625, 9.875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 12.0, 18.0, 17.0, 25.0, 44.0, 43.0, 65.0, 71.0, 95.0, 98.0, 123.0, 135.0, 165.0, 193.0, 227.0, 223.0, 244.0, 265.0, 262.0, 257.0, 221.0, 221.0, 197.0, 150.0, 149.0, 109.0, 96.0, 88.0, 44.0, 46.0, 39.0, 23.0, 25.0, 21.0, 15.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-5.76953125, -5.6160888671875, -5.462646484375, -5.3092041015625, -5.15576171875, -5.0023193359375, -4.848876953125, -4.6954345703125, -4.5419921875, -4.3885498046875, -4.235107421875, -4.0816650390625, -3.92822265625, -3.7747802734375, -3.621337890625, -3.4678955078125, -3.314453125, -3.1610107421875, -3.007568359375, -2.8541259765625, -2.70068359375, -2.5472412109375, -2.393798828125, -2.2403564453125, -2.0869140625, -1.9334716796875, -1.780029296875, -1.6265869140625, -1.47314453125, -1.3197021484375, -1.166259765625, -1.0128173828125, -0.859375, -0.7059326171875, -0.552490234375, -0.3990478515625, -0.24560546875, -0.0921630859375, 0.061279296875, 0.2147216796875, 0.3681640625, 0.5216064453125, 0.675048828125, 0.8284912109375, 0.98193359375, 1.1353759765625, 1.288818359375, 1.4422607421875, 1.595703125, 1.7491455078125, 1.902587890625, 2.0560302734375, 2.20947265625, 2.3629150390625, 2.516357421875, 2.6697998046875, 2.8232421875, 2.9766845703125, 3.130126953125, 3.2835693359375, 3.43701171875, 3.5904541015625, 3.743896484375, 3.8973388671875, 4.05078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 4.0, 4.0, 8.0, 14.0, 17.0, 19.0, 25.0, 34.0, 41.0, 41.0, 45.0, 37.0, 48.0, 57.0, 57.0, 66.0, 46.0, 55.0, 53.0, 52.0, 52.0, 40.0, 32.0, 22.0, 22.0, 15.0, 14.0, 11.0, 8.0, 9.0, 14.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.228116989135742, -13.775860786437988, -13.323604583740234, -12.871347427368164, -12.41909122467041, -11.966835021972656, -11.514578819274902, -11.062322616577148, -10.610065460205078, -10.157809257507324, -9.70555305480957, -9.2532958984375, -8.801039695739746, -8.348783493041992, -7.896527290344238, -7.444271087646484, -6.9920148849487305, -6.539758682250977, -6.0875020027160645, -5.6352458000183105, -5.182989120483398, -4.7307329177856445, -4.278476715087891, -3.8262202739715576, -3.3739638328552246, -2.9217073917388916, -2.4694509506225586, -2.0171947479248047, -1.5649383068084717, -1.1126818656921387, -0.6604256629943848, -0.20816922187805176, 0.24408817291259766, 0.6963445544242859, 1.1486009359359741, 1.6008572578430176, 2.0531136989593506, 2.5053701400756836, 2.9576263427734375, 3.4098827838897705, 3.8621392250061035, 4.314395427703857, 4.7666521072387695, 5.218908309936523, 5.671164512634277, 6.1234211921691895, 6.575677394866943, 7.0279340744018555, 7.480190277099609, 7.932446479797363, 8.384702682495117, 8.836959838867188, 9.289216041564941, 9.741472244262695, 10.19372844696045, 10.645984649658203, 11.098241806030273, 11.550498008728027, 12.002754211425781, 12.455011367797852, 12.907267570495605, 13.35952377319336, 13.811779975891113, 14.264036178588867, 14.716292381286621]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 5.0, 13.0, 11.0, 12.0, 10.0, 14.0, 16.0, 22.0, 19.0, 20.0, 27.0, 26.0, 24.0, 33.0, 52.0, 40.0, 35.0, 41.0, 30.0, 44.0, 35.0, 41.0, 35.0, 40.0, 34.0, 30.0, 38.0, 28.0, 27.0, 28.0, 19.0, 21.0, 19.0, 18.0, 22.0, 13.0, 11.0, 10.0, 4.0, 4.0, 7.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.525537490844727, -10.185063362121582, -9.844590187072754, -9.50411605834961, -9.163642883300781, -8.823168754577637, -8.482694625854492, -8.142221450805664, -7.801747798919678, -7.461274147033691, -7.120800495147705, -6.780326843261719, -6.439852714538574, -6.099379539489746, -5.758905410766602, -5.418431758880615, -5.077958106994629, -4.737484455108643, -4.397010803222656, -4.056536674499512, -3.7160632610321045, -3.375589609146118, -3.0351157188415527, -2.6946420669555664, -2.35416841506958, -2.0136947631835938, -1.6732209920883179, -1.332747220993042, -0.9922735691070557, -0.6517999172210693, -0.3113260269165039, 0.029147624969482422, 0.36962223052978516, 0.7100959420204163, 1.0505696535110474, 1.3910434246063232, 1.7315170764923096, 2.071990728378296, 2.4124646186828613, 2.7529382705688477, 3.093411922454834, 3.4338855743408203, 3.7743592262268066, 4.114832878112793, 4.4553070068359375, 4.795780181884766, 5.13625431060791, 5.4767279624938965, 5.817201614379883, 6.157675266265869, 6.4981489181518555, 6.838623046875, 7.179096221923828, 7.519570350646973, 7.860044002532959, 8.200517654418945, 8.540990829467773, 8.881464958190918, 9.221938133239746, 9.56241226196289, 9.902885437011719, 10.243359565734863, 10.583833694458008, 10.924306869506836, 11.26478099822998]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 15.0, 25.0, 40.0, 53.0, 76.0, 129.0, 167.0, 269.0, 410.0, 627.0, 962.0, 1504.0, 2238.0, 3293.0, 4812.0, 7283.0, 10814.0, 15949.0, 23721.0, 35060.0, 51081.0, 74672.0, 104481.0, 135839.0, 147348.0, 127751.0, 94001.0, 66203.0, 44949.0, 30923.0, 20660.0, 14231.0, 9551.0, 6479.0, 4356.0, 2888.0, 1980.0, 1249.0, 829.0, 556.0, 355.0, 245.0, 148.0, 108.0, 66.0, 50.0, 37.0, 16.0, 15.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0], "bins": [-9.0390625, -8.7679443359375, -8.496826171875, -8.2257080078125, -7.95458984375, -7.6834716796875, -7.412353515625, -7.1412353515625, -6.8701171875, -6.5989990234375, -6.327880859375, -6.0567626953125, -5.78564453125, -5.5145263671875, -5.243408203125, -4.9722900390625, -4.701171875, -4.4300537109375, -4.158935546875, -3.8878173828125, -3.61669921875, -3.3455810546875, -3.074462890625, -2.8033447265625, -2.5322265625, -2.2611083984375, -1.989990234375, -1.7188720703125, -1.44775390625, -1.1766357421875, -0.905517578125, -0.6343994140625, -0.36328125, -0.0921630859375, 0.178955078125, 0.4500732421875, 0.72119140625, 0.9923095703125, 1.263427734375, 1.5345458984375, 1.8056640625, 2.0767822265625, 2.347900390625, 2.6190185546875, 2.89013671875, 3.1612548828125, 3.432373046875, 3.7034912109375, 3.974609375, 4.2457275390625, 4.516845703125, 4.7879638671875, 5.05908203125, 5.3302001953125, 5.601318359375, 5.8724365234375, 6.1435546875, 6.4146728515625, 6.685791015625, 6.9569091796875, 7.22802734375, 7.4991455078125, 7.770263671875, 8.0413818359375, 8.3125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 9.0, 8.0, 8.0, 18.0, 11.0, 17.0, 14.0, 25.0, 20.0, 21.0, 25.0, 28.0, 31.0, 20.0, 36.0, 29.0, 40.0, 43.0, 36.0, 42.0, 33.0, 37.0, 32.0, 41.0, 38.0, 29.0, 27.0, 30.0, 24.0, 31.0, 21.0, 23.0, 20.0, 15.0, 11.0, 10.0, 13.0, 16.0, 14.0, 7.0, 8.0, 7.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3333740234375, -9.026123046875, -8.7188720703125, -8.41162109375, -8.1043701171875, -7.797119140625, -7.4898681640625, -7.1826171875, -6.8753662109375, -6.568115234375, -6.2608642578125, -5.95361328125, -5.6463623046875, -5.339111328125, -5.0318603515625, -4.724609375, -4.4173583984375, -4.110107421875, -3.8028564453125, -3.49560546875, -3.1883544921875, -2.881103515625, -2.5738525390625, -2.2666015625, -1.9593505859375, -1.652099609375, -1.3448486328125, -1.03759765625, -0.7303466796875, -0.423095703125, -0.1158447265625, 0.19140625, 0.4986572265625, 0.805908203125, 1.1131591796875, 1.42041015625, 1.7276611328125, 2.034912109375, 2.3421630859375, 2.6494140625, 2.9566650390625, 3.263916015625, 3.5711669921875, 3.87841796875, 4.1856689453125, 4.492919921875, 4.8001708984375, 5.107421875, 5.4146728515625, 5.721923828125, 6.0291748046875, 6.33642578125, 6.6436767578125, 6.950927734375, 7.2581787109375, 7.5654296875, 7.8726806640625, 8.179931640625, 8.4871826171875, 8.79443359375, 9.1016845703125, 9.408935546875, 9.7161865234375, 10.0234375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 12.0, 18.0, 25.0, 29.0, 57.0, 55.0, 84.0, 145.0, 157.0, 205.0, 294.0, 452.0, 609.0, 851.0, 1287.0, 1793.0, 2717.0, 3863.0, 5919.0, 9275.0, 15152.0, 28784.0, 396290.0, 506438.0, 30269.0, 15679.0, 9420.0, 5863.0, 3813.0, 2723.0, 1873.0, 1226.0, 936.0, 609.0, 435.0, 352.0, 231.0, 175.0, 127.0, 84.0, 59.0, 43.0, 25.0, 26.0, 21.0, 12.0, 8.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-14.9765625, -14.5089111328125, -14.041259765625, -13.5736083984375, -13.10595703125, -12.6383056640625, -12.170654296875, -11.7030029296875, -11.2353515625, -10.7677001953125, -10.300048828125, -9.8323974609375, -9.36474609375, -8.8970947265625, -8.429443359375, -7.9617919921875, -7.494140625, -7.0264892578125, -6.558837890625, -6.0911865234375, -5.62353515625, -5.1558837890625, -4.688232421875, -4.2205810546875, -3.7529296875, -3.2852783203125, -2.817626953125, -2.3499755859375, -1.88232421875, -1.4146728515625, -0.947021484375, -0.4793701171875, -0.01171875, 0.4559326171875, 0.923583984375, 1.3912353515625, 1.85888671875, 2.3265380859375, 2.794189453125, 3.2618408203125, 3.7294921875, 4.1971435546875, 4.664794921875, 5.1324462890625, 5.60009765625, 6.0677490234375, 6.535400390625, 7.0030517578125, 7.470703125, 7.9383544921875, 8.406005859375, 8.8736572265625, 9.34130859375, 9.8089599609375, 10.276611328125, 10.7442626953125, 11.2119140625, 11.6795654296875, 12.147216796875, 12.6148681640625, 13.08251953125, 13.5501708984375, 14.017822265625, 14.4854736328125, 14.953125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 11.0, 10.0, 16.0, 13.0, 14.0, 16.0, 25.0, 30.0, 34.0, 38.0, 38.0, 36.0, 47.0, 46.0, 41.0, 40.0, 57.0, 36.0, 46.0, 56.0, 39.0, 38.0, 31.0, 33.0, 25.0, 31.0, 25.0, 28.0, 19.0, 10.0, 10.0, 10.0, 8.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.5859375, -10.2733154296875, -9.960693359375, -9.6480712890625, -9.33544921875, -9.0228271484375, -8.710205078125, -8.3975830078125, -8.0849609375, -7.7723388671875, -7.459716796875, -7.1470947265625, -6.83447265625, -6.5218505859375, -6.209228515625, -5.8966064453125, -5.583984375, -5.2713623046875, -4.958740234375, -4.6461181640625, -4.33349609375, -4.0208740234375, -3.708251953125, -3.3956298828125, -3.0830078125, -2.7703857421875, -2.457763671875, -2.1451416015625, -1.83251953125, -1.5198974609375, -1.207275390625, -0.8946533203125, -0.58203125, -0.2694091796875, 0.043212890625, 0.3558349609375, 0.66845703125, 0.9810791015625, 1.293701171875, 1.6063232421875, 1.9189453125, 2.2315673828125, 2.544189453125, 2.8568115234375, 3.16943359375, 3.4820556640625, 3.794677734375, 4.1072998046875, 4.419921875, 4.7325439453125, 5.045166015625, 5.3577880859375, 5.67041015625, 5.9830322265625, 6.295654296875, 6.6082763671875, 6.9208984375, 7.2335205078125, 7.546142578125, 7.8587646484375, 8.17138671875, 8.4840087890625, 8.796630859375, 9.1092529296875, 9.421875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 8.0, 5.0, 8.0, 12.0, 19.0, 21.0, 25.0, 18.0, 41.0, 62.0, 91.0, 120.0, 134.0, 225.0, 284.0, 440.0, 697.0, 1014.0, 1618.0, 2767.0, 4744.0, 8478.0, 17236.0, 49938.0, 843003.0, 73936.0, 20300.0, 9616.0, 5299.0, 3085.0, 1802.0, 1135.0, 698.0, 497.0, 314.0, 223.0, 161.0, 122.0, 84.0, 80.0, 47.0, 37.0, 35.0, 19.0, 18.0, 13.0, 5.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0], "bins": [-8.3515625, -8.116943359375, -7.88232421875, -7.647705078125, -7.4130859375, -7.178466796875, -6.94384765625, -6.709228515625, -6.474609375, -6.239990234375, -6.00537109375, -5.770751953125, -5.5361328125, -5.301513671875, -5.06689453125, -4.832275390625, -4.59765625, -4.363037109375, -4.12841796875, -3.893798828125, -3.6591796875, -3.424560546875, -3.18994140625, -2.955322265625, -2.720703125, -2.486083984375, -2.25146484375, -2.016845703125, -1.7822265625, -1.547607421875, -1.31298828125, -1.078369140625, -0.84375, -0.609130859375, -0.37451171875, -0.139892578125, 0.0947265625, 0.329345703125, 0.56396484375, 0.798583984375, 1.033203125, 1.267822265625, 1.50244140625, 1.737060546875, 1.9716796875, 2.206298828125, 2.44091796875, 2.675537109375, 2.91015625, 3.144775390625, 3.37939453125, 3.614013671875, 3.8486328125, 4.083251953125, 4.31787109375, 4.552490234375, 4.787109375, 5.021728515625, 5.25634765625, 5.490966796875, 5.7255859375, 5.960205078125, 6.19482421875, 6.429443359375, 6.6640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 7.0, 5.0, 7.0, 7.0, 13.0, 8.0, 9.0, 17.0, 22.0, 29.0, 35.0, 67.0, 88.0, 151.0, 156.0, 119.0, 62.0, 46.0, 31.0, 27.0, 20.0, 15.0, 10.0, 8.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010576248168945312, -0.0010138154029846191, -0.000970005989074707, -0.0009261965751647949, -0.0008823871612548828, -0.0008385777473449707, -0.0007947683334350586, -0.0007509589195251465, -0.0007071495056152344, -0.0006633400917053223, -0.0006195306777954102, -0.000575721263885498, -0.0005319118499755859, -0.00048810243606567383, -0.0004442930221557617, -0.0004004836082458496, -0.0003566741943359375, -0.0003128647804260254, -0.0002690553665161133, -0.00022524595260620117, -0.00018143653869628906, -0.00013762712478637695, -9.381771087646484e-05, -5.0008296966552734e-05, -6.198883056640625e-06, 3.7610530853271484e-05, 8.14199447631836e-05, 0.0001252293586730957, 0.0001690387725830078, 0.00021284818649291992, 0.00025665760040283203, 0.00030046701431274414, 0.00034427642822265625, 0.00038808584213256836, 0.00043189525604248047, 0.0004757046699523926, 0.0005195140838623047, 0.0005633234977722168, 0.0006071329116821289, 0.000650942325592041, 0.0006947517395019531, 0.0007385611534118652, 0.0007823705673217773, 0.0008261799812316895, 0.0008699893951416016, 0.0009137988090515137, 0.0009576082229614258, 0.0010014176368713379, 0.00104522705078125, 0.0010890364646911621, 0.0011328458786010742, 0.0011766552925109863, 0.0012204647064208984, 0.0012642741203308105, 0.0013080835342407227, 0.0013518929481506348, 0.0013957023620605469, 0.001439511775970459, 0.001483321189880371, 0.0015271306037902832, 0.0015709400177001953, 0.0016147494316101074, 0.0016585588455200195, 0.0017023682594299316, 0.0017461776733398438]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 7.0, 10.0, 17.0, 12.0, 17.0, 25.0, 33.0, 48.0, 68.0, 81.0, 134.0, 158.0, 257.0, 392.0, 614.0, 981.0, 1658.0, 2742.0, 4794.0, 8730.0, 17221.0, 38524.0, 94946.0, 230141.0, 326906.0, 184924.0, 72890.0, 30321.0, 14060.0, 7190.0, 4092.0, 2389.0, 1513.0, 905.0, 551.0, 382.0, 256.0, 171.0, 125.0, 79.0, 41.0, 46.0, 29.0, 24.0, 11.0, 13.0, 7.0, 11.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.232421875, -3.132537841796875, -3.03265380859375, -2.932769775390625, -2.8328857421875, -2.733001708984375, -2.63311767578125, -2.533233642578125, -2.433349609375, -2.333465576171875, -2.23358154296875, -2.133697509765625, -2.0338134765625, -1.933929443359375, -1.83404541015625, -1.734161376953125, -1.63427734375, -1.534393310546875, -1.43450927734375, -1.334625244140625, -1.2347412109375, -1.134857177734375, -1.03497314453125, -0.935089111328125, -0.835205078125, -0.735321044921875, -0.63543701171875, -0.535552978515625, -0.4356689453125, -0.335784912109375, -0.23590087890625, -0.136016845703125, -0.0361328125, 0.063751220703125, 0.16363525390625, 0.263519287109375, 0.3634033203125, 0.463287353515625, 0.56317138671875, 0.663055419921875, 0.762939453125, 0.862823486328125, 0.96270751953125, 1.062591552734375, 1.1624755859375, 1.262359619140625, 1.36224365234375, 1.462127685546875, 1.56201171875, 1.661895751953125, 1.76177978515625, 1.861663818359375, 1.9615478515625, 2.061431884765625, 2.16131591796875, 2.261199951171875, 2.361083984375, 2.460968017578125, 2.56085205078125, 2.660736083984375, 2.7606201171875, 2.860504150390625, 2.96038818359375, 3.060272216796875, 3.16015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 5.0, 8.0, 10.0, 12.0, 14.0, 22.0, 21.0, 21.0, 30.0, 36.0, 40.0, 65.0, 53.0, 78.0, 65.0, 67.0, 80.0, 53.0, 60.0, 46.0, 41.0, 26.0, 21.0, 25.0, 8.0, 6.0, 13.0, 9.0, 6.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5145263671875, -0.495361328125, -0.4761962890625, -0.45703125, -0.4378662109375, -0.418701171875, -0.3995361328125, -0.38037109375, -0.3612060546875, -0.342041015625, -0.3228759765625, -0.3037109375, -0.2845458984375, -0.265380859375, -0.2462158203125, -0.22705078125, -0.2078857421875, -0.188720703125, -0.1695556640625, -0.150390625, -0.1312255859375, -0.112060546875, -0.0928955078125, -0.07373046875, -0.0545654296875, -0.035400390625, -0.0162353515625, 0.0029296875, 0.0220947265625, 0.041259765625, 0.0604248046875, 0.07958984375, 0.0987548828125, 0.117919921875, 0.1370849609375, 0.15625, 0.1754150390625, 0.194580078125, 0.2137451171875, 0.23291015625, 0.2520751953125, 0.271240234375, 0.2904052734375, 0.3095703125, 0.3287353515625, 0.347900390625, 0.3670654296875, 0.38623046875, 0.4053955078125, 0.424560546875, 0.4437255859375, 0.462890625, 0.4820556640625, 0.501220703125, 0.5203857421875, 0.53955078125, 0.5587158203125, 0.577880859375, 0.5970458984375, 0.6162109375, 0.6353759765625, 0.654541015625, 0.6737060546875, 0.69287109375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 15.0, 6.0, 14.0, 11.0, 10.0, 18.0, 18.0, 30.0, 34.0, 42.0, 55.0, 49.0, 53.0, 48.0, 55.0, 45.0, 66.0, 50.0, 51.0, 56.0, 52.0, 37.0, 39.0, 19.0, 28.0, 10.0, 15.0, 16.0, 14.0, 5.0, 6.0, 11.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.213982582092285, -13.781763076782227, -13.349544525146484, -12.917325019836426, -12.485105514526367, -12.052886009216309, -11.62066650390625, -11.188447952270508, -10.75622844696045, -10.32400894165039, -9.891790390014648, -9.45957088470459, -9.027351379394531, -8.595131874084473, -8.162912368774414, -7.730693817138672, -7.298474311828613, -6.866254806518555, -6.434035778045654, -6.001816749572754, -5.569597244262695, -5.137377738952637, -4.705158710479736, -4.272939682006836, -3.8407201766967773, -3.408500909805298, -2.9762816429138184, -2.544062376022339, -2.1118431091308594, -1.6796238422393799, -1.2474045753479004, -0.8151853084564209, -0.3829669952392578, 0.04925227165222168, 0.48147153854370117, 0.9136908054351807, 1.3459100723266602, 1.7781293392181396, 2.210348606109619, 2.6425678730010986, 3.074787139892578, 3.5070064067840576, 3.939225673675537, 4.3714447021484375, 4.803664207458496, 5.235883712768555, 5.668102741241455, 6.1003217697143555, 6.532541275024414, 6.964760780334473, 7.396979808807373, 7.829198837280273, 8.261418342590332, 8.69363784790039, 9.125856399536133, 9.558075904846191, 9.99029541015625, 10.422514915466309, 10.854734420776367, 11.28695297241211, 11.719172477722168, 12.151391983032227, 12.583610534667969, 13.015830039978027, 13.448049545288086]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 12.0, 15.0, 11.0, 13.0, 15.0, 19.0, 24.0, 24.0, 20.0, 26.0, 31.0, 41.0, 42.0, 32.0, 36.0, 41.0, 40.0, 39.0, 40.0, 36.0, 41.0, 41.0, 29.0, 34.0, 28.0, 27.0, 29.0, 29.0, 18.0, 19.0, 20.0, 25.0, 14.0, 8.0, 18.0, 7.0, 6.0, 5.0, 6.0, 1.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.732009887695312, -9.416609764099121, -9.101210594177246, -8.785810470581055, -8.47041130065918, -8.155011177062988, -7.839611530303955, -7.524211883544922, -7.208812236785889, -6.8934125900268555, -6.578012943267822, -6.262613296508789, -5.947213172912598, -5.631814002990723, -5.316413879394531, -5.001014232635498, -4.685614585876465, -4.370214939117432, -4.054815292358398, -3.739415407180786, -3.424015760421753, -3.1086161136627197, -2.7932162284851074, -2.477816581726074, -2.162416934967041, -1.8470172882080078, -1.531617522239685, -1.2162177562713623, -0.9008181095123291, -0.5854184627532959, -0.27001869678497314, 0.04538106918334961, 0.3607816696166992, 0.6761813759803772, 0.9915810823440552, 1.306980848312378, 1.6223804950714111, 1.9377801418304443, 2.2531800270080566, 2.56857967376709, 2.883979320526123, 3.1993789672851562, 3.5147786140441895, 3.8301784992218018, 4.145578384399414, 4.460977554321289, 4.7763776779174805, 5.091777324676514, 5.407176971435547, 5.72257661819458, 6.037976264953613, 6.3533759117126465, 6.66877555847168, 6.984175682067871, 7.299575328826904, 7.6149749755859375, 7.930374622344971, 8.245774269104004, 8.561174392700195, 8.87657356262207, 9.191973686218262, 9.507372856140137, 9.822772979736328, 10.138172149658203, 10.453572273254395]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 18.0, 30.0, 47.0, 79.0, 154.0, 268.0, 515.0, 876.0, 1592.0, 3057.0, 5713.0, 10713.0, 19830.0, 36602.0, 64949.0, 106147.0, 152297.0, 179042.0, 165238.0, 123306.0, 78149.0, 45754.0, 25138.0, 13640.0, 7211.0, 3730.0, 1978.0, 1090.0, 605.0, 336.0, 149.0, 94.0, 80.0, 30.0, 31.0, 15.0, 15.0, 2.0, 1.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.5703125, -14.1619873046875, -13.753662109375, -13.3453369140625, -12.93701171875, -12.5286865234375, -12.120361328125, -11.7120361328125, -11.3037109375, -10.8953857421875, -10.487060546875, -10.0787353515625, -9.67041015625, -9.2620849609375, -8.853759765625, -8.4454345703125, -8.037109375, -7.6287841796875, -7.220458984375, -6.8121337890625, -6.40380859375, -5.9954833984375, -5.587158203125, -5.1788330078125, -4.7705078125, -4.3621826171875, -3.953857421875, -3.5455322265625, -3.13720703125, -2.7288818359375, -2.320556640625, -1.9122314453125, -1.50390625, -1.0955810546875, -0.687255859375, -0.2789306640625, 0.12939453125, 0.5377197265625, 0.946044921875, 1.3543701171875, 1.7626953125, 2.1710205078125, 2.579345703125, 2.9876708984375, 3.39599609375, 3.8043212890625, 4.212646484375, 4.6209716796875, 5.029296875, 5.4376220703125, 5.845947265625, 6.2542724609375, 6.66259765625, 7.0709228515625, 7.479248046875, 7.8875732421875, 8.2958984375, 8.7042236328125, 9.112548828125, 9.5208740234375, 9.92919921875, 10.3375244140625, 10.745849609375, 11.1541748046875, 11.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 9.0, 12.0, 12.0, 22.0, 22.0, 16.0, 25.0, 21.0, 22.0, 14.0, 32.0, 36.0, 32.0, 48.0, 45.0, 57.0, 37.0, 47.0, 50.0, 34.0, 41.0, 41.0, 44.0, 38.0, 32.0, 28.0, 34.0, 26.0, 15.0, 15.0, 18.0, 21.0, 15.0, 9.0, 9.0, 1.0, 5.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.3125, -9.988525390625, -9.66455078125, -9.340576171875, -9.0166015625, -8.692626953125, -8.36865234375, -8.044677734375, -7.720703125, -7.396728515625, -7.07275390625, -6.748779296875, -6.4248046875, -6.100830078125, -5.77685546875, -5.452880859375, -5.12890625, -4.804931640625, -4.48095703125, -4.156982421875, -3.8330078125, -3.509033203125, -3.18505859375, -2.861083984375, -2.537109375, -2.213134765625, -1.88916015625, -1.565185546875, -1.2412109375, -0.917236328125, -0.59326171875, -0.269287109375, 0.0546875, 0.378662109375, 0.70263671875, 1.026611328125, 1.3505859375, 1.674560546875, 1.99853515625, 2.322509765625, 2.646484375, 2.970458984375, 3.29443359375, 3.618408203125, 3.9423828125, 4.266357421875, 4.59033203125, 4.914306640625, 5.23828125, 5.562255859375, 5.88623046875, 6.210205078125, 6.5341796875, 6.858154296875, 7.18212890625, 7.506103515625, 7.830078125, 8.154052734375, 8.47802734375, 8.802001953125, 9.1259765625, 9.449951171875, 9.77392578125, 10.097900390625, 10.421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 6.0, 11.0, 21.0, 33.0, 50.0, 78.0, 135.0, 173.0, 267.0, 425.0, 748.0, 1246.0, 2127.0, 3528.0, 6155.0, 10332.0, 17578.0, 28821.0, 46972.0, 73088.0, 104807.0, 136400.0, 151487.0, 141885.0, 112424.0, 79260.0, 51377.0, 31819.0, 19121.0, 11491.0, 6712.0, 3992.0, 2427.0, 1375.0, 862.0, 510.0, 318.0, 183.0, 120.0, 70.0, 47.0, 31.0, 15.0, 8.0, 8.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.554931640625, -9.24267578125, -8.930419921875, -8.6181640625, -8.305908203125, -7.99365234375, -7.681396484375, -7.369140625, -7.056884765625, -6.74462890625, -6.432373046875, -6.1201171875, -5.807861328125, -5.49560546875, -5.183349609375, -4.87109375, -4.558837890625, -4.24658203125, -3.934326171875, -3.6220703125, -3.309814453125, -2.99755859375, -2.685302734375, -2.373046875, -2.060791015625, -1.74853515625, -1.436279296875, -1.1240234375, -0.811767578125, -0.49951171875, -0.187255859375, 0.125, 0.437255859375, 0.74951171875, 1.061767578125, 1.3740234375, 1.686279296875, 1.99853515625, 2.310791015625, 2.623046875, 2.935302734375, 3.24755859375, 3.559814453125, 3.8720703125, 4.184326171875, 4.49658203125, 4.808837890625, 5.12109375, 5.433349609375, 5.74560546875, 6.057861328125, 6.3701171875, 6.682373046875, 6.99462890625, 7.306884765625, 7.619140625, 7.931396484375, 8.24365234375, 8.555908203125, 8.8681640625, 9.180419921875, 9.49267578125, 9.804931640625, 10.1171875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 6.0, 11.0, 5.0, 17.0, 18.0, 24.0, 28.0, 29.0, 33.0, 28.0, 26.0, 38.0, 46.0, 32.0, 39.0, 47.0, 63.0, 40.0, 48.0, 50.0, 31.0, 40.0, 36.0, 38.0, 33.0, 20.0, 33.0, 21.0, 15.0, 15.0, 21.0, 13.0, 10.0, 13.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.145751953125, -5.93603515625, -5.726318359375, -5.5166015625, -5.306884765625, -5.09716796875, -4.887451171875, -4.677734375, -4.468017578125, -4.25830078125, -4.048583984375, -3.8388671875, -3.629150390625, -3.41943359375, -3.209716796875, -3.0, -2.790283203125, -2.58056640625, -2.370849609375, -2.1611328125, -1.951416015625, -1.74169921875, -1.531982421875, -1.322265625, -1.112548828125, -0.90283203125, -0.693115234375, -0.4833984375, -0.273681640625, -0.06396484375, 0.145751953125, 0.35546875, 0.565185546875, 0.77490234375, 0.984619140625, 1.1943359375, 1.404052734375, 1.61376953125, 1.823486328125, 2.033203125, 2.242919921875, 2.45263671875, 2.662353515625, 2.8720703125, 3.081787109375, 3.29150390625, 3.501220703125, 3.7109375, 3.920654296875, 4.13037109375, 4.340087890625, 4.5498046875, 4.759521484375, 4.96923828125, 5.178955078125, 5.388671875, 5.598388671875, 5.80810546875, 6.017822265625, 6.2275390625, 6.437255859375, 6.64697265625, 6.856689453125, 7.06640625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 5.0, 12.0, 11.0, 16.0, 25.0, 37.0, 50.0, 89.0, 180.0, 286.0, 492.0, 1047.0, 2105.0, 4813.0, 11940.0, 31999.0, 91204.0, 242333.0, 354366.0, 195095.0, 70508.0, 24867.0, 9466.0, 3923.0, 1781.0, 834.0, 446.0, 238.0, 154.0, 82.0, 52.0, 28.0, 17.0, 25.0, 8.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.5013427734375, -13.041748046875, -12.5821533203125, -12.12255859375, -11.6629638671875, -11.203369140625, -10.7437744140625, -10.2841796875, -9.8245849609375, -9.364990234375, -8.9053955078125, -8.44580078125, -7.9862060546875, -7.526611328125, -7.0670166015625, -6.607421875, -6.1478271484375, -5.688232421875, -5.2286376953125, -4.76904296875, -4.3094482421875, -3.849853515625, -3.3902587890625, -2.9306640625, -2.4710693359375, -2.011474609375, -1.5518798828125, -1.09228515625, -0.6326904296875, -0.173095703125, 0.2864990234375, 0.74609375, 1.2056884765625, 1.665283203125, 2.1248779296875, 2.58447265625, 3.0440673828125, 3.503662109375, 3.9632568359375, 4.4228515625, 4.8824462890625, 5.342041015625, 5.8016357421875, 6.26123046875, 6.7208251953125, 7.180419921875, 7.6400146484375, 8.099609375, 8.5592041015625, 9.018798828125, 9.4783935546875, 9.93798828125, 10.3975830078125, 10.857177734375, 11.3167724609375, 11.7763671875, 12.2359619140625, 12.695556640625, 13.1551513671875, 13.61474609375, 14.0743408203125, 14.533935546875, 14.9935302734375, 15.453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 2.0, 5.0, 11.0, 12.0, 13.0, 18.0, 32.0, 32.0, 36.0, 51.0, 71.0, 77.0, 89.0, 82.0, 83.0, 65.0, 60.0, 60.0, 28.0, 34.0, 29.0, 22.0, 20.0, 9.0, 12.0, 9.0, 8.0, 3.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008878707885742188, -0.0008578747510910034, -0.0008278787136077881, -0.0007978826761245728, -0.0007678866386413574, -0.0007378906011581421, -0.0007078945636749268, -0.0006778985261917114, -0.0006479024887084961, -0.0006179064512252808, -0.0005879104137420654, -0.0005579143762588501, -0.0005279183387756348, -0.0004979223012924194, -0.0004679262638092041, -0.00043793022632598877, -0.00040793418884277344, -0.0003779381513595581, -0.0003479421138763428, -0.00031794607639312744, -0.0002879500389099121, -0.0002579540014266968, -0.00022795796394348145, -0.0001979619264602661, -0.00016796588897705078, -0.00013796985149383545, -0.00010797381401062012, -7.797777652740479e-05, -4.798173904418945e-05, -1.798570156097412e-05, 1.2010335922241211e-05, 4.200637340545654e-05, 7.200241088867188e-05, 0.00010199844837188721, 0.00013199448585510254, 0.00016199052333831787, 0.0001919865608215332, 0.00022198259830474854, 0.00025197863578796387, 0.0002819746732711792, 0.00031197071075439453, 0.00034196674823760986, 0.0003719627857208252, 0.00040195882320404053, 0.00043195486068725586, 0.0004619508981704712, 0.0004919469356536865, 0.0005219429731369019, 0.0005519390106201172, 0.0005819350481033325, 0.0006119310855865479, 0.0006419271230697632, 0.0006719231605529785, 0.0007019191980361938, 0.0007319152355194092, 0.0007619112730026245, 0.0007919073104858398, 0.0008219033479690552, 0.0008518993854522705, 0.0008818954229354858, 0.0009118914604187012, 0.0009418874979019165, 0.0009718835353851318, 0.0010018795728683472, 0.0010318756103515625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 30.0, 23.0, 32.0, 48.0, 59.0, 92.0, 137.0, 192.0, 335.0, 450.0, 840.0, 1352.0, 2395.0, 4413.0, 8617.0, 17424.0, 37035.0, 78320.0, 155757.0, 238713.0, 228306.0, 139716.0, 69449.0, 32429.0, 15288.0, 7760.0, 3930.0, 2242.0, 1173.0, 729.0, 403.0, 238.0, 179.0, 127.0, 90.0, 53.0, 53.0, 28.0, 17.0, 15.0, 15.0, 8.0, 12.0, 8.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.8001708984375, -9.483154296875, -9.1661376953125, -8.84912109375, -8.5321044921875, -8.215087890625, -7.8980712890625, -7.5810546875, -7.2640380859375, -6.947021484375, -6.6300048828125, -6.31298828125, -5.9959716796875, -5.678955078125, -5.3619384765625, -5.044921875, -4.7279052734375, -4.410888671875, -4.0938720703125, -3.77685546875, -3.4598388671875, -3.142822265625, -2.8258056640625, -2.5087890625, -2.1917724609375, -1.874755859375, -1.5577392578125, -1.24072265625, -0.9237060546875, -0.606689453125, -0.2896728515625, 0.02734375, 0.3443603515625, 0.661376953125, 0.9783935546875, 1.29541015625, 1.6124267578125, 1.929443359375, 2.2464599609375, 2.5634765625, 2.8804931640625, 3.197509765625, 3.5145263671875, 3.83154296875, 4.1485595703125, 4.465576171875, 4.7825927734375, 5.099609375, 5.4166259765625, 5.733642578125, 6.0506591796875, 6.36767578125, 6.6846923828125, 7.001708984375, 7.3187255859375, 7.6357421875, 7.9527587890625, 8.269775390625, 8.5867919921875, 8.90380859375, 9.2208251953125, 9.537841796875, 9.8548583984375, 10.171875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 6.0, 6.0, 14.0, 18.0, 16.0, 20.0, 19.0, 33.0, 46.0, 43.0, 53.0, 53.0, 67.0, 63.0, 64.0, 77.0, 60.0, 64.0, 65.0, 44.0, 30.0, 25.0, 17.0, 19.0, 14.0, 8.0, 11.0, 1.0, 10.0, 4.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.5179443359375, -2.434326171875, -2.3507080078125, -2.26708984375, -2.1834716796875, -2.099853515625, -2.0162353515625, -1.9326171875, -1.8489990234375, -1.765380859375, -1.6817626953125, -1.59814453125, -1.5145263671875, -1.430908203125, -1.3472900390625, -1.263671875, -1.1800537109375, -1.096435546875, -1.0128173828125, -0.92919921875, -0.8455810546875, -0.761962890625, -0.6783447265625, -0.5947265625, -0.5111083984375, -0.427490234375, -0.3438720703125, -0.26025390625, -0.1766357421875, -0.093017578125, -0.0093994140625, 0.07421875, 0.1578369140625, 0.241455078125, 0.3250732421875, 0.40869140625, 0.4923095703125, 0.575927734375, 0.6595458984375, 0.7431640625, 0.8267822265625, 0.910400390625, 0.9940185546875, 1.07763671875, 1.1612548828125, 1.244873046875, 1.3284912109375, 1.412109375, 1.4957275390625, 1.579345703125, 1.6629638671875, 1.74658203125, 1.8302001953125, 1.913818359375, 1.9974365234375, 2.0810546875, 2.1646728515625, 2.248291015625, 2.3319091796875, 2.41552734375, 2.4991455078125, 2.582763671875, 2.6663818359375, 2.75]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 12.0, 8.0, 8.0, 12.0, 15.0, 9.0, 19.0, 33.0, 25.0, 33.0, 36.0, 37.0, 34.0, 37.0, 60.0, 43.0, 39.0, 43.0, 35.0, 56.0, 45.0, 50.0, 45.0, 38.0, 25.0, 26.0, 19.0, 18.0, 17.0, 14.0, 14.0, 17.0, 9.0, 12.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.719067573547363, -9.397351264953613, -9.07563591003418, -8.75391960144043, -8.43220329284668, -8.11048698425293, -7.788771152496338, -7.467055320739746, -7.145339012145996, -6.823622703552246, -6.501906871795654, -6.1801910400390625, -5.8584747314453125, -5.5367584228515625, -5.215042591094971, -4.893326759338379, -4.571610450744629, -4.249894142150879, -3.928178310394287, -3.606462240219116, -3.2847461700439453, -2.9630300998687744, -2.6413140296936035, -2.3195979595184326, -1.9978818893432617, -1.6761658191680908, -1.35444974899292, -1.032733678817749, -0.7110176086425781, -0.3893015384674072, -0.06758546829223633, 0.25413060188293457, 0.5758476257324219, 0.8975636959075928, 1.2192797660827637, 1.5409958362579346, 1.8627119064331055, 2.1844279766082764, 2.5061440467834473, 2.827860116958618, 3.149576187133789, 3.47129225730896, 3.793008327484131, 4.114724159240723, 4.436440467834473, 4.758156776428223, 5.0798726081848145, 5.401588439941406, 5.723304748535156, 6.045021057128906, 6.366736888885498, 6.68845272064209, 7.01016902923584, 7.33188533782959, 7.653601169586182, 7.975317001342773, 8.297033309936523, 8.618749618530273, 8.940465927124023, 9.262181282043457, 9.583897590637207, 9.905613899230957, 10.22732925415039, 10.54904556274414, 10.87076187133789]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 6.0, 6.0, 3.0, 17.0, 15.0, 19.0, 16.0, 20.0, 12.0, 27.0, 35.0, 27.0, 35.0, 34.0, 29.0, 49.0, 39.0, 44.0, 41.0, 40.0, 44.0, 36.0, 38.0, 44.0, 38.0, 33.0, 36.0, 24.0, 21.0, 24.0, 20.0, 22.0, 21.0, 20.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.343703269958496, -10.032953262329102, -9.722203254699707, -9.411454200744629, -9.100704193115234, -8.78995418548584, -8.479204177856445, -8.16845417022705, -7.8577046394348145, -7.54695463180542, -7.236205101013184, -6.925455093383789, -6.6147050857543945, -6.303955554962158, -5.993205547332764, -5.682456016540527, -5.371706008911133, -5.060956001281738, -4.750206470489502, -4.439456462860107, -4.128706932067871, -3.8179569244384766, -3.507206916809082, -3.1964571475982666, -2.885707378387451, -2.5749576091766357, -2.2642078399658203, -1.9534578323364258, -1.6427080631256104, -1.331958293914795, -1.02120840549469, -0.710458517074585, -0.39970970153808594, -0.08895987272262573, 0.22178995609283447, 0.5325397849082947, 0.8432896137237549, 1.1540393829345703, 1.4647892713546753, 1.7755391597747803, 2.0862889289855957, 2.397038698196411, 2.7077884674072266, 3.018538475036621, 3.3292882442474365, 3.640038013458252, 3.9507880210876465, 4.261537551879883, 4.572287559509277, 4.883037567138672, 5.193787097930908, 5.504537105560303, 5.815286636352539, 6.126036643981934, 6.436786651611328, 6.747536659240723, 7.058286190032959, 7.3690361976623535, 7.67978572845459, 7.990535736083984, 8.301285743713379, 8.612035751342773, 8.922784805297852, 9.233534812927246, 9.54428482055664]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 17.0, 24.0, 44.0, 53.0, 70.0, 121.0, 180.0, 290.0, 477.0, 692.0, 1167.0, 1808.0, 2929.0, 4538.0, 7566.0, 12299.0, 20815.0, 35748.0, 62829.0, 112185.0, 203305.0, 370422.0, 610841.0, 800621.0, 751076.0, 518889.0, 298203.0, 162118.0, 88962.0, 50514.0, 29569.0, 17444.0, 10642.0, 6377.0, 4108.0, 2582.0, 1609.0, 1039.0, 712.0, 479.0, 318.0, 196.0, 119.0, 85.0, 66.0, 47.0, 19.0, 18.0, 14.0, 15.0, 4.0, 9.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.234375, -7.9755859375, -7.716796875, -7.4580078125, -7.19921875, -6.9404296875, -6.681640625, -6.4228515625, -6.1640625, -5.9052734375, -5.646484375, -5.3876953125, -5.12890625, -4.8701171875, -4.611328125, -4.3525390625, -4.09375, -3.8349609375, -3.576171875, -3.3173828125, -3.05859375, -2.7998046875, -2.541015625, -2.2822265625, -2.0234375, -1.7646484375, -1.505859375, -1.2470703125, -0.98828125, -0.7294921875, -0.470703125, -0.2119140625, 0.046875, 0.3056640625, 0.564453125, 0.8232421875, 1.08203125, 1.3408203125, 1.599609375, 1.8583984375, 2.1171875, 2.3759765625, 2.634765625, 2.8935546875, 3.15234375, 3.4111328125, 3.669921875, 3.9287109375, 4.1875, 4.4462890625, 4.705078125, 4.9638671875, 5.22265625, 5.4814453125, 5.740234375, 5.9990234375, 6.2578125, 6.5166015625, 6.775390625, 7.0341796875, 7.29296875, 7.5517578125, 7.810546875, 8.0693359375, 8.328125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 6.0, 6.0, 8.0, 8.0, 8.0, 9.0, 11.0, 18.0, 17.0, 24.0, 15.0, 30.0, 25.0, 30.0, 30.0, 31.0, 29.0, 34.0, 51.0, 28.0, 43.0, 49.0, 38.0, 42.0, 36.0, 25.0, 43.0, 46.0, 30.0, 30.0, 33.0, 19.0, 14.0, 17.0, 21.0, 16.0, 20.0, 10.0, 9.0, 14.0, 5.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.015625, -6.80096435546875, -6.5863037109375, -6.37164306640625, -6.156982421875, -5.94232177734375, -5.7276611328125, -5.51300048828125, -5.29833984375, -5.08367919921875, -4.8690185546875, -4.65435791015625, -4.439697265625, -4.22503662109375, -4.0103759765625, -3.79571533203125, -3.5810546875, -3.36639404296875, -3.1517333984375, -2.93707275390625, -2.722412109375, -2.50775146484375, -2.2930908203125, -2.07843017578125, -1.86376953125, -1.64910888671875, -1.4344482421875, -1.21978759765625, -1.005126953125, -0.79046630859375, -0.5758056640625, -0.36114501953125, -0.146484375, 0.06817626953125, 0.2828369140625, 0.49749755859375, 0.712158203125, 0.92681884765625, 1.1414794921875, 1.35614013671875, 1.57080078125, 1.78546142578125, 2.0001220703125, 2.21478271484375, 2.429443359375, 2.64410400390625, 2.8587646484375, 3.07342529296875, 3.2880859375, 3.50274658203125, 3.7174072265625, 3.93206787109375, 4.146728515625, 4.36138916015625, 4.5760498046875, 4.79071044921875, 5.00537109375, 5.22003173828125, 5.4346923828125, 5.64935302734375, 5.864013671875, 6.07867431640625, 6.2933349609375, 6.50799560546875, 6.72265625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 18.0, 21.0, 26.0, 41.0, 82.0, 122.0, 178.0, 306.0, 454.0, 785.0, 1216.0, 2084.0, 3358.0, 5603.0, 9921.0, 17056.0, 29552.0, 52403.0, 93519.0, 167999.0, 296895.0, 495000.0, 721810.0, 788104.0, 611985.0, 386256.0, 222038.0, 125412.0, 69962.0, 39324.0, 21911.0, 12688.0, 7206.0, 4317.0, 2609.0, 1491.0, 919.0, 607.0, 381.0, 240.0, 123.0, 93.0, 68.0, 27.0, 25.0, 17.0, 8.0, 6.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.2734375, -8.98583984375, -8.6982421875, -8.41064453125, -8.123046875, -7.83544921875, -7.5478515625, -7.26025390625, -6.97265625, -6.68505859375, -6.3974609375, -6.10986328125, -5.822265625, -5.53466796875, -5.2470703125, -4.95947265625, -4.671875, -4.38427734375, -4.0966796875, -3.80908203125, -3.521484375, -3.23388671875, -2.9462890625, -2.65869140625, -2.37109375, -2.08349609375, -1.7958984375, -1.50830078125, -1.220703125, -0.93310546875, -0.6455078125, -0.35791015625, -0.0703125, 0.21728515625, 0.5048828125, 0.79248046875, 1.080078125, 1.36767578125, 1.6552734375, 1.94287109375, 2.23046875, 2.51806640625, 2.8056640625, 3.09326171875, 3.380859375, 3.66845703125, 3.9560546875, 4.24365234375, 4.53125, 4.81884765625, 5.1064453125, 5.39404296875, 5.681640625, 5.96923828125, 6.2568359375, 6.54443359375, 6.83203125, 7.11962890625, 7.4072265625, 7.69482421875, 7.982421875, 8.27001953125, 8.5576171875, 8.84521484375, 9.1328125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 10.0, 11.0, 12.0, 18.0, 20.0, 39.0, 36.0, 54.0, 66.0, 92.0, 113.0, 150.0, 162.0, 212.0, 234.0, 253.0, 265.0, 278.0, 281.0, 259.0, 245.0, 222.0, 224.0, 164.0, 147.0, 108.0, 112.0, 80.0, 61.0, 44.0, 29.0, 19.0, 9.0, 8.0, 11.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.089874267578125, -3.96881103515625, -3.847747802734375, -3.7266845703125, -3.605621337890625, -3.48455810546875, -3.363494873046875, -3.242431640625, -3.121368408203125, -3.00030517578125, -2.879241943359375, -2.7581787109375, -2.637115478515625, -2.51605224609375, -2.394989013671875, -2.27392578125, -2.152862548828125, -2.03179931640625, -1.910736083984375, -1.7896728515625, -1.668609619140625, -1.54754638671875, -1.426483154296875, -1.305419921875, -1.184356689453125, -1.06329345703125, -0.942230224609375, -0.8211669921875, -0.700103759765625, -0.57904052734375, -0.457977294921875, -0.3369140625, -0.215850830078125, -0.09478759765625, 0.026275634765625, 0.1473388671875, 0.268402099609375, 0.38946533203125, 0.510528564453125, 0.631591796875, 0.752655029296875, 0.87371826171875, 0.994781494140625, 1.1158447265625, 1.236907958984375, 1.35797119140625, 1.479034423828125, 1.60009765625, 1.721160888671875, 1.84222412109375, 1.963287353515625, 2.0843505859375, 2.205413818359375, 2.32647705078125, 2.447540283203125, 2.568603515625, 2.689666748046875, 2.81072998046875, 2.931793212890625, 3.0528564453125, 3.173919677734375, 3.29498291015625, 3.416046142578125, 3.537109375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 1.0, 1.0, 9.0, 8.0, 5.0, 8.0, 15.0, 8.0, 15.0, 26.0, 18.0, 21.0, 23.0, 17.0, 36.0, 38.0, 44.0, 58.0, 44.0, 53.0, 53.0, 46.0, 43.0, 47.0, 55.0, 36.0, 38.0, 33.0, 42.0, 19.0, 25.0, 18.0, 20.0, 13.0, 10.0, 14.0, 4.0, 12.0, 9.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.56761646270752, -9.275262832641602, -8.982908248901367, -8.69055461883545, -8.398200035095215, -8.105846405029297, -7.813492298126221, -7.5211381912231445, -7.228784561157227, -6.93643045425415, -6.644076347351074, -6.351722717285156, -6.05936861038208, -5.767014503479004, -5.474660396575928, -5.182306289672852, -4.889952182769775, -4.597598075866699, -4.305243968963623, -4.012889862060547, -3.720536231994629, -3.4281821250915527, -3.1358280181884766, -2.8434741497039795, -2.5511200428009033, -2.258765935897827, -1.96641206741333, -1.674057960510254, -1.3817039728164673, -1.0893499851226807, -0.7969958782196045, -0.5046420097351074, -0.21228790283203125, 0.08006611466407776, 0.37242013216018677, 0.6647741794586182, 0.9571281671524048, 1.2494821548461914, 1.5418362617492676, 1.8341901302337646, 2.126544237136841, 2.418898344039917, 2.711252212524414, 3.0036063194274902, 3.2959604263305664, 3.5883142948150635, 3.8806684017181396, 4.173022270202637, 4.465376377105713, 4.757730484008789, 5.050084590911865, 5.342438697814941, 5.634792327880859, 5.9271464347839355, 6.219500541687012, 6.51185417175293, 6.804208755493164, 7.09656286239624, 7.388916969299316, 7.681270599365234, 7.9736247062683105, 8.265978813171387, 8.558332443237305, 8.850687026977539, 9.143040657043457]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 7.0, 4.0, 11.0, 2.0, 6.0, 16.0, 12.0, 8.0, 15.0, 20.0, 14.0, 25.0, 30.0, 34.0, 27.0, 43.0, 42.0, 36.0, 42.0, 45.0, 45.0, 41.0, 39.0, 45.0, 44.0, 29.0, 42.0, 39.0, 36.0, 26.0, 21.0, 25.0, 23.0, 16.0, 12.0, 20.0, 10.0, 10.0, 13.0, 10.0, 6.0, 1.0, 2.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.662756443023682, -7.401858806610107, -7.140961647033691, -6.880064010620117, -6.619166851043701, -6.358269214630127, -6.097372055053711, -5.836474418640137, -5.5755767822265625, -5.314679145812988, -5.053781986236572, -4.792884349822998, -4.531987190246582, -4.271089553833008, -4.010191917419434, -3.7492947578430176, -3.4883975982666016, -3.2275002002716064, -2.9666028022766113, -2.705705165863037, -2.444808006286621, -2.183910369873047, -1.9230129718780518, -1.6621155738830566, -1.4012181758880615, -1.1403207778930664, -0.8794233202934265, -0.6185258626937866, -0.3576284646987915, -0.09673106670379639, 0.16416645050048828, 0.4250638484954834, 0.6859617233276367, 0.9468591213226318, 1.207756519317627, 1.4686540365219116, 1.7295514345169067, 1.9904488325119019, 2.2513463497161865, 2.5122437477111816, 2.7731411457061768, 3.034038543701172, 3.294935941696167, 3.555833339691162, 3.8167309761047363, 4.077628135681152, 4.338525772094727, 4.599423408508301, 4.860320568084717, 5.121218204498291, 5.382115364074707, 5.643013000488281, 5.903910160064697, 6.1648077964782715, 6.4257049560546875, 6.686602592468262, 6.947500228881836, 7.20839786529541, 7.469295024871826, 7.7301926612854, 7.991089820861816, 8.25198745727539, 8.512885093688965, 8.773782730102539, 9.034679412841797]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 12.0, 5.0, 13.0, 29.0, 53.0, 83.0, 130.0, 157.0, 259.0, 388.0, 647.0, 922.0, 1470.0, 2454.0, 3909.0, 6557.0, 12383.0, 24185.0, 49598.0, 105272.0, 205733.0, 270700.0, 183630.0, 90225.0, 42556.0, 20627.0, 10956.0, 6044.0, 3522.0, 2118.0, 1384.0, 895.0, 559.0, 366.0, 230.0, 161.0, 106.0, 81.0, 37.0, 28.0, 20.0, 15.0, 15.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.2890625, -8.033203125, -7.77734375, -7.521484375, -7.265625, -7.009765625, -6.75390625, -6.498046875, -6.2421875, -5.986328125, -5.73046875, -5.474609375, -5.21875, -4.962890625, -4.70703125, -4.451171875, -4.1953125, -3.939453125, -3.68359375, -3.427734375, -3.171875, -2.916015625, -2.66015625, -2.404296875, -2.1484375, -1.892578125, -1.63671875, -1.380859375, -1.125, -0.869140625, -0.61328125, -0.357421875, -0.1015625, 0.154296875, 0.41015625, 0.666015625, 0.921875, 1.177734375, 1.43359375, 1.689453125, 1.9453125, 2.201171875, 2.45703125, 2.712890625, 2.96875, 3.224609375, 3.48046875, 3.736328125, 3.9921875, 4.248046875, 4.50390625, 4.759765625, 5.015625, 5.271484375, 5.52734375, 5.783203125, 6.0390625, 6.294921875, 6.55078125, 6.806640625, 7.0625, 7.318359375, 7.57421875, 7.830078125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 6.0, 8.0, 7.0, 8.0, 12.0, 16.0, 13.0, 15.0, 11.0, 18.0, 22.0, 16.0, 29.0, 32.0, 41.0, 32.0, 42.0, 51.0, 42.0, 30.0, 41.0, 38.0, 40.0, 49.0, 34.0, 38.0, 37.0, 29.0, 27.0, 32.0, 32.0, 12.0, 14.0, 17.0, 17.0, 11.0, 16.0, 14.0, 6.0, 8.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.14453125, -6.89788818359375, -6.6512451171875, -6.40460205078125, -6.157958984375, -5.91131591796875, -5.6646728515625, -5.41802978515625, -5.17138671875, -4.92474365234375, -4.6781005859375, -4.43145751953125, -4.184814453125, -3.93817138671875, -3.6915283203125, -3.44488525390625, -3.1982421875, -2.95159912109375, -2.7049560546875, -2.45831298828125, -2.211669921875, -1.96502685546875, -1.7183837890625, -1.47174072265625, -1.22509765625, -0.97845458984375, -0.7318115234375, -0.48516845703125, -0.238525390625, 0.00811767578125, 0.2547607421875, 0.50140380859375, 0.748046875, 0.99468994140625, 1.2413330078125, 1.48797607421875, 1.734619140625, 1.98126220703125, 2.2279052734375, 2.47454833984375, 2.72119140625, 2.96783447265625, 3.2144775390625, 3.46112060546875, 3.707763671875, 3.95440673828125, 4.2010498046875, 4.44769287109375, 4.6943359375, 4.94097900390625, 5.1876220703125, 5.43426513671875, 5.680908203125, 5.92755126953125, 6.1741943359375, 6.42083740234375, 6.66748046875, 6.91412353515625, 7.1607666015625, 7.40740966796875, 7.654052734375, 7.90069580078125, 8.1473388671875, 8.39398193359375, 8.640625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 15.0, 13.0, 23.0, 31.0, 51.0, 47.0, 88.0, 135.0, 193.0, 272.0, 431.0, 625.0, 1057.0, 1512.0, 2485.0, 4049.0, 6672.0, 11366.0, 21519.0, 64316.0, 843820.0, 44243.0, 18870.0, 10463.0, 5959.0, 3735.0, 2368.0, 1402.0, 910.0, 635.0, 400.0, 252.0, 201.0, 128.0, 83.0, 47.0, 33.0, 29.0, 23.0, 25.0, 7.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.28125, -9.9908447265625, -9.700439453125, -9.4100341796875, -9.11962890625, -8.8292236328125, -8.538818359375, -8.2484130859375, -7.9580078125, -7.6676025390625, -7.377197265625, -7.0867919921875, -6.79638671875, -6.5059814453125, -6.215576171875, -5.9251708984375, -5.634765625, -5.3443603515625, -5.053955078125, -4.7635498046875, -4.47314453125, -4.1827392578125, -3.892333984375, -3.6019287109375, -3.3115234375, -3.0211181640625, -2.730712890625, -2.4403076171875, -2.14990234375, -1.8594970703125, -1.569091796875, -1.2786865234375, -0.98828125, -0.6978759765625, -0.407470703125, -0.1170654296875, 0.17333984375, 0.4637451171875, 0.754150390625, 1.0445556640625, 1.3349609375, 1.6253662109375, 1.915771484375, 2.2061767578125, 2.49658203125, 2.7869873046875, 3.077392578125, 3.3677978515625, 3.658203125, 3.9486083984375, 4.239013671875, 4.5294189453125, 4.81982421875, 5.1102294921875, 5.400634765625, 5.6910400390625, 5.9814453125, 6.2718505859375, 6.562255859375, 6.8526611328125, 7.14306640625, 7.4334716796875, 7.723876953125, 8.0142822265625, 8.3046875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 6.0, 5.0, 11.0, 8.0, 19.0, 13.0, 14.0, 22.0, 20.0, 17.0, 29.0, 36.0, 24.0, 31.0, 43.0, 36.0, 31.0, 50.0, 34.0, 42.0, 39.0, 43.0, 36.0, 41.0, 40.0, 34.0, 33.0, 22.0, 28.0, 24.0, 24.0, 19.0, 22.0, 10.0, 12.0, 14.0, 8.0, 6.0, 8.0, 12.0, 4.0, 4.0, 10.0, 2.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.78448486328125, -5.5845947265625, -5.38470458984375, -5.184814453125, -4.98492431640625, -4.7850341796875, -4.58514404296875, -4.38525390625, -4.18536376953125, -3.9854736328125, -3.78558349609375, -3.585693359375, -3.38580322265625, -3.1859130859375, -2.98602294921875, -2.7861328125, -2.58624267578125, -2.3863525390625, -2.18646240234375, -1.986572265625, -1.78668212890625, -1.5867919921875, -1.38690185546875, -1.18701171875, -0.98712158203125, -0.7872314453125, -0.58734130859375, -0.387451171875, -0.18756103515625, 0.0123291015625, 0.21221923828125, 0.412109375, 0.61199951171875, 0.8118896484375, 1.01177978515625, 1.211669921875, 1.41156005859375, 1.6114501953125, 1.81134033203125, 2.01123046875, 2.21112060546875, 2.4110107421875, 2.61090087890625, 2.810791015625, 3.01068115234375, 3.2105712890625, 3.41046142578125, 3.6103515625, 3.81024169921875, 4.0101318359375, 4.21002197265625, 4.409912109375, 4.60980224609375, 4.8096923828125, 5.00958251953125, 5.20947265625, 5.40936279296875, 5.6092529296875, 5.80914306640625, 6.009033203125, 6.20892333984375, 6.4088134765625, 6.60870361328125, 6.80859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 5.0, 9.0, 7.0, 11.0, 25.0, 29.0, 41.0, 59.0, 104.0, 144.0, 219.0, 329.0, 557.0, 896.0, 1604.0, 2985.0, 5978.0, 13948.0, 44478.0, 903255.0, 45795.0, 14525.0, 6409.0, 3140.0, 1557.0, 979.0, 506.0, 354.0, 190.0, 130.0, 87.0, 63.0, 27.0, 30.0, 17.0, 13.0, 12.0, 9.0, 7.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.546875, -6.32501220703125, -6.1031494140625, -5.88128662109375, -5.659423828125, -5.43756103515625, -5.2156982421875, -4.99383544921875, -4.77197265625, -4.55010986328125, -4.3282470703125, -4.10638427734375, -3.884521484375, -3.66265869140625, -3.4407958984375, -3.21893310546875, -2.9970703125, -2.77520751953125, -2.5533447265625, -2.33148193359375, -2.109619140625, -1.88775634765625, -1.6658935546875, -1.44403076171875, -1.22216796875, -1.00030517578125, -0.7784423828125, -0.55657958984375, -0.334716796875, -0.11285400390625, 0.1090087890625, 0.33087158203125, 0.552734375, 0.77459716796875, 0.9964599609375, 1.21832275390625, 1.440185546875, 1.66204833984375, 1.8839111328125, 2.10577392578125, 2.32763671875, 2.54949951171875, 2.7713623046875, 2.99322509765625, 3.215087890625, 3.43695068359375, 3.6588134765625, 3.88067626953125, 4.1025390625, 4.32440185546875, 4.5462646484375, 4.76812744140625, 4.989990234375, 5.21185302734375, 5.4337158203125, 5.65557861328125, 5.87744140625, 6.09930419921875, 6.3211669921875, 6.54302978515625, 6.764892578125, 6.98675537109375, 7.2086181640625, 7.43048095703125, 7.65234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 8.0, 10.0, 10.0, 21.0, 23.0, 26.0, 55.0, 69.0, 85.0, 126.0, 132.0, 115.0, 81.0, 60.0, 45.0, 16.0, 21.0, 19.0, 8.0, 15.0, 15.0, 5.0, 5.0, 6.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005664825439453125, -0.0005449503660202026, -0.0005234181880950928, -0.0005018860101699829, -0.00048035383224487305, -0.0004588216543197632, -0.0004372894763946533, -0.00041575729846954346, -0.0003942251205444336, -0.00037269294261932373, -0.00035116076469421387, -0.000329628586769104, -0.00030809640884399414, -0.0002865642309188843, -0.0002650320529937744, -0.00024349987506866455, -0.0002219676971435547, -0.00020043551921844482, -0.00017890334129333496, -0.0001573711633682251, -0.00013583898544311523, -0.00011430680751800537, -9.277462959289551e-05, -7.124245166778564e-05, -4.971027374267578e-05, -2.8178095817565918e-05, -6.645917892456055e-06, 1.4886260032653809e-05, 3.641843795776367e-05, 5.7950615882873535e-05, 7.94827938079834e-05, 0.00010101497173309326, 0.00012254714965820312, 0.000144079327583313, 0.00016561150550842285, 0.00018714368343353271, 0.00020867586135864258, 0.00023020803928375244, 0.0002517402172088623, 0.00027327239513397217, 0.00029480457305908203, 0.0003163367509841919, 0.00033786892890930176, 0.0003594011068344116, 0.0003809332847595215, 0.00040246546268463135, 0.0004239976406097412, 0.0004455298185348511, 0.00046706199645996094, 0.0004885941743850708, 0.0005101263523101807, 0.0005316585302352905, 0.0005531907081604004, 0.0005747228860855103, 0.0005962550640106201, 0.00061778724193573, 0.0006393194198608398, 0.0006608515977859497, 0.0006823837757110596, 0.0007039159536361694, 0.0007254481315612793, 0.0007469803094863892, 0.000768512487411499, 0.0007900446653366089, 0.0008115768432617188]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 11.0, 22.0, 33.0, 47.0, 59.0, 78.0, 105.0, 199.0, 286.0, 400.0, 640.0, 1040.0, 1559.0, 2497.0, 3764.0, 6036.0, 9585.0, 15677.0, 26419.0, 45234.0, 80064.0, 139462.0, 212095.0, 201431.0, 126590.0, 71734.0, 40948.0, 23863.0, 14519.0, 8981.0, 5420.0, 3468.0, 2239.0, 1375.0, 894.0, 583.0, 411.0, 252.0, 181.0, 118.0, 81.0, 43.0, 35.0, 32.0, 13.0, 9.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.9306640625, -1.8719940185546875, -1.813323974609375, -1.7546539306640625, -1.69598388671875, -1.6373138427734375, -1.578643798828125, -1.5199737548828125, -1.4613037109375, -1.4026336669921875, -1.343963623046875, -1.2852935791015625, -1.22662353515625, -1.1679534912109375, -1.109283447265625, -1.0506134033203125, -0.991943359375, -0.9332733154296875, -0.874603271484375, -0.8159332275390625, -0.75726318359375, -0.6985931396484375, -0.639923095703125, -0.5812530517578125, -0.5225830078125, -0.4639129638671875, -0.405242919921875, -0.3465728759765625, -0.28790283203125, -0.2292327880859375, -0.170562744140625, -0.1118927001953125, -0.05322265625, 0.0054473876953125, 0.064117431640625, 0.1227874755859375, 0.18145751953125, 0.2401275634765625, 0.298797607421875, 0.3574676513671875, 0.4161376953125, 0.4748077392578125, 0.533477783203125, 0.5921478271484375, 0.65081787109375, 0.7094879150390625, 0.768157958984375, 0.8268280029296875, 0.885498046875, 0.9441680908203125, 1.002838134765625, 1.0615081787109375, 1.12017822265625, 1.1788482666015625, 1.237518310546875, 1.2961883544921875, 1.3548583984375, 1.4135284423828125, 1.472198486328125, 1.5308685302734375, 1.58953857421875, 1.6482086181640625, 1.706878662109375, 1.7655487060546875, 1.82421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 6.0, 10.0, 12.0, 7.0, 18.0, 26.0, 20.0, 12.0, 28.0, 25.0, 31.0, 30.0, 43.0, 35.0, 53.0, 46.0, 51.0, 51.0, 63.0, 54.0, 43.0, 42.0, 36.0, 32.0, 32.0, 25.0, 22.0, 26.0, 19.0, 18.0, 13.0, 9.0, 8.0, 12.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.563812255859375, -0.54754638671875, -0.531280517578125, -0.5150146484375, -0.498748779296875, -0.48248291015625, -0.466217041015625, -0.449951171875, -0.433685302734375, -0.41741943359375, -0.401153564453125, -0.3848876953125, -0.368621826171875, -0.35235595703125, -0.336090087890625, -0.31982421875, -0.303558349609375, -0.28729248046875, -0.271026611328125, -0.2547607421875, -0.238494873046875, -0.22222900390625, -0.205963134765625, -0.189697265625, -0.173431396484375, -0.15716552734375, -0.140899658203125, -0.1246337890625, -0.108367919921875, -0.09210205078125, -0.075836181640625, -0.0595703125, -0.043304443359375, -0.02703857421875, -0.010772705078125, 0.0054931640625, 0.021759033203125, 0.03802490234375, 0.054290771484375, 0.070556640625, 0.086822509765625, 0.10308837890625, 0.119354248046875, 0.1356201171875, 0.151885986328125, 0.16815185546875, 0.184417724609375, 0.20068359375, 0.216949462890625, 0.23321533203125, 0.249481201171875, 0.2657470703125, 0.282012939453125, 0.29827880859375, 0.314544677734375, 0.330810546875, 0.347076416015625, 0.36334228515625, 0.379608154296875, 0.3958740234375, 0.412139892578125, 0.42840576171875, 0.444671630859375, 0.4609375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 8.0, 5.0, 12.0, 13.0, 12.0, 21.0, 10.0, 31.0, 21.0, 24.0, 18.0, 37.0, 40.0, 48.0, 42.0, 48.0, 46.0, 54.0, 44.0, 51.0, 37.0, 47.0, 52.0, 50.0, 32.0, 32.0, 34.0, 16.0, 10.0, 15.0, 13.0, 17.0, 11.0, 6.0, 6.0, 6.0, 4.0, 7.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-10.060894012451172, -9.771018028259277, -9.4811429977417, -9.191267013549805, -8.901391983032227, -8.611515998840332, -8.321640968322754, -8.03176498413086, -7.741889476776123, -7.452013969421387, -7.16213846206665, -6.872262954711914, -6.5823869705200195, -6.292511940002441, -6.002635955810547, -5.7127604484558105, -5.422884941101074, -5.133009433746338, -4.843133926391602, -4.553258419036865, -4.263382911682129, -3.9735071659088135, -3.683631420135498, -3.3937559127807617, -3.1038804054260254, -2.814004898071289, -2.5241293907165527, -2.2342536449432373, -1.944378137588501, -1.6545026302337646, -1.3646270036697388, -1.074751377105713, -0.7848758697509766, -0.49500030279159546, -0.20512473583221436, 0.08475083112716675, 0.37462639808654785, 0.6645019054412842, 0.9543775320053101, 1.244253158569336, 1.5341286659240723, 1.8240041732788086, 2.113879680633545, 2.4037554264068604, 2.6936309337615967, 2.983506441116333, 3.2733821868896484, 3.5632576942443848, 3.853133201599121, 4.143008708953857, 4.432884216308594, 4.72275972366333, 5.012635231018066, 5.302511215209961, 5.592386722564697, 5.882262229919434, 6.17213773727417, 6.462013244628906, 6.751888751983643, 7.041764259338379, 7.331640243530273, 7.621515274047852, 7.911391258239746, 8.20126724243164, 8.491142272949219]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 8.0, 14.0, 5.0, 16.0, 9.0, 13.0, 17.0, 24.0, 22.0, 26.0, 30.0, 45.0, 37.0, 38.0, 46.0, 38.0, 40.0, 50.0, 43.0, 43.0, 49.0, 35.0, 33.0, 39.0, 35.0, 34.0, 31.0, 18.0, 22.0, 19.0, 26.0, 12.0, 11.0, 13.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.855771541595459, -7.594684600830078, -7.3335981369018555, -7.072511196136475, -6.811424255371094, -6.550337791442871, -6.28925085067749, -6.028163909912109, -5.767077445983887, -5.505990505218506, -5.244904041290283, -4.983817100524902, -4.72273063659668, -4.461643695831299, -4.200556755065918, -3.939470052719116, -3.6783833503723145, -3.4172966480255127, -3.156209945678711, -2.89512300491333, -2.6340363025665283, -2.3729496002197266, -2.1118626594543457, -1.850775957107544, -1.5896892547607422, -1.3286025524139404, -1.0675157308578491, -0.8064289689064026, -0.545342206954956, -0.2842555046081543, -0.02316868305206299, 0.23791813850402832, 0.4990043640136719, 0.7600911259651184, 1.021177887916565, 1.2822647094726562, 1.543351411819458, 1.8044381141662598, 2.0655250549316406, 2.3266117572784424, 2.587698459625244, 2.848785161972046, 3.1098718643188477, 3.3709588050842285, 3.6320455074310303, 3.893132209777832, 4.154219150543213, 4.415306091308594, 4.676392555236816, 4.937479496002197, 5.19856595993042, 5.459652900695801, 5.720739364624023, 5.981826305389404, 6.242913246154785, 6.503999710083008, 6.765086650848389, 7.0261735916137695, 7.287260055541992, 7.548346996307373, 7.809433937072754, 8.070520401000977, 8.3316068649292, 8.592694282531738, 8.853780746459961]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 11.0, 11.0, 22.0, 31.0, 54.0, 83.0, 137.0, 178.0, 315.0, 464.0, 862.0, 1225.0, 1957.0, 3137.0, 4978.0, 7774.0, 12057.0, 18977.0, 29103.0, 43546.0, 63881.0, 88546.0, 113429.0, 129365.0, 129841.0, 114158.0, 90403.0, 65683.0, 44813.0, 29899.0, 19306.0, 12518.0, 8036.0, 5036.0, 3167.0, 2001.0, 1315.0, 780.0, 529.0, 329.0, 242.0, 140.0, 75.0, 41.0, 36.0, 22.0, 15.0, 12.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-9.7421875, -9.4559326171875, -9.169677734375, -8.8834228515625, -8.59716796875, -8.3109130859375, -8.024658203125, -7.7384033203125, -7.4521484375, -7.1658935546875, -6.879638671875, -6.5933837890625, -6.30712890625, -6.0208740234375, -5.734619140625, -5.4483642578125, -5.162109375, -4.8758544921875, -4.589599609375, -4.3033447265625, -4.01708984375, -3.7308349609375, -3.444580078125, -3.1583251953125, -2.8720703125, -2.5858154296875, -2.299560546875, -2.0133056640625, -1.72705078125, -1.4407958984375, -1.154541015625, -0.8682861328125, -0.58203125, -0.2957763671875, -0.009521484375, 0.2767333984375, 0.56298828125, 0.8492431640625, 1.135498046875, 1.4217529296875, 1.7080078125, 1.9942626953125, 2.280517578125, 2.5667724609375, 2.85302734375, 3.1392822265625, 3.425537109375, 3.7117919921875, 3.998046875, 4.2843017578125, 4.570556640625, 4.8568115234375, 5.14306640625, 5.4293212890625, 5.715576171875, 6.0018310546875, 6.2880859375, 6.5743408203125, 6.860595703125, 7.1468505859375, 7.43310546875, 7.7193603515625, 8.005615234375, 8.2918701171875, 8.578125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 5.0, 5.0, 10.0, 6.0, 15.0, 13.0, 13.0, 10.0, 12.0, 16.0, 23.0, 25.0, 13.0, 27.0, 38.0, 40.0, 30.0, 41.0, 33.0, 37.0, 41.0, 43.0, 44.0, 39.0, 37.0, 27.0, 37.0, 34.0, 25.0, 33.0, 32.0, 31.0, 28.0, 10.0, 16.0, 7.0, 16.0, 15.0, 15.0, 11.0, 12.0, 8.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-7.0625, -6.8468017578125, -6.631103515625, -6.4154052734375, -6.19970703125, -5.9840087890625, -5.768310546875, -5.5526123046875, -5.3369140625, -5.1212158203125, -4.905517578125, -4.6898193359375, -4.47412109375, -4.2584228515625, -4.042724609375, -3.8270263671875, -3.611328125, -3.3956298828125, -3.179931640625, -2.9642333984375, -2.74853515625, -2.5328369140625, -2.317138671875, -2.1014404296875, -1.8857421875, -1.6700439453125, -1.454345703125, -1.2386474609375, -1.02294921875, -0.8072509765625, -0.591552734375, -0.3758544921875, -0.16015625, 0.0555419921875, 0.271240234375, 0.4869384765625, 0.70263671875, 0.9183349609375, 1.134033203125, 1.3497314453125, 1.5654296875, 1.7811279296875, 1.996826171875, 2.2125244140625, 2.42822265625, 2.6439208984375, 2.859619140625, 3.0753173828125, 3.291015625, 3.5067138671875, 3.722412109375, 3.9381103515625, 4.15380859375, 4.3695068359375, 4.585205078125, 4.8009033203125, 5.0166015625, 5.2322998046875, 5.447998046875, 5.6636962890625, 5.87939453125, 6.0950927734375, 6.310791015625, 6.5264892578125, 6.7421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 17.0, 27.0, 34.0, 53.0, 75.0, 135.0, 196.0, 294.0, 426.0, 610.0, 961.0, 1530.0, 2176.0, 3489.0, 4966.0, 7708.0, 11825.0, 17313.0, 25558.0, 36354.0, 50381.0, 68076.0, 87439.0, 104432.0, 113779.0, 112589.0, 100717.0, 82802.0, 63753.0, 46737.0, 33383.0, 23103.0, 15772.0, 10533.0, 7175.0, 4839.0, 3165.0, 2170.0, 1403.0, 858.0, 580.0, 368.0, 252.0, 182.0, 116.0, 67.0, 42.0, 37.0, 21.0, 9.0, 9.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.08203125, -6.85272216796875, -6.6234130859375, -6.39410400390625, -6.164794921875, -5.93548583984375, -5.7061767578125, -5.47686767578125, -5.24755859375, -5.01824951171875, -4.7889404296875, -4.55963134765625, -4.330322265625, -4.10101318359375, -3.8717041015625, -3.64239501953125, -3.4130859375, -3.18377685546875, -2.9544677734375, -2.72515869140625, -2.495849609375, -2.26654052734375, -2.0372314453125, -1.80792236328125, -1.57861328125, -1.34930419921875, -1.1199951171875, -0.89068603515625, -0.661376953125, -0.43206787109375, -0.2027587890625, 0.02655029296875, 0.255859375, 0.48516845703125, 0.7144775390625, 0.94378662109375, 1.173095703125, 1.40240478515625, 1.6317138671875, 1.86102294921875, 2.09033203125, 2.31964111328125, 2.5489501953125, 2.77825927734375, 3.007568359375, 3.23687744140625, 3.4661865234375, 3.69549560546875, 3.9248046875, 4.15411376953125, 4.3834228515625, 4.61273193359375, 4.842041015625, 5.07135009765625, 5.3006591796875, 5.52996826171875, 5.75927734375, 5.98858642578125, 6.2178955078125, 6.44720458984375, 6.676513671875, 6.90582275390625, 7.1351318359375, 7.36444091796875, 7.59375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 9.0, 9.0, 4.0, 11.0, 19.0, 8.0, 11.0, 25.0, 26.0, 30.0, 33.0, 29.0, 42.0, 28.0, 39.0, 38.0, 32.0, 36.0, 38.0, 43.0, 53.0, 47.0, 38.0, 52.0, 37.0, 40.0, 28.0, 23.0, 23.0, 22.0, 21.0, 18.0, 17.0, 17.0, 12.0, 17.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.68511962890625, -4.5225830078125, -4.36004638671875, -4.197509765625, -4.03497314453125, -3.8724365234375, -3.70989990234375, -3.54736328125, -3.38482666015625, -3.2222900390625, -3.05975341796875, -2.897216796875, -2.73468017578125, -2.5721435546875, -2.40960693359375, -2.2470703125, -2.08453369140625, -1.9219970703125, -1.75946044921875, -1.596923828125, -1.43438720703125, -1.2718505859375, -1.10931396484375, -0.94677734375, -0.78424072265625, -0.6217041015625, -0.45916748046875, -0.296630859375, -0.13409423828125, 0.0284423828125, 0.19097900390625, 0.353515625, 0.51605224609375, 0.6785888671875, 0.84112548828125, 1.003662109375, 1.16619873046875, 1.3287353515625, 1.49127197265625, 1.65380859375, 1.81634521484375, 1.9788818359375, 2.14141845703125, 2.303955078125, 2.46649169921875, 2.6290283203125, 2.79156494140625, 2.9541015625, 3.11663818359375, 3.2791748046875, 3.44171142578125, 3.604248046875, 3.76678466796875, 3.9293212890625, 4.09185791015625, 4.25439453125, 4.41693115234375, 4.5794677734375, 4.74200439453125, 4.904541015625, 5.06707763671875, 5.2296142578125, 5.39215087890625, 5.5546875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 16.0, 18.0, 25.0, 38.0, 62.0, 68.0, 122.0, 173.0, 294.0, 509.0, 783.0, 1303.0, 2260.0, 3947.0, 7121.0, 13454.0, 26432.0, 54661.0, 124783.0, 268067.0, 283316.0, 139514.0, 60150.0, 28810.0, 14613.0, 7825.0, 4260.0, 2395.0, 1325.0, 852.0, 503.0, 296.0, 190.0, 134.0, 78.0, 51.0, 34.0, 26.0, 21.0, 9.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.807373046875, -11.42724609375, -11.047119140625, -10.6669921875, -10.286865234375, -9.90673828125, -9.526611328125, -9.146484375, -8.766357421875, -8.38623046875, -8.006103515625, -7.6259765625, -7.245849609375, -6.86572265625, -6.485595703125, -6.10546875, -5.725341796875, -5.34521484375, -4.965087890625, -4.5849609375, -4.204833984375, -3.82470703125, -3.444580078125, -3.064453125, -2.684326171875, -2.30419921875, -1.924072265625, -1.5439453125, -1.163818359375, -0.78369140625, -0.403564453125, -0.0234375, 0.356689453125, 0.73681640625, 1.116943359375, 1.4970703125, 1.877197265625, 2.25732421875, 2.637451171875, 3.017578125, 3.397705078125, 3.77783203125, 4.157958984375, 4.5380859375, 4.918212890625, 5.29833984375, 5.678466796875, 6.05859375, 6.438720703125, 6.81884765625, 7.198974609375, 7.5791015625, 7.959228515625, 8.33935546875, 8.719482421875, 9.099609375, 9.479736328125, 9.85986328125, 10.239990234375, 10.6201171875, 11.000244140625, 11.38037109375, 11.760498046875, 12.140625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 1.0, 9.0, 10.0, 13.0, 14.0, 14.0, 20.0, 22.0, 17.0, 26.0, 35.0, 48.0, 53.0, 65.0, 71.0, 79.0, 78.0, 75.0, 60.0, 51.0, 43.0, 42.0, 32.0, 24.0, 18.0, 12.0, 7.0, 10.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008878707885742188, -0.0008592531085014343, -0.0008306354284286499, -0.0008020177483558655, -0.0007734000682830811, -0.0007447823882102966, -0.0007161647081375122, -0.0006875470280647278, -0.0006589293479919434, -0.0006303116679191589, -0.0006016939878463745, -0.0005730763077735901, -0.0005444586277008057, -0.0005158409476280212, -0.0004872232675552368, -0.0004586055874824524, -0.00042998790740966797, -0.00040137022733688354, -0.0003727525472640991, -0.0003441348671913147, -0.0003155171871185303, -0.00028689950704574585, -0.0002582818269729614, -0.000229664146900177, -0.00020104646682739258, -0.00017242878675460815, -0.00014381110668182373, -0.0001151934266090393, -8.657574653625488e-05, -5.795806646347046e-05, -2.9340386390686035e-05, -7.227063179016113e-07, 2.7894973754882812e-05, 5.6512653827667236e-05, 8.513033390045166e-05, 0.00011374801397323608, 0.0001423656940460205, 0.00017098337411880493, 0.00019960105419158936, 0.00022821873426437378, 0.0002568364143371582, 0.0002854540944099426, 0.00031407177448272705, 0.0003426894545555115, 0.0003713071346282959, 0.0003999248147010803, 0.00042854249477386475, 0.00045716017484664917, 0.0004857778549194336, 0.000514395534992218, 0.0005430132150650024, 0.0005716308951377869, 0.0006002485752105713, 0.0006288662552833557, 0.0006574839353561401, 0.0006861016154289246, 0.000714719295501709, 0.0007433369755744934, 0.0007719546556472778, 0.0008005723357200623, 0.0008291900157928467, 0.0008578076958656311, 0.0008864253759384155, 0.0009150430560112, 0.0009436607360839844]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 1.0, 10.0, 11.0, 21.0, 32.0, 40.0, 52.0, 75.0, 115.0, 192.0, 240.0, 379.0, 554.0, 797.0, 1303.0, 2050.0, 3091.0, 4856.0, 7722.0, 12611.0, 20275.0, 33985.0, 57398.0, 96471.0, 152021.0, 190058.0, 171335.0, 116294.0, 70379.0, 41409.0, 24411.0, 14709.0, 9266.0, 5786.0, 3638.0, 2368.0, 1565.0, 945.0, 656.0, 463.0, 325.0, 191.0, 139.0, 105.0, 63.0, 45.0, 28.0, 23.0, 15.0, 9.0, 16.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.55859375, -6.35162353515625, -6.1446533203125, -5.93768310546875, -5.730712890625, -5.52374267578125, -5.3167724609375, -5.10980224609375, -4.90283203125, -4.69586181640625, -4.4888916015625, -4.28192138671875, -4.074951171875, -3.86798095703125, -3.6610107421875, -3.45404052734375, -3.2470703125, -3.04010009765625, -2.8331298828125, -2.62615966796875, -2.419189453125, -2.21221923828125, -2.0052490234375, -1.79827880859375, -1.59130859375, -1.38433837890625, -1.1773681640625, -0.97039794921875, -0.763427734375, -0.55645751953125, -0.3494873046875, -0.14251708984375, 0.064453125, 0.27142333984375, 0.4783935546875, 0.68536376953125, 0.892333984375, 1.09930419921875, 1.3062744140625, 1.51324462890625, 1.72021484375, 1.92718505859375, 2.1341552734375, 2.34112548828125, 2.548095703125, 2.75506591796875, 2.9620361328125, 3.16900634765625, 3.3759765625, 3.58294677734375, 3.7899169921875, 3.99688720703125, 4.203857421875, 4.41082763671875, 4.6177978515625, 4.82476806640625, 5.03173828125, 5.23870849609375, 5.4456787109375, 5.65264892578125, 5.859619140625, 6.06658935546875, 6.2735595703125, 6.48052978515625, 6.6875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 8.0, 8.0, 9.0, 18.0, 30.0, 29.0, 35.0, 55.0, 50.0, 97.0, 94.0, 89.0, 78.0, 92.0, 55.0, 56.0, 49.0, 23.0, 30.0, 18.0, 11.0, 18.0, 7.0, 3.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.585357666015625, -3.47540283203125, -3.365447998046875, -3.2554931640625, -3.145538330078125, -3.03558349609375, -2.925628662109375, -2.815673828125, -2.705718994140625, -2.59576416015625, -2.485809326171875, -2.3758544921875, -2.265899658203125, -2.15594482421875, -2.045989990234375, -1.93603515625, -1.826080322265625, -1.71612548828125, -1.606170654296875, -1.4962158203125, -1.386260986328125, -1.27630615234375, -1.166351318359375, -1.056396484375, -0.946441650390625, -0.83648681640625, -0.726531982421875, -0.6165771484375, -0.506622314453125, -0.39666748046875, -0.286712646484375, -0.1767578125, -0.066802978515625, 0.04315185546875, 0.153106689453125, 0.2630615234375, 0.373016357421875, 0.48297119140625, 0.592926025390625, 0.702880859375, 0.812835693359375, 0.92279052734375, 1.032745361328125, 1.1427001953125, 1.252655029296875, 1.36260986328125, 1.472564697265625, 1.58251953125, 1.692474365234375, 1.80242919921875, 1.912384033203125, 2.0223388671875, 2.132293701171875, 2.24224853515625, 2.352203369140625, 2.462158203125, 2.572113037109375, 2.68206787109375, 2.792022705078125, 2.9019775390625, 3.011932373046875, 3.12188720703125, 3.231842041015625, 3.341796875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 8.0, 3.0, 6.0, 9.0, 11.0, 13.0, 12.0, 16.0, 23.0, 25.0, 25.0, 33.0, 35.0, 37.0, 47.0, 39.0, 44.0, 50.0, 63.0, 57.0, 58.0, 55.0, 37.0, 37.0, 31.0, 39.0, 37.0, 29.0, 19.0, 17.0, 21.0, 13.0, 14.0, 6.0, 5.0, 7.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-10.720756530761719, -10.420270919799805, -10.119786262512207, -9.819300651550293, -9.518815994262695, -9.218330383300781, -8.917844772338867, -8.617359161376953, -8.316874504089355, -8.016388893127441, -7.715904235839844, -7.41541862487793, -7.114933490753174, -6.814448356628418, -6.513962745666504, -6.213477611541748, -5.912992477416992, -5.612507343292236, -5.3120222091674805, -5.011536598205566, -4.7110514640808105, -4.410566329956055, -4.110080718994141, -3.8095955848693848, -3.509110450744629, -3.208625316619873, -2.908139944076538, -2.607654571533203, -2.3071694374084473, -2.0066843032836914, -1.7061989307403564, -1.4057135581970215, -1.105229377746582, -0.8047441244125366, -0.5042588710784912, -0.2037736177444458, 0.09671163558959961, 0.397196888923645, 0.6976821422576904, 0.9981675148010254, 1.2986526489257812, 1.5991379022598267, 1.899623155593872, 2.200108528137207, 2.500593662261963, 2.8010787963867188, 3.1015641689300537, 3.4020495414733887, 3.7025346755981445, 4.0030198097229, 4.303504943847656, 4.60399055480957, 4.904475688934326, 5.204960823059082, 5.505446434020996, 5.805931568145752, 6.106416702270508, 6.406901836395264, 6.7073869705200195, 7.007872581481934, 7.3083577156066895, 7.608842849731445, 7.909328460693359, 8.209814071655273, 8.510298728942871]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 11.0, 12.0, 9.0, 12.0, 11.0, 15.0, 13.0, 16.0, 15.0, 21.0, 24.0, 25.0, 36.0, 38.0, 29.0, 48.0, 34.0, 41.0, 42.0, 28.0, 35.0, 52.0, 39.0, 26.0, 33.0, 33.0, 36.0, 26.0, 26.0, 25.0, 27.0, 18.0, 12.0, 23.0, 10.0, 16.0, 16.0, 10.0, 7.0, 10.0, 5.0, 7.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-7.543928146362305, -7.321154594421387, -7.098381042480469, -6.875607490539551, -6.652833938598633, -6.430060386657715, -6.207286834716797, -5.984513759613037, -5.761740207672119, -5.538966655731201, -5.316193103790283, -5.093419551849365, -4.870645999908447, -4.6478729248046875, -4.4250993728637695, -4.202325820922852, -3.9795520305633545, -3.7567784786224365, -3.5340049266815186, -3.3112316131591797, -3.0884580612182617, -2.8656845092773438, -2.642910957336426, -2.420137405395508, -2.19736385345459, -1.9745903015136719, -1.7518168687820435, -1.5290433168411255, -1.306269884109497, -1.083496332168579, -0.8607227802276611, -0.6379493474960327, -0.4151759147644043, -0.1924024075269699, 0.030371099710464478, 0.25314462184906006, 0.47591811418533325, 0.6986916065216064, 0.9214651584625244, 1.1442385911941528, 1.3670121431350708, 1.5897856950759888, 1.8125591278076172, 2.035332679748535, 2.258106231689453, 2.480879783630371, 2.703653335571289, 2.926426649093628, 3.149200201034546, 3.371973752975464, 3.594747304916382, 3.8175206184387207, 4.040294170379639, 4.263067722320557, 4.485841274261475, 4.708614826202393, 4.9313883781433105, 5.1541619300842285, 5.3769354820251465, 5.5997090339660645, 5.822482585906982, 6.045255661010742, 6.26802921295166, 6.490802764892578, 6.713576316833496]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 9.0, 17.0, 31.0, 32.0, 56.0, 78.0, 109.0, 168.0, 303.0, 417.0, 651.0, 1078.0, 1719.0, 2944.0, 4770.0, 8296.0, 14328.0, 25254.0, 45626.0, 86464.0, 166599.0, 331000.0, 614813.0, 894592.0, 850681.0, 545320.0, 283812.0, 144057.0, 75290.0, 40789.0, 22880.0, 12857.0, 7482.0, 4476.0, 2689.0, 1700.0, 1025.0, 644.0, 400.0, 266.0, 204.0, 113.0, 93.0, 50.0, 27.0, 27.0, 23.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.3515625, -7.11358642578125, -6.8756103515625, -6.63763427734375, -6.399658203125, -6.16168212890625, -5.9237060546875, -5.68572998046875, -5.44775390625, -5.20977783203125, -4.9718017578125, -4.73382568359375, -4.495849609375, -4.25787353515625, -4.0198974609375, -3.78192138671875, -3.5439453125, -3.30596923828125, -3.0679931640625, -2.83001708984375, -2.592041015625, -2.35406494140625, -2.1160888671875, -1.87811279296875, -1.64013671875, -1.40216064453125, -1.1641845703125, -0.92620849609375, -0.688232421875, -0.45025634765625, -0.2122802734375, 0.02569580078125, 0.263671875, 0.50164794921875, 0.7396240234375, 0.97760009765625, 1.215576171875, 1.45355224609375, 1.6915283203125, 1.92950439453125, 2.16748046875, 2.40545654296875, 2.6434326171875, 2.88140869140625, 3.119384765625, 3.35736083984375, 3.5953369140625, 3.83331298828125, 4.0712890625, 4.30926513671875, 4.5472412109375, 4.78521728515625, 5.023193359375, 5.26116943359375, 5.4991455078125, 5.73712158203125, 5.97509765625, 6.21307373046875, 6.4510498046875, 6.68902587890625, 6.927001953125, 7.16497802734375, 7.4029541015625, 7.64093017578125, 7.87890625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 10.0, 5.0, 11.0, 15.0, 15.0, 8.0, 18.0, 14.0, 25.0, 19.0, 27.0, 23.0, 24.0, 41.0, 52.0, 33.0, 36.0, 53.0, 42.0, 48.0, 46.0, 33.0, 29.0, 34.0, 33.0, 36.0, 27.0, 22.0, 32.0, 24.0, 22.0, 20.0, 20.0, 17.0, 17.0, 15.0, 6.0, 9.0, 6.0, 5.0, 3.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.4296875, -5.2633056640625, -5.096923828125, -4.9305419921875, -4.76416015625, -4.5977783203125, -4.431396484375, -4.2650146484375, -4.0986328125, -3.9322509765625, -3.765869140625, -3.5994873046875, -3.43310546875, -3.2667236328125, -3.100341796875, -2.9339599609375, -2.767578125, -2.6011962890625, -2.434814453125, -2.2684326171875, -2.10205078125, -1.9356689453125, -1.769287109375, -1.6029052734375, -1.4365234375, -1.2701416015625, -1.103759765625, -0.9373779296875, -0.77099609375, -0.6046142578125, -0.438232421875, -0.2718505859375, -0.10546875, 0.0609130859375, 0.227294921875, 0.3936767578125, 0.56005859375, 0.7264404296875, 0.892822265625, 1.0592041015625, 1.2255859375, 1.3919677734375, 1.558349609375, 1.7247314453125, 1.89111328125, 2.0574951171875, 2.223876953125, 2.3902587890625, 2.556640625, 2.7230224609375, 2.889404296875, 3.0557861328125, 3.22216796875, 3.3885498046875, 3.554931640625, 3.7213134765625, 3.8876953125, 4.0540771484375, 4.220458984375, 4.3868408203125, 4.55322265625, 4.7196044921875, 4.885986328125, 5.0523681640625, 5.21875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 11.0, 31.0, 54.0, 78.0, 118.0, 204.0, 321.0, 506.0, 877.0, 1415.0, 2497.0, 4007.0, 6859.0, 12094.0, 21487.0, 38404.0, 70958.0, 132556.0, 245837.0, 447001.0, 730841.0, 887211.0, 687002.0, 410612.0, 225317.0, 121236.0, 65149.0, 35214.0, 19747.0, 11207.0, 6421.0, 3602.0, 2090.0, 1287.0, 805.0, 461.0, 277.0, 171.0, 98.0, 60.0, 50.0, 33.0, 21.0, 9.0, 5.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0], "bins": [-8.171875, -7.91986083984375, -7.6678466796875, -7.41583251953125, -7.163818359375, -6.91180419921875, -6.6597900390625, -6.40777587890625, -6.15576171875, -5.90374755859375, -5.6517333984375, -5.39971923828125, -5.147705078125, -4.89569091796875, -4.6436767578125, -4.39166259765625, -4.1396484375, -3.88763427734375, -3.6356201171875, -3.38360595703125, -3.131591796875, -2.87957763671875, -2.6275634765625, -2.37554931640625, -2.12353515625, -1.87152099609375, -1.6195068359375, -1.36749267578125, -1.115478515625, -0.86346435546875, -0.6114501953125, -0.35943603515625, -0.107421875, 0.14459228515625, 0.3966064453125, 0.64862060546875, 0.900634765625, 1.15264892578125, 1.4046630859375, 1.65667724609375, 1.90869140625, 2.16070556640625, 2.4127197265625, 2.66473388671875, 2.916748046875, 3.16876220703125, 3.4207763671875, 3.67279052734375, 3.9248046875, 4.17681884765625, 4.4288330078125, 4.68084716796875, 4.932861328125, 5.18487548828125, 5.4368896484375, 5.68890380859375, 5.94091796875, 6.19293212890625, 6.4449462890625, 6.69696044921875, 6.948974609375, 7.20098876953125, 7.4530029296875, 7.70501708984375, 7.95703125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 19.0, 23.0, 24.0, 39.0, 50.0, 42.0, 68.0, 81.0, 105.0, 128.0, 133.0, 173.0, 183.0, 204.0, 222.0, 251.0, 240.0, 261.0, 246.0, 210.0, 229.0, 195.0, 197.0, 153.0, 123.0, 94.0, 91.0, 63.0, 33.0, 43.0, 29.0, 27.0, 12.0, 18.0, 7.0, 11.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.365692138671875, -2.28216552734375, -2.198638916015625, -2.1151123046875, -2.031585693359375, -1.94805908203125, -1.864532470703125, -1.781005859375, -1.697479248046875, -1.61395263671875, -1.530426025390625, -1.4468994140625, -1.363372802734375, -1.27984619140625, -1.196319580078125, -1.11279296875, -1.029266357421875, -0.94573974609375, -0.862213134765625, -0.7786865234375, -0.695159912109375, -0.61163330078125, -0.528106689453125, -0.444580078125, -0.361053466796875, -0.27752685546875, -0.194000244140625, -0.1104736328125, -0.026947021484375, 0.05657958984375, 0.140106201171875, 0.2236328125, 0.307159423828125, 0.39068603515625, 0.474212646484375, 0.5577392578125, 0.641265869140625, 0.72479248046875, 0.808319091796875, 0.891845703125, 0.975372314453125, 1.05889892578125, 1.142425537109375, 1.2259521484375, 1.309478759765625, 1.39300537109375, 1.476531982421875, 1.56005859375, 1.643585205078125, 1.72711181640625, 1.810638427734375, 1.8941650390625, 1.977691650390625, 2.06121826171875, 2.144744873046875, 2.228271484375, 2.311798095703125, 2.39532470703125, 2.478851318359375, 2.5623779296875, 2.645904541015625, 2.72943115234375, 2.812957763671875, 2.896484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 8.0, 6.0, 10.0, 10.0, 13.0, 26.0, 28.0, 29.0, 50.0, 30.0, 37.0, 44.0, 69.0, 54.0, 49.0, 64.0, 58.0, 48.0, 47.0, 53.0, 55.0, 32.0, 28.0, 29.0, 26.0, 3.0, 19.0, 14.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.61583137512207, -8.329607009887695, -8.04338264465332, -7.757158279418945, -7.47093391418457, -7.184709548950195, -6.898484706878662, -6.612260341644287, -6.326035976409912, -6.039811611175537, -5.753587245941162, -5.467362880706787, -5.181138038635254, -4.894913673400879, -4.608689308166504, -4.322464942932129, -4.036240577697754, -3.750016212463379, -3.463791847229004, -3.17756724357605, -2.891342878341675, -2.6051185131073, -2.3188939094543457, -2.0326695442199707, -1.7464451789855957, -1.4602208137512207, -1.1739963293075562, -0.8877719044685364, -0.6015474796295166, -0.3153231143951416, -0.02909862995147705, 0.2571258544921875, 0.5433511734008789, 0.8295755982398987, 1.1158000230789185, 1.402024507522583, 1.688248872756958, 1.974473237991333, 2.260697841644287, 2.546922206878662, 2.833146572113037, 3.119370937347412, 3.405595302581787, 3.691819906234741, 3.978044271469116, 4.26426887512207, 4.550493240356445, 4.83671760559082, 5.122941970825195, 5.40916633605957, 5.695390701293945, 5.98161506652832, 6.267839431762695, 6.55406379699707, 6.8402886390686035, 7.1265130043029785, 7.4127373695373535, 7.6989617347717285, 7.9851861000061035, 8.271410942077637, 8.557635307312012, 8.843859672546387, 9.130084037780762, 9.416308403015137, 9.702532768249512]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 10.0, 12.0, 9.0, 10.0, 13.0, 12.0, 18.0, 25.0, 17.0, 26.0, 29.0, 30.0, 30.0, 48.0, 29.0, 34.0, 37.0, 37.0, 40.0, 44.0, 24.0, 42.0, 40.0, 32.0, 35.0, 41.0, 30.0, 32.0, 21.0, 23.0, 21.0, 22.0, 17.0, 11.0, 15.0, 13.0, 13.0, 10.0, 9.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.515998840332031, -5.333995819091797, -5.151993274688721, -4.969990253448486, -4.78798770904541, -4.605984687805176, -4.423981666564941, -4.241978645324707, -4.059976100921631, -3.8779733180999756, -3.6959705352783203, -3.513967514038086, -3.3319647312164307, -3.1499619483947754, -2.967958927154541, -2.7859561443328857, -2.6039533615112305, -2.421950578689575, -2.23994779586792, -2.0579447746276855, -1.8759419918060303, -1.693939208984375, -1.5119363069534302, -1.3299334049224854, -1.14793062210083, -0.96592777967453, -0.78392493724823, -0.6019220948219299, -0.4199192523956299, -0.23791640996932983, -0.055913567543029785, 0.12608933448791504, 0.3080916404724121, 0.49009448289871216, 0.6720973253250122, 0.8541001677513123, 1.0361030101776123, 1.2181057929992676, 1.4001086950302124, 1.5821115970611572, 1.7641143798828125, 1.9461171627044678, 2.128119945526123, 2.3101229667663574, 2.4921257495880127, 2.674128532409668, 2.8561315536499023, 3.0381343364715576, 3.220137119293213, 3.402139902114868, 3.5841426849365234, 3.766145706176758, 3.948148488998413, 4.130151271820068, 4.312154293060303, 4.494156837463379, 4.676159858703613, 4.858162879943848, 5.040165424346924, 5.222168445587158, 5.404170989990234, 5.586174011230469, 5.768177032470703, 5.9501800537109375, 6.132182598114014]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 5.0, 9.0, 11.0, 18.0, 25.0, 42.0, 50.0, 69.0, 101.0, 146.0, 222.0, 308.0, 482.0, 682.0, 978.0, 1488.0, 2288.0, 3346.0, 5112.0, 7630.0, 11771.0, 17443.0, 27202.0, 41491.0, 63116.0, 90782.0, 124535.0, 148296.0, 143223.0, 114674.0, 81227.0, 55246.0, 36433.0, 24295.0, 15561.0, 10003.0, 6655.0, 4499.0, 2857.0, 2060.0, 1370.0, 922.0, 576.0, 414.0, 280.0, 203.0, 115.0, 95.0, 67.0, 47.0, 35.0, 23.0, 22.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.3515625, -2.27532958984375, -2.1990966796875, -2.12286376953125, -2.046630859375, -1.97039794921875, -1.8941650390625, -1.81793212890625, -1.74169921875, -1.66546630859375, -1.5892333984375, -1.51300048828125, -1.436767578125, -1.36053466796875, -1.2843017578125, -1.20806884765625, -1.1318359375, -1.05560302734375, -0.9793701171875, -0.90313720703125, -0.826904296875, -0.75067138671875, -0.6744384765625, -0.59820556640625, -0.52197265625, -0.44573974609375, -0.3695068359375, -0.29327392578125, -0.217041015625, -0.14080810546875, -0.0645751953125, 0.01165771484375, 0.087890625, 0.16412353515625, 0.2403564453125, 0.31658935546875, 0.392822265625, 0.46905517578125, 0.5452880859375, 0.62152099609375, 0.69775390625, 0.77398681640625, 0.8502197265625, 0.92645263671875, 1.002685546875, 1.07891845703125, 1.1551513671875, 1.23138427734375, 1.3076171875, 1.38385009765625, 1.4600830078125, 1.53631591796875, 1.612548828125, 1.68878173828125, 1.7650146484375, 1.84124755859375, 1.91748046875, 1.99371337890625, 2.0699462890625, 2.14617919921875, 2.222412109375, 2.29864501953125, 2.3748779296875, 2.45111083984375, 2.52734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 8.0, 14.0, 14.0, 19.0, 18.0, 14.0, 25.0, 18.0, 38.0, 30.0, 41.0, 39.0, 40.0, 46.0, 37.0, 40.0, 39.0, 33.0, 42.0, 35.0, 39.0, 41.0, 36.0, 24.0, 25.0, 29.0, 27.0, 15.0, 17.0, 21.0, 10.0, 22.0, 9.0, 17.0, 8.0, 10.0, 6.0, 5.0, 10.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.1484375, -5.950439453125, -5.75244140625, -5.554443359375, -5.3564453125, -5.158447265625, -4.96044921875, -4.762451171875, -4.564453125, -4.366455078125, -4.16845703125, -3.970458984375, -3.7724609375, -3.574462890625, -3.37646484375, -3.178466796875, -2.98046875, -2.782470703125, -2.58447265625, -2.386474609375, -2.1884765625, -1.990478515625, -1.79248046875, -1.594482421875, -1.396484375, -1.198486328125, -1.00048828125, -0.802490234375, -0.6044921875, -0.406494140625, -0.20849609375, -0.010498046875, 0.1875, 0.385498046875, 0.58349609375, 0.781494140625, 0.9794921875, 1.177490234375, 1.37548828125, 1.573486328125, 1.771484375, 1.969482421875, 2.16748046875, 2.365478515625, 2.5634765625, 2.761474609375, 2.95947265625, 3.157470703125, 3.35546875, 3.553466796875, 3.75146484375, 3.949462890625, 4.1474609375, 4.345458984375, 4.54345703125, 4.741455078125, 4.939453125, 5.137451171875, 5.33544921875, 5.533447265625, 5.7314453125, 5.929443359375, 6.12744140625, 6.325439453125, 6.5234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 20.0, 24.0, 35.0, 62.0, 87.0, 123.0, 218.0, 324.0, 526.0, 832.0, 1275.0, 2083.0, 3514.0, 6024.0, 10588.0, 20403.0, 56507.0, 858412.0, 44531.0, 18681.0, 9906.0, 5435.0, 3466.0, 1990.0, 1286.0, 736.0, 505.0, 333.0, 193.0, 143.0, 94.0, 68.0, 43.0, 30.0, 15.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0], "bins": [-8.859375, -8.63470458984375, -8.4100341796875, -8.18536376953125, -7.960693359375, -7.73602294921875, -7.5113525390625, -7.28668212890625, -7.06201171875, -6.83734130859375, -6.6126708984375, -6.38800048828125, -6.163330078125, -5.93865966796875, -5.7139892578125, -5.48931884765625, -5.2646484375, -5.03997802734375, -4.8153076171875, -4.59063720703125, -4.365966796875, -4.14129638671875, -3.9166259765625, -3.69195556640625, -3.46728515625, -3.24261474609375, -3.0179443359375, -2.79327392578125, -2.568603515625, -2.34393310546875, -2.1192626953125, -1.89459228515625, -1.669921875, -1.44525146484375, -1.2205810546875, -0.99591064453125, -0.771240234375, -0.54656982421875, -0.3218994140625, -0.09722900390625, 0.12744140625, 0.35211181640625, 0.5767822265625, 0.80145263671875, 1.026123046875, 1.25079345703125, 1.4754638671875, 1.70013427734375, 1.9248046875, 2.14947509765625, 2.3741455078125, 2.59881591796875, 2.823486328125, 3.04815673828125, 3.2728271484375, 3.49749755859375, 3.72216796875, 3.94683837890625, 4.1715087890625, 4.39617919921875, 4.620849609375, 4.84552001953125, 5.0701904296875, 5.29486083984375, 5.51953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 10.0, 4.0, 11.0, 13.0, 11.0, 20.0, 18.0, 29.0, 23.0, 24.0, 30.0, 30.0, 29.0, 34.0, 30.0, 35.0, 38.0, 41.0, 41.0, 36.0, 33.0, 36.0, 50.0, 42.0, 30.0, 35.0, 44.0, 26.0, 27.0, 23.0, 18.0, 23.0, 24.0, 14.0, 17.0, 8.0, 7.0, 4.0, 14.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.69732666015625, -4.5430908203125, -4.38885498046875, -4.234619140625, -4.08038330078125, -3.9261474609375, -3.77191162109375, -3.61767578125, -3.46343994140625, -3.3092041015625, -3.15496826171875, -3.000732421875, -2.84649658203125, -2.6922607421875, -2.53802490234375, -2.3837890625, -2.22955322265625, -2.0753173828125, -1.92108154296875, -1.766845703125, -1.61260986328125, -1.4583740234375, -1.30413818359375, -1.14990234375, -0.99566650390625, -0.8414306640625, -0.68719482421875, -0.532958984375, -0.37872314453125, -0.2244873046875, -0.07025146484375, 0.083984375, 0.23822021484375, 0.3924560546875, 0.54669189453125, 0.700927734375, 0.85516357421875, 1.0093994140625, 1.16363525390625, 1.31787109375, 1.47210693359375, 1.6263427734375, 1.78057861328125, 1.934814453125, 2.08905029296875, 2.2432861328125, 2.39752197265625, 2.5517578125, 2.70599365234375, 2.8602294921875, 3.01446533203125, 3.168701171875, 3.32293701171875, 3.4771728515625, 3.63140869140625, 3.78564453125, 3.93988037109375, 4.0941162109375, 4.24835205078125, 4.402587890625, 4.55682373046875, 4.7110595703125, 4.86529541015625, 5.01953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 9.0, 14.0, 23.0, 41.0, 57.0, 100.0, 158.0, 229.0, 413.0, 720.0, 1285.0, 2416.0, 4514.0, 9502.0, 24101.0, 615508.0, 348575.0, 22511.0, 9077.0, 4207.0, 2184.0, 1217.0, 660.0, 379.0, 196.0, 113.0, 96.0, 59.0, 39.0, 30.0, 19.0, 18.0, 15.0, 11.0, 11.0, 10.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.05078125, -4.8975830078125, -4.744384765625, -4.5911865234375, -4.43798828125, -4.2847900390625, -4.131591796875, -3.9783935546875, -3.8251953125, -3.6719970703125, -3.518798828125, -3.3656005859375, -3.21240234375, -3.0592041015625, -2.906005859375, -2.7528076171875, -2.599609375, -2.4464111328125, -2.293212890625, -2.1400146484375, -1.98681640625, -1.8336181640625, -1.680419921875, -1.5272216796875, -1.3740234375, -1.2208251953125, -1.067626953125, -0.9144287109375, -0.76123046875, -0.6080322265625, -0.454833984375, -0.3016357421875, -0.1484375, 0.0047607421875, 0.157958984375, 0.3111572265625, 0.46435546875, 0.6175537109375, 0.770751953125, 0.9239501953125, 1.0771484375, 1.2303466796875, 1.383544921875, 1.5367431640625, 1.68994140625, 1.8431396484375, 1.996337890625, 2.1495361328125, 2.302734375, 2.4559326171875, 2.609130859375, 2.7623291015625, 2.91552734375, 3.0687255859375, 3.221923828125, 3.3751220703125, 3.5283203125, 3.6815185546875, 3.834716796875, 3.9879150390625, 4.14111328125, 4.2943115234375, 4.447509765625, 4.6007080078125, 4.75390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 16.0, 10.0, 10.0, 12.0, 19.0, 21.0, 18.0, 23.0, 36.0, 41.0, 60.0, 60.0, 59.0, 67.0, 67.0, 64.0, 55.0, 40.0, 41.0, 46.0, 33.0, 35.0, 26.0, 19.0, 10.0, 18.0, 11.0, 19.0, 5.0, 9.0, 10.0, 6.0, 4.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0002180337905883789, -0.00021154806017875671, -0.00020506232976913452, -0.00019857659935951233, -0.00019209086894989014, -0.00018560513854026794, -0.00017911940813064575, -0.00017263367772102356, -0.00016614794731140137, -0.00015966221690177917, -0.00015317648649215698, -0.0001466907560825348, -0.0001402050256729126, -0.0001337192952632904, -0.0001272335648536682, -0.00012074783444404602, -0.00011426210403442383, -0.00010777637362480164, -0.00010129064321517944, -9.480491280555725e-05, -8.831918239593506e-05, -8.183345198631287e-05, -7.534772157669067e-05, -6.886199116706848e-05, -6.237626075744629e-05, -5.58905303478241e-05, -4.9404799938201904e-05, -4.291906952857971e-05, -3.643333911895752e-05, -2.9947608709335327e-05, -2.3461878299713135e-05, -1.6976147890090942e-05, -1.049041748046875e-05, -4.004687070846558e-06, 2.4810433387756348e-06, 8.966773748397827e-06, 1.545250415802002e-05, 2.1938234567642212e-05, 2.8423964977264404e-05, 3.49096953868866e-05, 4.139542579650879e-05, 4.788115620613098e-05, 5.4366886615753174e-05, 6.0852617025375366e-05, 6.733834743499756e-05, 7.382407784461975e-05, 8.030980825424194e-05, 8.679553866386414e-05, 9.328126907348633e-05, 9.976699948310852e-05, 0.00010625272989273071, 0.0001127384603023529, 0.0001192241907119751, 0.0001257099211215973, 0.00013219565153121948, 0.00013868138194084167, 0.00014516711235046387, 0.00015165284276008606, 0.00015813857316970825, 0.00016462430357933044, 0.00017111003398895264, 0.00017759576439857483, 0.00018408149480819702, 0.00019056722521781921, 0.0001970529556274414]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 14.0, 17.0, 17.0, 37.0, 43.0, 82.0, 131.0, 166.0, 272.0, 421.0, 699.0, 1196.0, 1910.0, 3174.0, 5535.0, 10072.0, 18396.0, 35723.0, 69917.0, 139327.0, 249604.0, 240833.0, 131793.0, 65405.0, 33467.0, 17510.0, 9578.0, 5307.0, 3128.0, 1801.0, 1128.0, 657.0, 396.0, 285.0, 162.0, 116.0, 78.0, 52.0, 39.0, 19.0, 13.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4430389404296875, -1.394866943359375, -1.3466949462890625, -1.29852294921875, -1.2503509521484375, -1.202178955078125, -1.1540069580078125, -1.1058349609375, -1.0576629638671875, -1.009490966796875, -0.9613189697265625, -0.91314697265625, -0.8649749755859375, -0.816802978515625, -0.7686309814453125, -0.720458984375, -0.6722869873046875, -0.624114990234375, -0.5759429931640625, -0.52777099609375, -0.4795989990234375, -0.431427001953125, -0.3832550048828125, -0.3350830078125, -0.2869110107421875, -0.238739013671875, -0.1905670166015625, -0.14239501953125, -0.0942230224609375, -0.046051025390625, 0.0021209716796875, 0.05029296875, 0.0984649658203125, 0.146636962890625, 0.1948089599609375, 0.24298095703125, 0.2911529541015625, 0.339324951171875, 0.3874969482421875, 0.4356689453125, 0.4838409423828125, 0.532012939453125, 0.5801849365234375, 0.62835693359375, 0.6765289306640625, 0.724700927734375, 0.7728729248046875, 0.821044921875, 0.8692169189453125, 0.917388916015625, 0.9655609130859375, 1.01373291015625, 1.0619049072265625, 1.110076904296875, 1.1582489013671875, 1.2064208984375, 1.2545928955078125, 1.302764892578125, 1.3509368896484375, 1.39910888671875, 1.4472808837890625, 1.495452880859375, 1.5436248779296875, 1.591796875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 7.0, 5.0, 9.0, 11.0, 11.0, 15.0, 14.0, 25.0, 27.0, 33.0, 37.0, 47.0, 45.0, 42.0, 47.0, 54.0, 48.0, 53.0, 60.0, 49.0, 36.0, 30.0, 37.0, 46.0, 41.0, 25.0, 23.0, 15.0, 10.0, 13.0, 13.0, 16.0, 11.0, 8.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3779296875, -0.36554718017578125, -0.3531646728515625, -0.34078216552734375, -0.328399658203125, -0.31601715087890625, -0.3036346435546875, -0.29125213623046875, -0.27886962890625, -0.26648712158203125, -0.2541046142578125, -0.24172210693359375, -0.229339599609375, -0.21695709228515625, -0.2045745849609375, -0.19219207763671875, -0.1798095703125, -0.16742706298828125, -0.1550445556640625, -0.14266204833984375, -0.130279541015625, -0.11789703369140625, -0.1055145263671875, -0.09313201904296875, -0.08074951171875, -0.06836700439453125, -0.0559844970703125, -0.04360198974609375, -0.031219482421875, -0.01883697509765625, -0.0064544677734375, 0.00592803955078125, 0.018310546875, 0.03069305419921875, 0.0430755615234375, 0.05545806884765625, 0.067840576171875, 0.08022308349609375, 0.0926055908203125, 0.10498809814453125, 0.11737060546875, 0.12975311279296875, 0.1421356201171875, 0.15451812744140625, 0.166900634765625, 0.17928314208984375, 0.1916656494140625, 0.20404815673828125, 0.2164306640625, 0.22881317138671875, 0.2411956787109375, 0.25357818603515625, 0.265960693359375, 0.27834320068359375, 0.2907257080078125, 0.30310821533203125, 0.31549072265625, 0.32787322998046875, 0.3402557373046875, 0.35263824462890625, 0.365020751953125, 0.37740325927734375, 0.3897857666015625, 0.40216827392578125, 0.41455078125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 5.0, 9.0, 7.0, 15.0, 13.0, 12.0, 29.0, 33.0, 28.0, 40.0, 38.0, 53.0, 37.0, 46.0, 61.0, 72.0, 56.0, 55.0, 51.0, 48.0, 55.0, 25.0, 44.0, 30.0, 28.0, 17.0, 14.0, 14.0, 14.0, 7.0, 7.0, 9.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.376655578613281, -8.093968391418457, -7.811281204223633, -7.528594493865967, -7.245907306671143, -6.963220119476318, -6.680533409118652, -6.397846221923828, -6.115159034729004, -5.83247184753418, -5.5497846603393555, -5.2670979499816895, -4.984410762786865, -4.701723575592041, -4.419036865234375, -4.136349678039551, -3.8536624908447266, -3.5709753036499023, -3.2882883548736572, -3.005601406097412, -2.722914218902588, -2.4402270317077637, -2.1575400829315186, -1.8748530149459839, -1.5921659469604492, -1.3094788789749146, -1.0267918109893799, -0.7441047430038452, -0.46141767501831055, -0.17873060703277588, 0.10395646095275879, 0.38664352893829346, 0.6693305969238281, 0.9520176649093628, 1.2347047328948975, 1.5173918008804321, 1.8000788688659668, 2.082766056060791, 2.365453004837036, 2.6481399536132812, 2.9308271408081055, 3.2135143280029297, 3.496201276779175, 3.77888822555542, 4.061575412750244, 4.344262599945068, 4.626949310302734, 4.909636497497559, 5.192323684692383, 5.475010871887207, 5.757698059082031, 6.040384769439697, 6.3230719566345215, 6.605759143829346, 6.888445854187012, 7.171133041381836, 7.45382022857666, 7.736507415771484, 8.019194602966309, 8.301881790161133, 8.58456802368164, 8.867255210876465, 9.149942398071289, 9.432629585266113, 9.715316772460938]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 8.0, 13.0, 5.0, 16.0, 10.0, 14.0, 16.0, 26.0, 18.0, 34.0, 26.0, 32.0, 34.0, 30.0, 30.0, 48.0, 33.0, 41.0, 34.0, 36.0, 30.0, 47.0, 36.0, 37.0, 45.0, 28.0, 24.0, 27.0, 25.0, 27.0, 20.0, 23.0, 10.0, 19.0, 13.0, 11.0, 14.0, 7.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.696194648742676, -5.513446807861328, -5.3306989669799805, -5.147950649261475, -4.965202808380127, -4.782454967498779, -4.599706649780273, -4.416958808898926, -4.234210968017578, -4.0514631271362305, -3.8687150478363037, -3.685966968536377, -3.5032191276550293, -3.3204712867736816, -3.137723207473755, -2.954975128173828, -2.7722272872924805, -2.589479446411133, -2.406731367111206, -2.2239832878112793, -2.0412354469299316, -1.8584874868392944, -1.6757395267486572, -1.49299156665802, -1.3102436065673828, -1.1274956464767456, -0.9447476863861084, -0.7619997262954712, -0.579251766204834, -0.3965038061141968, -0.21375584602355957, -0.031007885932922363, 0.15174007415771484, 0.33448803424835205, 0.5172359943389893, 0.6999839544296265, 0.8827319145202637, 1.0654798746109009, 1.248227834701538, 1.4309757947921753, 1.6137237548828125, 1.7964717149734497, 1.979219675064087, 2.1619677543640137, 2.3447155952453613, 2.527463436126709, 2.7102115154266357, 2.8929595947265625, 3.07570743560791, 3.258455276489258, 3.4412033557891846, 3.6239514350891113, 3.806699275970459, 3.9894471168518066, 4.1721954345703125, 4.35494327545166, 4.537691116333008, 4.7204389572143555, 4.903186798095703, 5.085935115814209, 5.268682956695557, 5.451430797576904, 5.63417911529541, 5.816926956176758, 5.9996747970581055]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 12.0, 29.0, 44.0, 57.0, 95.0, 141.0, 197.0, 327.0, 534.0, 864.0, 1299.0, 2252.0, 3612.0, 6233.0, 10835.0, 19725.0, 35065.0, 62495.0, 105398.0, 158284.0, 191417.0, 169097.0, 116923.0, 70843.0, 39878.0, 22475.0, 12461.0, 7202.0, 4141.0, 2519.0, 1460.0, 950.0, 604.0, 394.0, 247.0, 166.0, 97.0, 68.0, 37.0, 20.0, 20.0, 8.0, 11.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9638671875, -7.685546875, -7.4072265625, -7.12890625, -6.8505859375, -6.572265625, -6.2939453125, -6.015625, -5.7373046875, -5.458984375, -5.1806640625, -4.90234375, -4.6240234375, -4.345703125, -4.0673828125, -3.7890625, -3.5107421875, -3.232421875, -2.9541015625, -2.67578125, -2.3974609375, -2.119140625, -1.8408203125, -1.5625, -1.2841796875, -1.005859375, -0.7275390625, -0.44921875, -0.1708984375, 0.107421875, 0.3857421875, 0.6640625, 0.9423828125, 1.220703125, 1.4990234375, 1.77734375, 2.0556640625, 2.333984375, 2.6123046875, 2.890625, 3.1689453125, 3.447265625, 3.7255859375, 4.00390625, 4.2822265625, 4.560546875, 4.8388671875, 5.1171875, 5.3955078125, 5.673828125, 5.9521484375, 6.23046875, 6.5087890625, 6.787109375, 7.0654296875, 7.34375, 7.6220703125, 7.900390625, 8.1787109375, 8.45703125, 8.7353515625, 9.013671875, 9.2919921875, 9.5703125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 5.0, 3.0, 12.0, 7.0, 13.0, 10.0, 8.0, 15.0, 19.0, 23.0, 25.0, 17.0, 36.0, 30.0, 29.0, 40.0, 31.0, 46.0, 49.0, 38.0, 38.0, 36.0, 39.0, 25.0, 41.0, 41.0, 38.0, 37.0, 28.0, 31.0, 26.0, 29.0, 16.0, 22.0, 15.0, 15.0, 11.0, 7.0, 10.0, 4.0, 9.0, 5.0, 5.0, 3.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.21771240234375, -5.0369873046875, -4.85626220703125, -4.675537109375, -4.49481201171875, -4.3140869140625, -4.13336181640625, -3.95263671875, -3.77191162109375, -3.5911865234375, -3.41046142578125, -3.229736328125, -3.04901123046875, -2.8682861328125, -2.68756103515625, -2.5068359375, -2.32611083984375, -2.1453857421875, -1.96466064453125, -1.783935546875, -1.60321044921875, -1.4224853515625, -1.24176025390625, -1.06103515625, -0.88031005859375, -0.6995849609375, -0.51885986328125, -0.338134765625, -0.15740966796875, 0.0233154296875, 0.20404052734375, 0.384765625, 0.56549072265625, 0.7462158203125, 0.92694091796875, 1.107666015625, 1.28839111328125, 1.4691162109375, 1.64984130859375, 1.83056640625, 2.01129150390625, 2.1920166015625, 2.37274169921875, 2.553466796875, 2.73419189453125, 2.9149169921875, 3.09564208984375, 3.2763671875, 3.45709228515625, 3.6378173828125, 3.81854248046875, 3.999267578125, 4.17999267578125, 4.3607177734375, 4.54144287109375, 4.72216796875, 4.90289306640625, 5.0836181640625, 5.26434326171875, 5.445068359375, 5.62579345703125, 5.8065185546875, 5.98724365234375, 6.16796875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [8.0, 0.0, 2.0, 6.0, 12.0, 11.0, 15.0, 18.0, 39.0, 46.0, 64.0, 101.0, 153.0, 185.0, 294.0, 420.0, 598.0, 878.0, 1310.0, 1821.0, 2803.0, 4013.0, 6337.0, 9505.0, 14818.0, 22867.0, 36199.0, 55581.0, 83225.0, 115698.0, 142173.0, 147786.0, 126237.0, 93705.0, 63336.0, 41552.0, 26814.0, 17025.0, 11082.0, 7167.0, 4661.0, 3196.0, 2079.0, 1414.0, 1046.0, 663.0, 494.0, 313.0, 242.0, 158.0, 130.0, 65.0, 56.0, 45.0, 37.0, 25.0, 15.0, 8.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0], "bins": [-5.828125, -5.64111328125, -5.4541015625, -5.26708984375, -5.080078125, -4.89306640625, -4.7060546875, -4.51904296875, -4.33203125, -4.14501953125, -3.9580078125, -3.77099609375, -3.583984375, -3.39697265625, -3.2099609375, -3.02294921875, -2.8359375, -2.64892578125, -2.4619140625, -2.27490234375, -2.087890625, -1.90087890625, -1.7138671875, -1.52685546875, -1.33984375, -1.15283203125, -0.9658203125, -0.77880859375, -0.591796875, -0.40478515625, -0.2177734375, -0.03076171875, 0.15625, 0.34326171875, 0.5302734375, 0.71728515625, 0.904296875, 1.09130859375, 1.2783203125, 1.46533203125, 1.65234375, 1.83935546875, 2.0263671875, 2.21337890625, 2.400390625, 2.58740234375, 2.7744140625, 2.96142578125, 3.1484375, 3.33544921875, 3.5224609375, 3.70947265625, 3.896484375, 4.08349609375, 4.2705078125, 4.45751953125, 4.64453125, 4.83154296875, 5.0185546875, 5.20556640625, 5.392578125, 5.57958984375, 5.7666015625, 5.95361328125, 6.140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 5.0, 9.0, 9.0, 8.0, 14.0, 12.0, 20.0, 23.0, 23.0, 28.0, 27.0, 36.0, 35.0, 27.0, 40.0, 42.0, 42.0, 39.0, 39.0, 33.0, 37.0, 49.0, 46.0, 22.0, 37.0, 34.0, 38.0, 33.0, 31.0, 25.0, 25.0, 18.0, 16.0, 11.0, 11.0, 10.0, 6.0, 4.0, 4.0, 4.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.765625, -4.63037109375, -4.4951171875, -4.35986328125, -4.224609375, -4.08935546875, -3.9541015625, -3.81884765625, -3.68359375, -3.54833984375, -3.4130859375, -3.27783203125, -3.142578125, -3.00732421875, -2.8720703125, -2.73681640625, -2.6015625, -2.46630859375, -2.3310546875, -2.19580078125, -2.060546875, -1.92529296875, -1.7900390625, -1.65478515625, -1.51953125, -1.38427734375, -1.2490234375, -1.11376953125, -0.978515625, -0.84326171875, -0.7080078125, -0.57275390625, -0.4375, -0.30224609375, -0.1669921875, -0.03173828125, 0.103515625, 0.23876953125, 0.3740234375, 0.50927734375, 0.64453125, 0.77978515625, 0.9150390625, 1.05029296875, 1.185546875, 1.32080078125, 1.4560546875, 1.59130859375, 1.7265625, 1.86181640625, 1.9970703125, 2.13232421875, 2.267578125, 2.40283203125, 2.5380859375, 2.67333984375, 2.80859375, 2.94384765625, 3.0791015625, 3.21435546875, 3.349609375, 3.48486328125, 3.6201171875, 3.75537109375, 3.890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 7.0, 8.0, 15.0, 19.0, 42.0, 60.0, 55.0, 79.0, 113.0, 193.0, 310.0, 568.0, 957.0, 1871.0, 3903.0, 9381.0, 24283.0, 78425.0, 274249.0, 418800.0, 161109.0, 46024.0, 15751.0, 6096.0, 2835.0, 1412.0, 732.0, 452.0, 266.0, 162.0, 103.0, 80.0, 63.0, 39.0, 25.0, 10.0, 7.0, 10.0, 7.0, 10.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.96875, -19.38623046875, -18.8037109375, -18.22119140625, -17.638671875, -17.05615234375, -16.4736328125, -15.89111328125, -15.30859375, -14.72607421875, -14.1435546875, -13.56103515625, -12.978515625, -12.39599609375, -11.8134765625, -11.23095703125, -10.6484375, -10.06591796875, -9.4833984375, -8.90087890625, -8.318359375, -7.73583984375, -7.1533203125, -6.57080078125, -5.98828125, -5.40576171875, -4.8232421875, -4.24072265625, -3.658203125, -3.07568359375, -2.4931640625, -1.91064453125, -1.328125, -0.74560546875, -0.1630859375, 0.41943359375, 1.001953125, 1.58447265625, 2.1669921875, 2.74951171875, 3.33203125, 3.91455078125, 4.4970703125, 5.07958984375, 5.662109375, 6.24462890625, 6.8271484375, 7.40966796875, 7.9921875, 8.57470703125, 9.1572265625, 9.73974609375, 10.322265625, 10.90478515625, 11.4873046875, 12.06982421875, 12.65234375, 13.23486328125, 13.8173828125, 14.39990234375, 14.982421875, 15.56494140625, 16.1474609375, 16.72998046875, 17.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 13.0, 13.0, 6.0, 17.0, 23.0, 24.0, 51.0, 51.0, 66.0, 91.0, 108.0, 121.0, 100.0, 80.0, 55.0, 38.0, 38.0, 30.0, 19.0, 12.0, 16.0, 5.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009946823120117188, -0.0009517073631286621, -0.0009087324142456055, -0.0008657574653625488, -0.0008227825164794922, -0.0007798075675964355, -0.0007368326187133789, -0.0006938576698303223, -0.0006508827209472656, -0.000607907772064209, -0.0005649328231811523, -0.0005219578742980957, -0.00047898292541503906, -0.0004360079765319824, -0.0003930330276489258, -0.00035005807876586914, -0.0003070831298828125, -0.00026410818099975586, -0.00022113323211669922, -0.00017815828323364258, -0.00013518333435058594, -9.22083854675293e-05, -4.9233436584472656e-05, -6.258487701416016e-06, 3.6716461181640625e-05, 7.969141006469727e-05, 0.0001226663589477539, 0.00016564130783081055, 0.0002086162567138672, 0.00025159120559692383, 0.00029456615447998047, 0.0003375411033630371, 0.00038051605224609375, 0.0004234910011291504, 0.00046646595001220703, 0.0005094408988952637, 0.0005524158477783203, 0.000595390796661377, 0.0006383657455444336, 0.0006813406944274902, 0.0007243156433105469, 0.0007672905921936035, 0.0008102655410766602, 0.0008532404899597168, 0.0008962154388427734, 0.0009391903877258301, 0.0009821653366088867, 0.0010251402854919434, 0.001068115234375, 0.0011110901832580566, 0.0011540651321411133, 0.00119704008102417, 0.0012400150299072266, 0.0012829899787902832, 0.0013259649276733398, 0.0013689398765563965, 0.0014119148254394531, 0.0014548897743225098, 0.0014978647232055664, 0.001540839672088623, 0.0015838146209716797, 0.0016267895698547363, 0.001669764518737793, 0.0017127394676208496, 0.0017557144165039062]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 11.0, 9.0, 24.0, 21.0, 38.0, 53.0, 66.0, 85.0, 120.0, 165.0, 249.0, 407.0, 666.0, 1371.0, 3293.0, 9587.0, 36036.0, 156658.0, 447038.0, 292679.0, 72490.0, 17508.0, 5412.0, 2035.0, 966.0, 526.0, 349.0, 170.0, 135.0, 102.0, 54.0, 52.0, 33.0, 34.0, 25.0, 18.0, 13.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.8125, -20.21337890625, -19.6142578125, -19.01513671875, -18.416015625, -17.81689453125, -17.2177734375, -16.61865234375, -16.01953125, -15.42041015625, -14.8212890625, -14.22216796875, -13.623046875, -13.02392578125, -12.4248046875, -11.82568359375, -11.2265625, -10.62744140625, -10.0283203125, -9.42919921875, -8.830078125, -8.23095703125, -7.6318359375, -7.03271484375, -6.43359375, -5.83447265625, -5.2353515625, -4.63623046875, -4.037109375, -3.43798828125, -2.8388671875, -2.23974609375, -1.640625, -1.04150390625, -0.4423828125, 0.15673828125, 0.755859375, 1.35498046875, 1.9541015625, 2.55322265625, 3.15234375, 3.75146484375, 4.3505859375, 4.94970703125, 5.548828125, 6.14794921875, 6.7470703125, 7.34619140625, 7.9453125, 8.54443359375, 9.1435546875, 9.74267578125, 10.341796875, 10.94091796875, 11.5400390625, 12.13916015625, 12.73828125, 13.33740234375, 13.9365234375, 14.53564453125, 15.134765625, 15.73388671875, 16.3330078125, 16.93212890625, 17.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 10.0, 17.0, 25.0, 35.0, 39.0, 71.0, 121.0, 119.0, 128.0, 113.0, 99.0, 65.0, 49.0, 32.0, 20.0, 22.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.949462890625, -4.80517578125, -4.660888671875, -4.5166015625, -4.372314453125, -4.22802734375, -4.083740234375, -3.939453125, -3.795166015625, -3.65087890625, -3.506591796875, -3.3623046875, -3.218017578125, -3.07373046875, -2.929443359375, -2.78515625, -2.640869140625, -2.49658203125, -2.352294921875, -2.2080078125, -2.063720703125, -1.91943359375, -1.775146484375, -1.630859375, -1.486572265625, -1.34228515625, -1.197998046875, -1.0537109375, -0.909423828125, -0.76513671875, -0.620849609375, -0.4765625, -0.332275390625, -0.18798828125, -0.043701171875, 0.1005859375, 0.244873046875, 0.38916015625, 0.533447265625, 0.677734375, 0.822021484375, 0.96630859375, 1.110595703125, 1.2548828125, 1.399169921875, 1.54345703125, 1.687744140625, 1.83203125, 1.976318359375, 2.12060546875, 2.264892578125, 2.4091796875, 2.553466796875, 2.69775390625, 2.842041015625, 2.986328125, 3.130615234375, 3.27490234375, 3.419189453125, 3.5634765625, 3.707763671875, 3.85205078125, 3.996337890625, 4.140625]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 11.0, 11.0, 17.0, 8.0, 14.0, 20.0, 28.0, 45.0, 48.0, 52.0, 49.0, 58.0, 71.0, 65.0, 59.0, 52.0, 50.0, 55.0, 47.0, 38.0, 31.0, 31.0, 33.0, 19.0, 23.0, 12.0, 11.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.411050796508789, -8.113692283630371, -7.816334247589111, -7.518975734710693, -7.221617698669434, -6.924259185791016, -6.626900672912598, -6.329542636871338, -6.032184600830078, -5.73482608795166, -5.4374680519104, -5.140109539031982, -4.842751502990723, -4.545392990112305, -4.248034477233887, -3.950676441192627, -3.653317928314209, -3.35595965385437, -3.0586013793945312, -2.7612428665161133, -2.4638848304748535, -2.1665263175964355, -1.8691680431365967, -1.5718097686767578, -1.274451494216919, -0.9770932197570801, -0.6797348856925964, -0.3823765516281128, -0.08501827716827393, 0.21233999729156494, 0.5096983909606934, 0.8070566654205322, 1.104414939880371, 1.40177321434021, 1.6991314888000488, 1.9964898824691772, 2.2938480377197266, 2.5912065505981445, 2.8885648250579834, 3.1859230995178223, 3.483281373977661, 3.7806396484375, 4.077998161315918, 4.375356197357178, 4.672714710235596, 4.9700727462768555, 5.267431259155273, 5.564789772033691, 5.862147808074951, 6.159506320953369, 6.456864356994629, 6.754222869873047, 7.051580905914307, 7.348939418792725, 7.646297454833984, 7.943655967712402, 8.24101448059082, 8.538372993469238, 8.835731506347656, 9.133089065551758, 9.430447578430176, 9.727806091308594, 10.025164604187012, 10.32252311706543, 10.619880676269531]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 2.0, 7.0, 5.0, 2.0, 2.0, 9.0, 10.0, 6.0, 14.0, 16.0, 15.0, 18.0, 18.0, 34.0, 29.0, 17.0, 30.0, 27.0, 28.0, 27.0, 36.0, 35.0, 47.0, 38.0, 48.0, 27.0, 47.0, 36.0, 28.0, 22.0, 39.0, 32.0, 30.0, 26.0, 25.0, 28.0, 21.0, 14.0, 20.0, 13.0, 10.0, 19.0, 14.0, 5.0, 7.0, 5.0, 5.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.186312198638916, -6.003700256347656, -5.8210883140563965, -5.638476371765137, -5.455864429473877, -5.273252487182617, -5.090640544891357, -4.908028602600098, -4.725416660308838, -4.542804718017578, -4.360192775726318, -4.177580833435059, -3.994968891143799, -3.812356948852539, -3.6297450065612793, -3.4471330642700195, -3.2645208835601807, -3.081908941268921, -2.899296998977661, -2.7166850566864014, -2.5340731143951416, -2.351461172103882, -2.168848991394043, -1.9862371683120728, -1.803625226020813, -1.6210132837295532, -1.4384013414382935, -1.2557892799377441, -1.0731773376464844, -0.8905654549598694, -0.7079534530639648, -0.5253415107727051, -0.3427295684814453, -0.16011761128902435, 0.022494345903396606, 0.20510631799697876, 0.3877182602882385, 0.5703302025794983, 0.7529422044754028, 0.9355541467666626, 1.1181660890579224, 1.3007780313491821, 1.483389973640442, 1.6660020351409912, 1.848613977432251, 2.0312259197235107, 2.2138378620147705, 2.3964498043060303, 2.57906174659729, 2.76167368888855, 2.9442856311798096, 3.1268975734710693, 3.309509515762329, 3.492121458053589, 3.6747336387634277, 3.8573455810546875, 4.039957523345947, 4.222569465637207, 4.405181407928467, 4.587793350219727, 4.770405292510986, 4.953017234802246, 5.135629177093506, 5.318241119384766, 5.500853061676025]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 7.0, 7.0, 7.0, 10.0, 14.0, 31.0, 32.0, 68.0, 70.0, 163.0, 203.0, 274.0, 407.0, 625.0, 1017.0, 1546.0, 2396.0, 3777.0, 5652.0, 9263.0, 15120.0, 25485.0, 44816.0, 79050.0, 145080.0, 273344.0, 506066.0, 790298.0, 860680.0, 628876.0, 359274.0, 192795.0, 104658.0, 58145.0, 33571.0, 19636.0, 11622.0, 7274.0, 4510.0, 2843.0, 1927.0, 1185.0, 808.0, 556.0, 379.0, 214.0, 178.0, 109.0, 96.0, 50.0, 31.0, 19.0, 18.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.140625, -5.94390869140625, -5.7471923828125, -5.55047607421875, -5.353759765625, -5.15704345703125, -4.9603271484375, -4.76361083984375, -4.56689453125, -4.37017822265625, -4.1734619140625, -3.97674560546875, -3.780029296875, -3.58331298828125, -3.3865966796875, -3.18988037109375, -2.9931640625, -2.79644775390625, -2.5997314453125, -2.40301513671875, -2.206298828125, -2.00958251953125, -1.8128662109375, -1.61614990234375, -1.41943359375, -1.22271728515625, -1.0260009765625, -0.82928466796875, -0.632568359375, -0.43585205078125, -0.2391357421875, -0.04241943359375, 0.154296875, 0.35101318359375, 0.5477294921875, 0.74444580078125, 0.941162109375, 1.13787841796875, 1.3345947265625, 1.53131103515625, 1.72802734375, 1.92474365234375, 2.1214599609375, 2.31817626953125, 2.514892578125, 2.71160888671875, 2.9083251953125, 3.10504150390625, 3.3017578125, 3.49847412109375, 3.6951904296875, 3.89190673828125, 4.088623046875, 4.28533935546875, 4.4820556640625, 4.67877197265625, 4.87548828125, 5.07220458984375, 5.2689208984375, 5.46563720703125, 5.662353515625, 5.85906982421875, 6.0557861328125, 6.25250244140625, 6.44921875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 6.0, 2.0, 3.0, 3.0, 9.0, 5.0, 6.0, 13.0, 5.0, 6.0, 9.0, 16.0, 25.0, 23.0, 29.0, 26.0, 23.0, 36.0, 20.0, 34.0, 19.0, 38.0, 39.0, 41.0, 27.0, 29.0, 49.0, 33.0, 48.0, 31.0, 38.0, 32.0, 32.0, 34.0, 24.0, 20.0, 29.0, 21.0, 21.0, 19.0, 17.0, 14.0, 7.0, 11.0, 6.0, 12.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.724609375, -3.599578857421875, -3.47454833984375, -3.349517822265625, -3.2244873046875, -3.099456787109375, -2.97442626953125, -2.849395751953125, -2.724365234375, -2.599334716796875, -2.47430419921875, -2.349273681640625, -2.2242431640625, -2.099212646484375, -1.97418212890625, -1.849151611328125, -1.72412109375, -1.599090576171875, -1.47406005859375, -1.349029541015625, -1.2239990234375, -1.098968505859375, -0.97393798828125, -0.848907470703125, -0.723876953125, -0.598846435546875, -0.47381591796875, -0.348785400390625, -0.2237548828125, -0.098724365234375, 0.02630615234375, 0.151336669921875, 0.2763671875, 0.401397705078125, 0.52642822265625, 0.651458740234375, 0.7764892578125, 0.901519775390625, 1.02655029296875, 1.151580810546875, 1.276611328125, 1.401641845703125, 1.52667236328125, 1.651702880859375, 1.7767333984375, 1.901763916015625, 2.02679443359375, 2.151824951171875, 2.27685546875, 2.401885986328125, 2.52691650390625, 2.651947021484375, 2.7769775390625, 2.902008056640625, 3.02703857421875, 3.152069091796875, 3.277099609375, 3.402130126953125, 3.52716064453125, 3.652191162109375, 3.7772216796875, 3.902252197265625, 4.02728271484375, 4.152313232421875, 4.27734375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 4.0, 7.0, 15.0, 12.0, 23.0, 38.0, 58.0, 100.0, 147.0, 210.0, 293.0, 423.0, 713.0, 1105.0, 1669.0, 2598.0, 4135.0, 6563.0, 10398.0, 17365.0, 28614.0, 48184.0, 82582.0, 142720.0, 241622.0, 402969.0, 608902.0, 753030.0, 672889.0, 465473.0, 288033.0, 169470.0, 99109.0, 57487.0, 34194.0, 20221.0, 12338.0, 7460.0, 4723.0, 3009.0, 1900.0, 1213.0, 802.0, 501.0, 301.0, 225.0, 148.0, 95.0, 81.0, 36.0, 27.0, 20.0, 15.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-5.67578125, -5.49652099609375, -5.3172607421875, -5.13800048828125, -4.958740234375, -4.77947998046875, -4.6002197265625, -4.42095947265625, -4.24169921875, -4.06243896484375, -3.8831787109375, -3.70391845703125, -3.524658203125, -3.34539794921875, -3.1661376953125, -2.98687744140625, -2.8076171875, -2.62835693359375, -2.4490966796875, -2.26983642578125, -2.090576171875, -1.91131591796875, -1.7320556640625, -1.55279541015625, -1.37353515625, -1.19427490234375, -1.0150146484375, -0.83575439453125, -0.656494140625, -0.47723388671875, -0.2979736328125, -0.11871337890625, 0.060546875, 0.23980712890625, 0.4190673828125, 0.59832763671875, 0.777587890625, 0.95684814453125, 1.1361083984375, 1.31536865234375, 1.49462890625, 1.67388916015625, 1.8531494140625, 2.03240966796875, 2.211669921875, 2.39093017578125, 2.5701904296875, 2.74945068359375, 2.9287109375, 3.10797119140625, 3.2872314453125, 3.46649169921875, 3.645751953125, 3.82501220703125, 4.0042724609375, 4.18353271484375, 4.36279296875, 4.54205322265625, 4.7213134765625, 4.90057373046875, 5.079833984375, 5.25909423828125, 5.4383544921875, 5.61761474609375, 5.796875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 10.0, 2.0, 12.0, 14.0, 20.0, 21.0, 25.0, 26.0, 23.0, 41.0, 55.0, 67.0, 93.0, 102.0, 132.0, 163.0, 182.0, 172.0, 211.0, 246.0, 254.0, 244.0, 258.0, 240.0, 231.0, 186.0, 164.0, 167.0, 138.0, 107.0, 90.0, 74.0, 59.0, 50.0, 36.0, 31.0, 28.0, 18.0, 16.0, 18.0, 14.0, 8.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.041015625, -1.974884033203125, -1.90875244140625, -1.842620849609375, -1.7764892578125, -1.710357666015625, -1.64422607421875, -1.578094482421875, -1.511962890625, -1.445831298828125, -1.37969970703125, -1.313568115234375, -1.2474365234375, -1.181304931640625, -1.11517333984375, -1.049041748046875, -0.98291015625, -0.916778564453125, -0.85064697265625, -0.784515380859375, -0.7183837890625, -0.652252197265625, -0.58612060546875, -0.519989013671875, -0.453857421875, -0.387725830078125, -0.32159423828125, -0.255462646484375, -0.1893310546875, -0.123199462890625, -0.05706787109375, 0.009063720703125, 0.0751953125, 0.141326904296875, 0.20745849609375, 0.273590087890625, 0.3397216796875, 0.405853271484375, 0.47198486328125, 0.538116455078125, 0.604248046875, 0.670379638671875, 0.73651123046875, 0.802642822265625, 0.8687744140625, 0.934906005859375, 1.00103759765625, 1.067169189453125, 1.13330078125, 1.199432373046875, 1.26556396484375, 1.331695556640625, 1.3978271484375, 1.463958740234375, 1.53009033203125, 1.596221923828125, 1.662353515625, 1.728485107421875, 1.79461669921875, 1.860748291015625, 1.9268798828125, 1.993011474609375, 2.05914306640625, 2.125274658203125, 2.19140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 0.0, 5.0, 7.0, 9.0, 11.0, 17.0, 14.0, 33.0, 33.0, 29.0, 38.0, 55.0, 55.0, 55.0, 81.0, 84.0, 67.0, 57.0, 57.0, 55.0, 49.0, 49.0, 25.0, 32.0, 20.0, 17.0, 14.0, 9.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.106962203979492, -7.835235118865967, -7.5635085105896, -7.291781425476074, -7.020054817199707, -6.748327732086182, -6.476600646972656, -6.204874038696289, -5.933146953582764, -5.661419868469238, -5.389693260192871, -5.117966175079346, -4.84623908996582, -4.574512481689453, -4.302785396575928, -4.031058311462402, -3.759331703186035, -3.487604856491089, -3.2158780097961426, -2.944150924682617, -2.672424077987671, -2.4006972312927246, -2.128970146179199, -1.857243299484253, -1.5855164527893066, -1.3137896060943604, -1.0420626401901245, -0.7703357338905334, -0.4986088275909424, -0.2268819808959961, 0.044844985008239746, 0.3165719509124756, 0.5882987976074219, 0.8600257039070129, 1.131752610206604, 1.4034795761108398, 1.6752064228057861, 1.9469332695007324, 2.218660354614258, 2.490387201309204, 2.7621140480041504, 3.0338408946990967, 3.305567741394043, 3.5772948265075684, 3.8490216732025146, 4.120748519897461, 4.392475605010986, 4.664202690124512, 4.935929298400879, 5.207656383514404, 5.4793829917907715, 5.751110076904297, 6.022836685180664, 6.2945637702941895, 6.566290855407715, 6.838017463684082, 7.109744548797607, 7.381471633911133, 7.6531982421875, 7.924925327301025, 8.19665241241455, 8.468379020690918, 8.740105628967285, 9.011833190917969, 9.283559799194336]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 9.0, 12.0, 8.0, 7.0, 16.0, 18.0, 18.0, 23.0, 28.0, 26.0, 23.0, 39.0, 36.0, 40.0, 38.0, 38.0, 51.0, 45.0, 38.0, 37.0, 49.0, 41.0, 36.0, 31.0, 30.0, 35.0, 33.0, 21.0, 23.0, 21.0, 26.0, 23.0, 14.0, 14.0, 11.0, 7.0, 8.0, 11.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.849778175354004, -5.6817708015441895, -5.513762950897217, -5.345755577087402, -5.17774772644043, -5.009740352630615, -4.841732978820801, -4.673725128173828, -4.5057172775268555, -4.337709903717041, -4.169702053070068, -4.001694679260254, -3.8336868286132812, -3.665679454803467, -3.4976718425750732, -3.3296642303466797, -3.1616568565368652, -2.9936492443084717, -2.825641632080078, -2.6576342582702637, -2.489626407623291, -2.3216190338134766, -2.153611421585083, -1.9856038093566895, -1.817596197128296, -1.6495885848999023, -1.4815809726715088, -1.3135734796524048, -1.1455658674240112, -0.9775582551956177, -0.8095507621765137, -0.6415431499481201, -0.47353506088256836, -0.3055274784564972, -0.13751989603042603, 0.030487656593322754, 0.1984952688217163, 0.36650288105010986, 0.5345103740692139, 0.7025179862976074, 0.870525598526001, 1.0385332107543945, 1.206540822982788, 1.374548316001892, 1.5425559282302856, 1.7105635404586792, 1.8785710334777832, 2.0465786457061768, 2.2145862579345703, 2.382593870162964, 2.5506014823913574, 2.718608856201172, 2.8866167068481445, 3.054624080657959, 3.2226316928863525, 3.390639305114746, 3.5586469173431396, 3.726654529571533, 3.8946621417999268, 4.06266975402832, 4.230677127838135, 4.398684978485107, 4.566692352294922, 4.7347002029418945, 4.902707576751709]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 9.0, 23.0, 19.0, 30.0, 56.0, 79.0, 121.0, 199.0, 284.0, 429.0, 619.0, 937.0, 1306.0, 2049.0, 3371.0, 5073.0, 7916.0, 12267.0, 19274.0, 30350.0, 47941.0, 75047.0, 111741.0, 151599.0, 165040.0, 138344.0, 97719.0, 63699.0, 40961.0, 25758.0, 16423.0, 10638.0, 6805.0, 4282.0, 2793.0, 1798.0, 1191.0, 814.0, 513.0, 330.0, 231.0, 156.0, 94.0, 69.0, 57.0, 34.0, 20.0, 17.0, 12.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.5595703125, -1.5081329345703125, -1.456695556640625, -1.4052581787109375, -1.35382080078125, -1.3023834228515625, -1.250946044921875, -1.1995086669921875, -1.1480712890625, -1.0966339111328125, -1.045196533203125, -0.9937591552734375, -0.94232177734375, -0.8908843994140625, -0.839447021484375, -0.7880096435546875, -0.736572265625, -0.6851348876953125, -0.633697509765625, -0.5822601318359375, -0.53082275390625, -0.4793853759765625, -0.427947998046875, -0.3765106201171875, -0.3250732421875, -0.2736358642578125, -0.222198486328125, -0.1707611083984375, -0.11932373046875, -0.0678863525390625, -0.016448974609375, 0.0349884033203125, 0.08642578125, 0.1378631591796875, 0.189300537109375, 0.2407379150390625, 0.29217529296875, 0.3436126708984375, 0.395050048828125, 0.4464874267578125, 0.4979248046875, 0.5493621826171875, 0.600799560546875, 0.6522369384765625, 0.70367431640625, 0.7551116943359375, 0.806549072265625, 0.8579864501953125, 0.909423828125, 0.9608612060546875, 1.012298583984375, 1.0637359619140625, 1.11517333984375, 1.1666107177734375, 1.218048095703125, 1.2694854736328125, 1.3209228515625, 1.3723602294921875, 1.423797607421875, 1.4752349853515625, 1.52667236328125, 1.5781097412109375, 1.629547119140625, 1.6809844970703125, 1.732421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 7.0, 5.0, 13.0, 12.0, 17.0, 26.0, 21.0, 27.0, 30.0, 35.0, 43.0, 31.0, 39.0, 31.0, 53.0, 50.0, 34.0, 40.0, 50.0, 40.0, 47.0, 40.0, 42.0, 24.0, 31.0, 31.0, 22.0, 21.0, 22.0, 16.0, 17.0, 25.0, 7.0, 8.0, 11.0, 12.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.2890625, -6.106201171875, -5.92333984375, -5.740478515625, -5.5576171875, -5.374755859375, -5.19189453125, -5.009033203125, -4.826171875, -4.643310546875, -4.46044921875, -4.277587890625, -4.0947265625, -3.911865234375, -3.72900390625, -3.546142578125, -3.36328125, -3.180419921875, -2.99755859375, -2.814697265625, -2.6318359375, -2.448974609375, -2.26611328125, -2.083251953125, -1.900390625, -1.717529296875, -1.53466796875, -1.351806640625, -1.1689453125, -0.986083984375, -0.80322265625, -0.620361328125, -0.4375, -0.254638671875, -0.07177734375, 0.111083984375, 0.2939453125, 0.476806640625, 0.65966796875, 0.842529296875, 1.025390625, 1.208251953125, 1.39111328125, 1.573974609375, 1.7568359375, 1.939697265625, 2.12255859375, 2.305419921875, 2.48828125, 2.671142578125, 2.85400390625, 3.036865234375, 3.2197265625, 3.402587890625, 3.58544921875, 3.768310546875, 3.951171875, 4.134033203125, 4.31689453125, 4.499755859375, 4.6826171875, 4.865478515625, 5.04833984375, 5.231201171875, 5.4140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 14.0, 18.0, 20.0, 30.0, 34.0, 56.0, 90.0, 111.0, 153.0, 202.0, 316.0, 453.0, 606.0, 916.0, 1330.0, 1950.0, 2878.0, 4533.0, 7138.0, 11989.0, 22749.0, 81009.0, 824131.0, 42079.0, 18066.0, 9979.0, 5996.0, 3784.0, 2440.0, 1703.0, 1193.0, 815.0, 484.0, 360.0, 247.0, 199.0, 128.0, 94.0, 82.0, 30.0, 41.0, 27.0, 16.0, 9.0, 8.0, 11.0, 3.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.078125, -3.947998046875, -3.81787109375, -3.687744140625, -3.5576171875, -3.427490234375, -3.29736328125, -3.167236328125, -3.037109375, -2.906982421875, -2.77685546875, -2.646728515625, -2.5166015625, -2.386474609375, -2.25634765625, -2.126220703125, -1.99609375, -1.865966796875, -1.73583984375, -1.605712890625, -1.4755859375, -1.345458984375, -1.21533203125, -1.085205078125, -0.955078125, -0.824951171875, -0.69482421875, -0.564697265625, -0.4345703125, -0.304443359375, -0.17431640625, -0.044189453125, 0.0859375, 0.216064453125, 0.34619140625, 0.476318359375, 0.6064453125, 0.736572265625, 0.86669921875, 0.996826171875, 1.126953125, 1.257080078125, 1.38720703125, 1.517333984375, 1.6474609375, 1.777587890625, 1.90771484375, 2.037841796875, 2.16796875, 2.298095703125, 2.42822265625, 2.558349609375, 2.6884765625, 2.818603515625, 2.94873046875, 3.078857421875, 3.208984375, 3.339111328125, 3.46923828125, 3.599365234375, 3.7294921875, 3.859619140625, 3.98974609375, 4.119873046875, 4.25]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 5.0, 8.0, 10.0, 13.0, 16.0, 20.0, 17.0, 20.0, 23.0, 24.0, 27.0, 34.0, 30.0, 34.0, 43.0, 31.0, 55.0, 54.0, 44.0, 45.0, 36.0, 37.0, 39.0, 44.0, 42.0, 41.0, 33.0, 19.0, 25.0, 16.0, 23.0, 19.0, 11.0, 7.0, 6.0, 13.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9140625, -3.7760009765625, -3.637939453125, -3.4998779296875, -3.36181640625, -3.2237548828125, -3.085693359375, -2.9476318359375, -2.8095703125, -2.6715087890625, -2.533447265625, -2.3953857421875, -2.25732421875, -2.1192626953125, -1.981201171875, -1.8431396484375, -1.705078125, -1.5670166015625, -1.428955078125, -1.2908935546875, -1.15283203125, -1.0147705078125, -0.876708984375, -0.7386474609375, -0.6005859375, -0.4625244140625, -0.324462890625, -0.1864013671875, -0.04833984375, 0.0897216796875, 0.227783203125, 0.3658447265625, 0.50390625, 0.6419677734375, 0.780029296875, 0.9180908203125, 1.05615234375, 1.1942138671875, 1.332275390625, 1.4703369140625, 1.6083984375, 1.7464599609375, 1.884521484375, 2.0225830078125, 2.16064453125, 2.2987060546875, 2.436767578125, 2.5748291015625, 2.712890625, 2.8509521484375, 2.989013671875, 3.1270751953125, 3.26513671875, 3.4031982421875, 3.541259765625, 3.6793212890625, 3.8173828125, 3.9554443359375, 4.093505859375, 4.2315673828125, 4.36962890625, 4.5076904296875, 4.645751953125, 4.7838134765625, 4.921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 19.0, 13.0, 11.0, 28.0, 35.0, 51.0, 68.0, 66.0, 115.0, 158.0, 191.0, 281.0, 447.0, 654.0, 970.0, 1567.0, 2405.0, 3785.0, 6177.0, 10946.0, 20743.0, 73722.0, 851059.0, 35683.0, 16061.0, 8812.0, 5107.0, 3223.0, 2031.0, 1299.0, 867.0, 584.0, 405.0, 260.0, 201.0, 151.0, 91.0, 77.0, 50.0, 33.0, 30.0, 21.0, 21.0, 12.0, 8.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.759765625, -1.706939697265625, -1.65411376953125, -1.601287841796875, -1.5484619140625, -1.495635986328125, -1.44281005859375, -1.389984130859375, -1.337158203125, -1.284332275390625, -1.23150634765625, -1.178680419921875, -1.1258544921875, -1.073028564453125, -1.02020263671875, -0.967376708984375, -0.91455078125, -0.861724853515625, -0.80889892578125, -0.756072998046875, -0.7032470703125, -0.650421142578125, -0.59759521484375, -0.544769287109375, -0.491943359375, -0.439117431640625, -0.38629150390625, -0.333465576171875, -0.2806396484375, -0.227813720703125, -0.17498779296875, -0.122161865234375, -0.0693359375, -0.016510009765625, 0.03631591796875, 0.089141845703125, 0.1419677734375, 0.194793701171875, 0.24761962890625, 0.300445556640625, 0.353271484375, 0.406097412109375, 0.45892333984375, 0.511749267578125, 0.5645751953125, 0.617401123046875, 0.67022705078125, 0.723052978515625, 0.77587890625, 0.828704833984375, 0.88153076171875, 0.934356689453125, 0.9871826171875, 1.040008544921875, 1.09283447265625, 1.145660400390625, 1.198486328125, 1.251312255859375, 1.30413818359375, 1.356964111328125, 1.4097900390625, 1.462615966796875, 1.51544189453125, 1.568267822265625, 1.62109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 19.0, 22.0, 37.0, 57.0, 71.0, 98.0, 113.0, 122.0, 104.0, 78.0, 67.0, 44.0, 32.0, 19.0, 17.0, 17.0, 2.0, 8.0, 7.0, 4.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00021076202392578125, -0.00020478293299674988, -0.0001988038420677185, -0.00019282475113868713, -0.00018684566020965576, -0.0001808665692806244, -0.00017488747835159302, -0.00016890838742256165, -0.00016292929649353027, -0.0001569502055644989, -0.00015097111463546753, -0.00014499202370643616, -0.00013901293277740479, -0.0001330338418483734, -0.00012705475091934204, -0.00012107565999031067, -0.0001150965690612793, -0.00010911747813224792, -0.00010313838720321655, -9.715929627418518e-05, -9.118020534515381e-05, -8.520111441612244e-05, -7.922202348709106e-05, -7.324293255805969e-05, -6.726384162902832e-05, -6.128475069999695e-05, -5.5305659770965576e-05, -4.9326568841934204e-05, -4.334747791290283e-05, -3.736838698387146e-05, -3.138929605484009e-05, -2.5410205125808716e-05, -1.9431114196777344e-05, -1.3452023267745972e-05, -7.4729323387146e-06, -1.4938414096832275e-06, 4.4852495193481445e-06, 1.0464340448379517e-05, 1.644343137741089e-05, 2.242252230644226e-05, 2.8401613235473633e-05, 3.4380704164505005e-05, 4.035979509353638e-05, 4.633888602256775e-05, 5.231797695159912e-05, 5.829706788063049e-05, 6.427615880966187e-05, 7.025524973869324e-05, 7.623434066772461e-05, 8.221343159675598e-05, 8.819252252578735e-05, 9.417161345481873e-05, 0.0001001507043838501, 0.00010612979531288147, 0.00011210888624191284, 0.00011808797717094421, 0.00012406706809997559, 0.00013004615902900696, 0.00013602524995803833, 0.0001420043408870697, 0.00014798343181610107, 0.00015396252274513245, 0.00015994161367416382, 0.0001659207046031952, 0.00017189979553222656]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 7.0, 7.0, 13.0, 21.0, 34.0, 42.0, 61.0, 76.0, 116.0, 177.0, 260.0, 402.0, 629.0, 898.0, 1407.0, 2186.0, 3504.0, 5583.0, 9501.0, 15300.0, 25773.0, 43533.0, 73987.0, 126400.0, 198073.0, 206229.0, 135998.0, 80311.0, 47045.0, 27878.0, 16356.0, 10080.0, 6094.0, 3724.0, 2429.0, 1495.0, 985.0, 679.0, 410.0, 266.0, 190.0, 135.0, 87.0, 64.0, 36.0, 19.0, 17.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.736328125, -0.7126312255859375, -0.688934326171875, -0.6652374267578125, -0.64154052734375, -0.6178436279296875, -0.594146728515625, -0.5704498291015625, -0.5467529296875, -0.5230560302734375, -0.499359130859375, -0.4756622314453125, -0.45196533203125, -0.4282684326171875, -0.404571533203125, -0.3808746337890625, -0.357177734375, -0.3334808349609375, -0.309783935546875, -0.2860870361328125, -0.26239013671875, -0.2386932373046875, -0.214996337890625, -0.1912994384765625, -0.1676025390625, -0.1439056396484375, -0.120208740234375, -0.0965118408203125, -0.07281494140625, -0.0491180419921875, -0.025421142578125, -0.0017242431640625, 0.02197265625, 0.0456695556640625, 0.069366455078125, 0.0930633544921875, 0.11676025390625, 0.1404571533203125, 0.164154052734375, 0.1878509521484375, 0.2115478515625, 0.2352447509765625, 0.258941650390625, 0.2826385498046875, 0.30633544921875, 0.3300323486328125, 0.353729248046875, 0.3774261474609375, 0.401123046875, 0.4248199462890625, 0.448516845703125, 0.4722137451171875, 0.49591064453125, 0.5196075439453125, 0.543304443359375, 0.5670013427734375, 0.5906982421875, 0.6143951416015625, 0.638092041015625, 0.6617889404296875, 0.68548583984375, 0.7091827392578125, 0.732879638671875, 0.7565765380859375, 0.7802734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 19.0, 14.0, 25.0, 27.0, 33.0, 31.0, 40.0, 49.0, 44.0, 51.0, 54.0, 51.0, 53.0, 44.0, 65.0, 50.0, 45.0, 41.0, 27.0, 37.0, 24.0, 22.0, 18.0, 12.0, 12.0, 10.0, 14.0, 9.0, 5.0, 4.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24935150146484375, -0.2411346435546875, -0.23291778564453125, -0.224700927734375, -0.21648406982421875, -0.2082672119140625, -0.20005035400390625, -0.19183349609375, -0.18361663818359375, -0.1753997802734375, -0.16718292236328125, -0.158966064453125, -0.15074920654296875, -0.1425323486328125, -0.13431549072265625, -0.1260986328125, -0.11788177490234375, -0.1096649169921875, -0.10144805908203125, -0.093231201171875, -0.08501434326171875, -0.0767974853515625, -0.06858062744140625, -0.06036376953125, -0.05214691162109375, -0.0439300537109375, -0.03571319580078125, -0.027496337890625, -0.01927947998046875, -0.0110626220703125, -0.00284576416015625, 0.00537109375, 0.01358795166015625, 0.0218048095703125, 0.03002166748046875, 0.038238525390625, 0.04645538330078125, 0.0546722412109375, 0.06288909912109375, 0.07110595703125, 0.07932281494140625, 0.0875396728515625, 0.09575653076171875, 0.103973388671875, 0.11219024658203125, 0.1204071044921875, 0.12862396240234375, 0.1368408203125, 0.14505767822265625, 0.1532745361328125, 0.16149139404296875, 0.169708251953125, 0.17792510986328125, 0.1861419677734375, 0.19435882568359375, 0.20257568359375, 0.21079254150390625, 0.2190093994140625, 0.22722625732421875, 0.235443115234375, 0.24365997314453125, 0.2518768310546875, 0.26009368896484375, 0.268310546875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 7.0, 14.0, 14.0, 16.0, 28.0, 34.0, 38.0, 47.0, 45.0, 58.0, 64.0, 74.0, 84.0, 70.0, 72.0, 46.0, 62.0, 52.0, 29.0, 33.0, 27.0, 15.0, 19.0, 14.0, 8.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.229190826416016, -7.951141834259033, -7.673092842102051, -7.395044326782227, -7.116995334625244, -6.838946342468262, -6.5608978271484375, -6.282848834991455, -6.004799842834473, -5.72675085067749, -5.448701858520508, -5.170653343200684, -4.892604351043701, -4.614555358886719, -4.3365068435668945, -4.058457851409912, -3.7804088592529297, -3.5023598670959473, -3.224311113357544, -2.9462623596191406, -2.668213367462158, -2.390164375305176, -2.1121156215667725, -1.8340667486190796, -1.5560178756713867, -1.2779690027236938, -0.999920129776001, -0.7218712568283081, -0.44382238388061523, -0.16577351093292236, 0.11227536201477051, 0.3903242349624634, 0.6683740615844727, 0.9464229345321655, 1.2244718074798584, 1.5025206804275513, 1.7805695533752441, 2.0586185455322266, 2.33666729927063, 2.614716053009033, 2.8927650451660156, 3.170814037322998, 3.4488627910614014, 3.7269115447998047, 4.004960536956787, 4.2830095291137695, 4.561058044433594, 4.839107036590576, 5.117156028747559, 5.395205020904541, 5.673254013061523, 5.951302528381348, 6.22935152053833, 6.5074005126953125, 6.785449028015137, 7.063498020172119, 7.341547012329102, 7.619596004486084, 7.897644996643066, 8.17569351196289, 8.453742980957031, 8.731791496276855, 9.00984001159668, 9.28788948059082, 9.565937995910645]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 9.0, 14.0, 21.0, 22.0, 22.0, 29.0, 28.0, 24.0, 37.0, 39.0, 43.0, 41.0, 43.0, 48.0, 46.0, 32.0, 48.0, 45.0, 46.0, 29.0, 33.0, 39.0, 28.0, 24.0, 28.0, 22.0, 24.0, 19.0, 19.0, 11.0, 15.0, 6.0, 10.0, 11.0, 3.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.924797058105469, -5.7518486976623535, -5.578900337219238, -5.405952453613281, -5.233004093170166, -5.060055732727051, -4.887107849121094, -4.7141594886779785, -4.541211128234863, -4.368262767791748, -4.195314407348633, -4.022366523742676, -3.8494181632995605, -3.6764698028564453, -3.503521680831909, -3.330573558807373, -3.157625198364258, -2.9846768379211426, -2.8117287158966064, -2.6387805938720703, -2.465832233428955, -2.29288387298584, -2.1199357509613037, -1.946987509727478, -1.7740392684936523, -1.6010910272598267, -1.428142786026001, -1.2551945447921753, -1.0822463035583496, -0.9092980623245239, -0.7363498210906982, -0.5634015798568726, -0.39045286178588867, -0.217504620552063, -0.044556379318237305, 0.12839186191558838, 0.30134010314941406, 0.47428834438323975, 0.6472365856170654, 0.8201848268508911, 0.9931330680847168, 1.1660813093185425, 1.3390295505523682, 1.5119777917861938, 1.6849260330200195, 1.8578742742538452, 2.030822515487671, 2.203770637512207, 2.3767189979553223, 2.5496673583984375, 2.7226154804229736, 2.8955636024475098, 3.068511962890625, 3.2414603233337402, 3.4144084453582764, 3.5873565673828125, 3.7603049278259277, 3.933253288269043, 4.106201171875, 4.279149532318115, 4.4520978927612305, 4.625046253204346, 4.797994613647461, 4.970942497253418, 5.143890857696533]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 5.0, 9.0, 16.0, 14.0, 34.0, 35.0, 55.0, 91.0, 116.0, 199.0, 252.0, 397.0, 587.0, 832.0, 1310.0, 1877.0, 2924.0, 4276.0, 6176.0, 9534.0, 14046.0, 20801.0, 30915.0, 45108.0, 64110.0, 87238.0, 111080.0, 126907.0, 126229.0, 109124.0, 85512.0, 62809.0, 44059.0, 30282.0, 20342.0, 13616.0, 9014.0, 6169.0, 4062.0, 2793.0, 1792.0, 1188.0, 859.0, 580.0, 390.0, 258.0, 178.0, 106.0, 86.0, 59.0, 32.0, 23.0, 20.0, 16.0, 6.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.5546875, -4.4075927734375, -4.260498046875, -4.1134033203125, -3.96630859375, -3.8192138671875, -3.672119140625, -3.5250244140625, -3.3779296875, -3.2308349609375, -3.083740234375, -2.9366455078125, -2.78955078125, -2.6424560546875, -2.495361328125, -2.3482666015625, -2.201171875, -2.0540771484375, -1.906982421875, -1.7598876953125, -1.61279296875, -1.4656982421875, -1.318603515625, -1.1715087890625, -1.0244140625, -0.8773193359375, -0.730224609375, -0.5831298828125, -0.43603515625, -0.2889404296875, -0.141845703125, 0.0052490234375, 0.15234375, 0.2994384765625, 0.446533203125, 0.5936279296875, 0.74072265625, 0.8878173828125, 1.034912109375, 1.1820068359375, 1.3291015625, 1.4761962890625, 1.623291015625, 1.7703857421875, 1.91748046875, 2.0645751953125, 2.211669921875, 2.3587646484375, 2.505859375, 2.6529541015625, 2.800048828125, 2.9471435546875, 3.09423828125, 3.2413330078125, 3.388427734375, 3.5355224609375, 3.6826171875, 3.8297119140625, 3.976806640625, 4.1239013671875, 4.27099609375, 4.4180908203125, 4.565185546875, 4.7122802734375, 4.859375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 6.0, 5.0, 7.0, 24.0, 20.0, 11.0, 24.0, 27.0, 27.0, 33.0, 35.0, 37.0, 44.0, 38.0, 40.0, 50.0, 44.0, 51.0, 41.0, 47.0, 35.0, 29.0, 41.0, 40.0, 30.0, 28.0, 30.0, 26.0, 31.0, 20.0, 22.0, 9.0, 6.0, 6.0, 7.0, 7.0, 5.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.61328125, -6.43634033203125, -6.2593994140625, -6.08245849609375, -5.905517578125, -5.72857666015625, -5.5516357421875, -5.37469482421875, -5.19775390625, -5.02081298828125, -4.8438720703125, -4.66693115234375, -4.489990234375, -4.31304931640625, -4.1361083984375, -3.95916748046875, -3.7822265625, -3.60528564453125, -3.4283447265625, -3.25140380859375, -3.074462890625, -2.89752197265625, -2.7205810546875, -2.54364013671875, -2.36669921875, -2.18975830078125, -2.0128173828125, -1.83587646484375, -1.658935546875, -1.48199462890625, -1.3050537109375, -1.12811279296875, -0.951171875, -0.77423095703125, -0.5972900390625, -0.42034912109375, -0.243408203125, -0.06646728515625, 0.1104736328125, 0.28741455078125, 0.46435546875, 0.64129638671875, 0.8182373046875, 0.99517822265625, 1.172119140625, 1.34906005859375, 1.5260009765625, 1.70294189453125, 1.8798828125, 2.05682373046875, 2.2337646484375, 2.41070556640625, 2.587646484375, 2.76458740234375, 2.9415283203125, 3.11846923828125, 3.29541015625, 3.47235107421875, 3.6492919921875, 3.82623291015625, 4.003173828125, 4.18011474609375, 4.3570556640625, 4.53399658203125, 4.7109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 16.0, 36.0, 37.0, 76.0, 100.0, 173.0, 275.0, 400.0, 691.0, 1173.0, 1905.0, 3180.0, 5298.0, 8996.0, 15324.0, 25724.0, 43032.0, 71236.0, 109577.0, 150350.0, 169462.0, 150723.0, 110458.0, 71969.0, 44098.0, 26385.0, 15316.0, 9062.0, 5428.0, 3205.0, 1856.0, 1160.0, 673.0, 419.0, 281.0, 175.0, 94.0, 72.0, 41.0, 21.0, 20.0, 16.0, 11.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.4305419921875, -4.263427734375, -4.0963134765625, -3.92919921875, -3.7620849609375, -3.594970703125, -3.4278564453125, -3.2607421875, -3.0936279296875, -2.926513671875, -2.7593994140625, -2.59228515625, -2.4251708984375, -2.258056640625, -2.0909423828125, -1.923828125, -1.7567138671875, -1.589599609375, -1.4224853515625, -1.25537109375, -1.0882568359375, -0.921142578125, -0.7540283203125, -0.5869140625, -0.4197998046875, -0.252685546875, -0.0855712890625, 0.08154296875, 0.2486572265625, 0.415771484375, 0.5828857421875, 0.75, 0.9171142578125, 1.084228515625, 1.2513427734375, 1.41845703125, 1.5855712890625, 1.752685546875, 1.9197998046875, 2.0869140625, 2.2540283203125, 2.421142578125, 2.5882568359375, 2.75537109375, 2.9224853515625, 3.089599609375, 3.2567138671875, 3.423828125, 3.5909423828125, 3.758056640625, 3.9251708984375, 4.09228515625, 4.2593994140625, 4.426513671875, 4.5936279296875, 4.7607421875, 4.9278564453125, 5.094970703125, 5.2620849609375, 5.42919921875, 5.5963134765625, 5.763427734375, 5.9305419921875, 6.09765625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 13.0, 5.0, 6.0, 18.0, 6.0, 10.0, 13.0, 21.0, 13.0, 24.0, 24.0, 29.0, 37.0, 28.0, 32.0, 28.0, 47.0, 46.0, 40.0, 49.0, 50.0, 41.0, 40.0, 46.0, 38.0, 23.0, 39.0, 33.0, 21.0, 18.0, 26.0, 22.0, 21.0, 18.0, 14.0, 17.0, 12.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.31640625, -4.18438720703125, -4.0523681640625, -3.92034912109375, -3.788330078125, -3.65631103515625, -3.5242919921875, -3.39227294921875, -3.26025390625, -3.12823486328125, -2.9962158203125, -2.86419677734375, -2.732177734375, -2.60015869140625, -2.4681396484375, -2.33612060546875, -2.2041015625, -2.07208251953125, -1.9400634765625, -1.80804443359375, -1.676025390625, -1.54400634765625, -1.4119873046875, -1.27996826171875, -1.14794921875, -1.01593017578125, -0.8839111328125, -0.75189208984375, -0.619873046875, -0.48785400390625, -0.3558349609375, -0.22381591796875, -0.091796875, 0.04022216796875, 0.1722412109375, 0.30426025390625, 0.436279296875, 0.56829833984375, 0.7003173828125, 0.83233642578125, 0.96435546875, 1.09637451171875, 1.2283935546875, 1.36041259765625, 1.492431640625, 1.62445068359375, 1.7564697265625, 1.88848876953125, 2.0205078125, 2.15252685546875, 2.2845458984375, 2.41656494140625, 2.548583984375, 2.68060302734375, 2.8126220703125, 2.94464111328125, 3.07666015625, 3.20867919921875, 3.3406982421875, 3.47271728515625, 3.604736328125, 3.73675537109375, 3.8687744140625, 4.00079345703125, 4.1328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 13.0, 22.0, 38.0, 68.0, 95.0, 158.0, 282.0, 499.0, 961.0, 1711.0, 3487.0, 7773.0, 18918.0, 54102.0, 169702.0, 383499.0, 267489.0, 88908.0, 29807.0, 11214.0, 4898.0, 2264.0, 1143.0, 599.0, 315.0, 223.0, 114.0, 68.0, 53.0, 38.0, 23.0, 15.0, 11.0, 6.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.5, -10.1790771484375, -9.858154296875, -9.5372314453125, -9.21630859375, -8.8953857421875, -8.574462890625, -8.2535400390625, -7.9326171875, -7.6116943359375, -7.290771484375, -6.9698486328125, -6.64892578125, -6.3280029296875, -6.007080078125, -5.6861572265625, -5.365234375, -5.0443115234375, -4.723388671875, -4.4024658203125, -4.08154296875, -3.7606201171875, -3.439697265625, -3.1187744140625, -2.7978515625, -2.4769287109375, -2.156005859375, -1.8350830078125, -1.51416015625, -1.1932373046875, -0.872314453125, -0.5513916015625, -0.23046875, 0.0904541015625, 0.411376953125, 0.7322998046875, 1.05322265625, 1.3741455078125, 1.695068359375, 2.0159912109375, 2.3369140625, 2.6578369140625, 2.978759765625, 3.2996826171875, 3.62060546875, 3.9415283203125, 4.262451171875, 4.5833740234375, 4.904296875, 5.2252197265625, 5.546142578125, 5.8670654296875, 6.18798828125, 6.5089111328125, 6.829833984375, 7.1507568359375, 7.4716796875, 7.7926025390625, 8.113525390625, 8.4344482421875, 8.75537109375, 9.0762939453125, 9.397216796875, 9.7181396484375, 10.0390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 11.0, 12.0, 15.0, 20.0, 31.0, 21.0, 31.0, 40.0, 52.0, 46.0, 35.0, 65.0, 53.0, 68.0, 63.0, 60.0, 50.0, 46.0, 51.0, 47.0, 30.0, 35.0, 19.0, 19.0, 13.0, 10.0, 8.0, 10.0, 8.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00045680999755859375, -0.0004429668188095093, -0.0004291236400604248, -0.00041528046131134033, -0.00040143728256225586, -0.0003875941038131714, -0.0003737509250640869, -0.00035990774631500244, -0.00034606456756591797, -0.0003322213888168335, -0.000318378210067749, -0.00030453503131866455, -0.0002906918525695801, -0.0002768486738204956, -0.00026300549507141113, -0.00024916231632232666, -0.0002353191375732422, -0.00022147595882415771, -0.00020763278007507324, -0.00019378960132598877, -0.0001799464225769043, -0.00016610324382781982, -0.00015226006507873535, -0.00013841688632965088, -0.0001245737075805664, -0.00011073052883148193, -9.688735008239746e-05, -8.304417133331299e-05, -6.920099258422852e-05, -5.535781383514404e-05, -4.151463508605957e-05, -2.7671456336975098e-05, -1.3828277587890625e-05, 1.4901161193847656e-08, 1.385807991027832e-05, 2.7701258659362793e-05, 4.1544437408447266e-05, 5.538761615753174e-05, 6.923079490661621e-05, 8.307397365570068e-05, 9.691715240478516e-05, 0.00011076033115386963, 0.0001246035099029541, 0.00013844668865203857, 0.00015228986740112305, 0.00016613304615020752, 0.000179976224899292, 0.00019381940364837646, 0.00020766258239746094, 0.0002215057611465454, 0.00023534893989562988, 0.00024919211864471436, 0.00026303529739379883, 0.0002768784761428833, 0.0002907216548919678, 0.00030456483364105225, 0.0003184080123901367, 0.0003322511911392212, 0.00034609436988830566, 0.00035993754863739014, 0.0003737807273864746, 0.0003876239061355591, 0.00040146708488464355, 0.00041531026363372803, 0.0004291534423828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 3.0, 13.0, 12.0, 21.0, 26.0, 37.0, 52.0, 77.0, 114.0, 204.0, 291.0, 424.0, 697.0, 1135.0, 1982.0, 3497.0, 6604.0, 13414.0, 29688.0, 69528.0, 160943.0, 280028.0, 251471.0, 127685.0, 53854.0, 23125.0, 10841.0, 5467.0, 2824.0, 1731.0, 1003.0, 643.0, 384.0, 238.0, 156.0, 112.0, 64.0, 44.0, 40.0, 18.0, 16.0, 17.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.65972900390625, -6.4366455078125, -6.21356201171875, -5.990478515625, -5.76739501953125, -5.5443115234375, -5.32122802734375, -5.09814453125, -4.87506103515625, -4.6519775390625, -4.42889404296875, -4.205810546875, -3.98272705078125, -3.7596435546875, -3.53656005859375, -3.3134765625, -3.09039306640625, -2.8673095703125, -2.64422607421875, -2.421142578125, -2.19805908203125, -1.9749755859375, -1.75189208984375, -1.52880859375, -1.30572509765625, -1.0826416015625, -0.85955810546875, -0.636474609375, -0.41339111328125, -0.1903076171875, 0.03277587890625, 0.255859375, 0.47894287109375, 0.7020263671875, 0.92510986328125, 1.148193359375, 1.37127685546875, 1.5943603515625, 1.81744384765625, 2.04052734375, 2.26361083984375, 2.4866943359375, 2.70977783203125, 2.932861328125, 3.15594482421875, 3.3790283203125, 3.60211181640625, 3.8251953125, 4.04827880859375, 4.2713623046875, 4.49444580078125, 4.717529296875, 4.94061279296875, 5.1636962890625, 5.38677978515625, 5.60986328125, 5.83294677734375, 6.0560302734375, 6.27911376953125, 6.502197265625, 6.72528076171875, 6.9483642578125, 7.17144775390625, 7.39453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 5.0, 15.0, 10.0, 10.0, 20.0, 23.0, 39.0, 41.0, 81.0, 79.0, 110.0, 110.0, 92.0, 89.0, 50.0, 40.0, 27.0, 35.0, 21.0, 24.0, 9.0, 12.0, 7.0, 5.0, 6.0, 4.0, 6.0, 0.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.4609375, -3.35986328125, -3.2587890625, -3.15771484375, -3.056640625, -2.95556640625, -2.8544921875, -2.75341796875, -2.65234375, -2.55126953125, -2.4501953125, -2.34912109375, -2.248046875, -2.14697265625, -2.0458984375, -1.94482421875, -1.84375, -1.74267578125, -1.6416015625, -1.54052734375, -1.439453125, -1.33837890625, -1.2373046875, -1.13623046875, -1.03515625, -0.93408203125, -0.8330078125, -0.73193359375, -0.630859375, -0.52978515625, -0.4287109375, -0.32763671875, -0.2265625, -0.12548828125, -0.0244140625, 0.07666015625, 0.177734375, 0.27880859375, 0.3798828125, 0.48095703125, 0.58203125, 0.68310546875, 0.7841796875, 0.88525390625, 0.986328125, 1.08740234375, 1.1884765625, 1.28955078125, 1.390625, 1.49169921875, 1.5927734375, 1.69384765625, 1.794921875, 1.89599609375, 1.9970703125, 2.09814453125, 2.19921875, 2.30029296875, 2.4013671875, 2.50244140625, 2.603515625, 2.70458984375, 2.8056640625, 2.90673828125, 3.0078125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 4.0, 16.0, 21.0, 25.0, 29.0, 31.0, 45.0, 48.0, 66.0, 65.0, 71.0, 91.0, 73.0, 79.0, 67.0, 53.0, 50.0, 43.0, 20.0, 20.0, 21.0, 12.0, 13.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9293670654296875, -7.647541522979736, -7.365716457366943, -7.083890914916992, -6.802065372467041, -6.52023983001709, -6.238414764404297, -5.956589221954346, -5.6747636795043945, -5.392938137054443, -5.11111307144165, -4.829287528991699, -4.547461986541748, -4.265636444091797, -3.983811378479004, -3.7019858360290527, -3.4201607704162598, -3.1383354663848877, -2.8565099239349365, -2.5746846199035645, -2.2928590774536133, -2.011033773422241, -1.7292084693908691, -1.4473830461502075, -1.165557622909546, -0.8837321996688843, -0.6019068360328674, -0.3200814723968506, -0.038256049156188965, 0.24356937408447266, 0.5253946781158447, 0.8072201013565063, 1.089045524597168, 1.3708709478378296, 1.6526963710784912, 1.9345216751098633, 2.2163472175598145, 2.4981725215911865, 2.7799978256225586, 3.0618233680725098, 3.343648672103882, 3.625473976135254, 3.907299518585205, 4.189125061035156, 4.470950126647949, 4.7527756690979, 5.034601211547852, 5.3164262771606445, 5.598251819610596, 5.880077362060547, 6.16190242767334, 6.443727970123291, 6.725553512573242, 7.007378578186035, 7.289204120635986, 7.5710296630859375, 7.8528547286987305, 8.134679794311523, 8.416505813598633, 8.698330879211426, 8.980155944824219, 9.261981964111328, 9.543807029724121, 9.825632095336914, 10.107458114624023]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 3.0, 3.0, 5.0, 7.0, 4.0, 14.0, 12.0, 17.0, 21.0, 23.0, 24.0, 22.0, 29.0, 45.0, 27.0, 41.0, 33.0, 42.0, 52.0, 37.0, 29.0, 47.0, 39.0, 29.0, 47.0, 48.0, 28.0, 29.0, 24.0, 31.0, 24.0, 28.0, 27.0, 15.0, 19.0, 15.0, 15.0, 15.0, 11.0, 5.0, 6.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.836164951324463, -5.655647277832031, -5.475129127502441, -5.294610977172852, -5.11409330368042, -4.933575630187988, -4.753057479858398, -4.572539329528809, -4.392021656036377, -4.211503982543945, -4.0309858322143555, -3.8504679203033447, -3.669950008392334, -3.4894320964813232, -3.3089141845703125, -3.1283962726593018, -2.947878360748291, -2.7673604488372803, -2.5868425369262695, -2.406324625015259, -2.225806713104248, -2.0452888011932373, -1.8647708892822266, -1.6842529773712158, -1.503735065460205, -1.3232171535491943, -1.1426992416381836, -0.9621813297271729, -0.7816634178161621, -0.6011455059051514, -0.4206275939941406, -0.24010968208312988, -0.05959129333496094, 0.1209266185760498, 0.30144453048706055, 0.4819624423980713, 0.662480354309082, 0.8429982662200928, 1.0235161781311035, 1.2040340900421143, 1.384552001953125, 1.5650699138641357, 1.7455878257751465, 1.9261057376861572, 2.106623649597168, 2.2871415615081787, 2.4676594734191895, 2.6481773853302, 2.828695297241211, 3.0092132091522217, 3.1897311210632324, 3.370249032974243, 3.550766944885254, 3.7312848567962646, 3.9118027687072754, 4.092320442199707, 4.272838592529297, 4.453356742858887, 4.633874416351318, 4.81439208984375, 4.99491024017334, 5.17542839050293, 5.355946063995361, 5.536463737487793, 5.716981887817383]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 7.0, 6.0, 11.0, 12.0, 15.0, 23.0, 39.0, 51.0, 103.0, 131.0, 199.0, 296.0, 463.0, 732.0, 1198.0, 1966.0, 3413.0, 6195.0, 11297.0, 20973.0, 41158.0, 84003.0, 181458.0, 404994.0, 825437.0, 1106660.0, 791045.0, 381939.0, 170126.0, 78954.0, 37907.0, 19182.0, 10273.0, 5636.0, 3266.0, 1970.0, 1161.0, 669.0, 492.0, 286.0, 169.0, 119.0, 86.0, 55.0, 32.0, 27.0, 18.0, 18.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-6.62890625, -6.4246826171875, -6.220458984375, -6.0162353515625, -5.81201171875, -5.6077880859375, -5.403564453125, -5.1993408203125, -4.9951171875, -4.7908935546875, -4.586669921875, -4.3824462890625, -4.17822265625, -3.9739990234375, -3.769775390625, -3.5655517578125, -3.361328125, -3.1571044921875, -2.952880859375, -2.7486572265625, -2.54443359375, -2.3402099609375, -2.135986328125, -1.9317626953125, -1.7275390625, -1.5233154296875, -1.319091796875, -1.1148681640625, -0.91064453125, -0.7064208984375, -0.502197265625, -0.2979736328125, -0.09375, 0.1104736328125, 0.314697265625, 0.5189208984375, 0.72314453125, 0.9273681640625, 1.131591796875, 1.3358154296875, 1.5400390625, 1.7442626953125, 1.948486328125, 2.1527099609375, 2.35693359375, 2.5611572265625, 2.765380859375, 2.9696044921875, 3.173828125, 3.3780517578125, 3.582275390625, 3.7864990234375, 3.99072265625, 4.1949462890625, 4.399169921875, 4.6033935546875, 4.8076171875, 5.0118408203125, 5.216064453125, 5.4202880859375, 5.62451171875, 5.8287353515625, 6.032958984375, 6.2371826171875, 6.44140625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 11.0, 7.0, 12.0, 22.0, 21.0, 22.0, 22.0, 27.0, 27.0, 37.0, 37.0, 35.0, 52.0, 45.0, 47.0, 33.0, 38.0, 43.0, 37.0, 31.0, 39.0, 22.0, 40.0, 43.0, 38.0, 33.0, 26.0, 24.0, 10.0, 19.0, 15.0, 17.0, 17.0, 10.0, 10.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.676300048828125, -3.55963134765625, -3.442962646484375, -3.3262939453125, -3.209625244140625, -3.09295654296875, -2.976287841796875, -2.859619140625, -2.742950439453125, -2.62628173828125, -2.509613037109375, -2.3929443359375, -2.276275634765625, -2.15960693359375, -2.042938232421875, -1.92626953125, -1.809600830078125, -1.69293212890625, -1.576263427734375, -1.4595947265625, -1.342926025390625, -1.22625732421875, -1.109588623046875, -0.992919921875, -0.876251220703125, -0.75958251953125, -0.642913818359375, -0.5262451171875, -0.409576416015625, -0.29290771484375, -0.176239013671875, -0.0595703125, 0.057098388671875, 0.17376708984375, 0.290435791015625, 0.4071044921875, 0.523773193359375, 0.64044189453125, 0.757110595703125, 0.873779296875, 0.990447998046875, 1.10711669921875, 1.223785400390625, 1.3404541015625, 1.457122802734375, 1.57379150390625, 1.690460205078125, 1.80712890625, 1.923797607421875, 2.04046630859375, 2.157135009765625, 2.2738037109375, 2.390472412109375, 2.50714111328125, 2.623809814453125, 2.740478515625, 2.857147216796875, 2.97381591796875, 3.090484619140625, 3.2071533203125, 3.323822021484375, 3.44049072265625, 3.557159423828125, 3.673828125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 8.0, 20.0, 20.0, 31.0, 66.0, 69.0, 108.0, 128.0, 232.0, 373.0, 513.0, 745.0, 1099.0, 1795.0, 2774.0, 4490.0, 7219.0, 12021.0, 19952.0, 34184.0, 59727.0, 106214.0, 188841.0, 329165.0, 541379.0, 756543.0, 766135.0, 558444.0, 341447.0, 197232.0, 111090.0, 62699.0, 35717.0, 21235.0, 12450.0, 7281.0, 4679.0, 2781.0, 1881.0, 1114.0, 740.0, 557.0, 348.0, 230.0, 160.0, 118.0, 79.0, 50.0, 26.0, 25.0, 15.0, 17.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.9921875, -4.83636474609375, -4.6805419921875, -4.52471923828125, -4.368896484375, -4.21307373046875, -4.0572509765625, -3.90142822265625, -3.74560546875, -3.58978271484375, -3.4339599609375, -3.27813720703125, -3.122314453125, -2.96649169921875, -2.8106689453125, -2.65484619140625, -2.4990234375, -2.34320068359375, -2.1873779296875, -2.03155517578125, -1.875732421875, -1.71990966796875, -1.5640869140625, -1.40826416015625, -1.25244140625, -1.09661865234375, -0.9407958984375, -0.78497314453125, -0.629150390625, -0.47332763671875, -0.3175048828125, -0.16168212890625, -0.005859375, 0.14996337890625, 0.3057861328125, 0.46160888671875, 0.617431640625, 0.77325439453125, 0.9290771484375, 1.08489990234375, 1.24072265625, 1.39654541015625, 1.5523681640625, 1.70819091796875, 1.864013671875, 2.01983642578125, 2.1756591796875, 2.33148193359375, 2.4873046875, 2.64312744140625, 2.7989501953125, 2.95477294921875, 3.110595703125, 3.26641845703125, 3.4222412109375, 3.57806396484375, 3.73388671875, 3.88970947265625, 4.0455322265625, 4.20135498046875, 4.357177734375, 4.51300048828125, 4.6688232421875, 4.82464599609375, 4.98046875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 13.0, 18.0, 25.0, 22.0, 47.0, 51.0, 58.0, 91.0, 94.0, 121.0, 167.0, 171.0, 203.0, 240.0, 288.0, 309.0, 256.0, 268.0, 280.0, 250.0, 209.0, 180.0, 130.0, 125.0, 91.0, 78.0, 66.0, 40.0, 42.0, 29.0, 24.0, 24.0, 15.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.23046875, -2.1687164306640625, -2.106964111328125, -2.0452117919921875, -1.98345947265625, -1.9217071533203125, -1.859954833984375, -1.7982025146484375, -1.7364501953125, -1.6746978759765625, -1.612945556640625, -1.5511932373046875, -1.48944091796875, -1.4276885986328125, -1.365936279296875, -1.3041839599609375, -1.242431640625, -1.1806793212890625, -1.118927001953125, -1.0571746826171875, -0.99542236328125, -0.9336700439453125, -0.871917724609375, -0.8101654052734375, -0.7484130859375, -0.6866607666015625, -0.624908447265625, -0.5631561279296875, -0.50140380859375, -0.4396514892578125, -0.377899169921875, -0.3161468505859375, -0.25439453125, -0.1926422119140625, -0.130889892578125, -0.0691375732421875, -0.00738525390625, 0.0543670654296875, 0.116119384765625, 0.1778717041015625, 0.2396240234375, 0.3013763427734375, 0.363128662109375, 0.4248809814453125, 0.48663330078125, 0.5483856201171875, 0.610137939453125, 0.6718902587890625, 0.733642578125, 0.7953948974609375, 0.857147216796875, 0.9188995361328125, 0.98065185546875, 1.0424041748046875, 1.104156494140625, 1.1659088134765625, 1.2276611328125, 1.2894134521484375, 1.351165771484375, 1.4129180908203125, 1.47467041015625, 1.5364227294921875, 1.598175048828125, 1.6599273681640625, 1.7216796875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 13.0, 22.0, 22.0, 33.0, 41.0, 39.0, 54.0, 68.0, 81.0, 66.0, 81.0, 53.0, 81.0, 64.0, 70.0, 42.0, 33.0, 26.0, 20.0, 18.0, 15.0, 7.0, 9.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.195919513702393, -5.962164402008057, -5.728409290313721, -5.494654178619385, -5.260899543762207, -5.027144432067871, -4.793389320373535, -4.559634208679199, -4.325879096984863, -4.092123985290527, -3.8583688735961914, -3.6246140003204346, -3.3908588886260986, -3.1571037769317627, -2.923348903656006, -2.68959379196167, -2.455838680267334, -2.222083568572998, -1.9883285760879517, -1.7545735836029053, -1.5208184719085693, -1.2870633602142334, -1.053308367729187, -0.8195533752441406, -0.5857982635498047, -0.3520432114601135, -0.11828815937042236, 0.1154668927192688, 0.34922194480895996, 0.5829770565032959, 0.8167320489883423, 1.0504870414733887, 1.2842426300048828, 1.5179977416992188, 1.7517527341842651, 1.9855077266693115, 2.2192628383636475, 2.4530179500579834, 2.6867728233337402, 2.920527935028076, 3.154283046722412, 3.388038158416748, 3.621793270111084, 3.855548143386841, 4.089303016662598, 4.323058128356934, 4.5568132400512695, 4.7905683517456055, 5.024323463439941, 5.258078575134277, 5.491833686828613, 5.725588798522949, 5.959343910217285, 6.193099021911621, 6.426853656768799, 6.660608768463135, 6.894363880157471, 7.128118991851807, 7.361874103546143, 7.5956292152404785, 7.829383850097656, 8.063138961791992, 8.296894073486328, 8.530649185180664, 8.764404296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 7.0, 13.0, 6.0, 19.0, 14.0, 28.0, 25.0, 27.0, 34.0, 36.0, 34.0, 44.0, 51.0, 38.0, 52.0, 44.0, 43.0, 32.0, 46.0, 44.0, 33.0, 35.0, 27.0, 28.0, 30.0, 34.0, 24.0, 29.0, 25.0, 11.0, 13.0, 9.0, 13.0, 12.0, 5.0, 11.0, 8.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.548825263977051, -4.397319316864014, -4.245813369750977, -4.0943074226379395, -3.9428014755249023, -3.7912955284118652, -3.639789581298828, -3.488283634185791, -3.336777687072754, -3.185271739959717, -3.0337657928466797, -2.8822598457336426, -2.7307538986206055, -2.5792479515075684, -2.4277420043945312, -2.276236057281494, -2.124730348587036, -1.973224401473999, -1.821718454360962, -1.6702125072479248, -1.5187065601348877, -1.3672006130218506, -1.215694785118103, -1.064188838005066, -0.9126828908920288, -0.7611769437789917, -0.6096709966659546, -0.45816510915756226, -0.30665916204452515, -0.15515321493148804, -0.003647327423095703, 0.1478586196899414, 0.2993645668029785, 0.4508705139160156, 0.6023764610290527, 0.7538823485374451, 0.9053882956504822, 1.056894302368164, 1.2084001302719116, 1.3599060773849487, 1.5114120244979858, 1.662917971611023, 1.81442391872406, 1.9659297466278076, 2.1174356937408447, 2.268941640853882, 2.420447587966919, 2.571953535079956, 2.723459482192993, 2.8749654293060303, 3.0264713764190674, 3.1779773235321045, 3.3294832706451416, 3.4809892177581787, 3.6324949264526367, 3.784000873565674, 3.935506820678711, 4.087012767791748, 4.238518714904785, 4.390024662017822, 4.541530609130859, 4.6930365562438965, 4.844542503356934, 4.996048450469971, 5.147554397583008]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 9.0, 8.0, 5.0, 11.0, 15.0, 27.0, 26.0, 39.0, 56.0, 81.0, 148.0, 251.0, 434.0, 729.0, 1275.0, 2242.0, 4016.0, 7384.0, 14448.0, 27744.0, 53823.0, 102481.0, 181313.0, 238863.0, 186995.0, 107195.0, 56845.0, 29499.0, 15053.0, 7970.0, 4178.0, 2229.0, 1302.0, 712.0, 398.0, 290.0, 166.0, 86.0, 67.0, 36.0, 30.0, 27.0, 10.0, 17.0, 7.0, 11.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.186920166015625, -1.14044189453125, -1.093963623046875, -1.0474853515625, -1.001007080078125, -0.95452880859375, -0.908050537109375, -0.861572265625, -0.815093994140625, -0.76861572265625, -0.722137451171875, -0.6756591796875, -0.629180908203125, -0.58270263671875, -0.536224365234375, -0.48974609375, -0.443267822265625, -0.39678955078125, -0.350311279296875, -0.3038330078125, -0.257354736328125, -0.21087646484375, -0.164398193359375, -0.117919921875, -0.071441650390625, -0.02496337890625, 0.021514892578125, 0.0679931640625, 0.114471435546875, 0.16094970703125, 0.207427978515625, 0.25390625, 0.300384521484375, 0.34686279296875, 0.393341064453125, 0.4398193359375, 0.486297607421875, 0.53277587890625, 0.579254150390625, 0.625732421875, 0.672210693359375, 0.71868896484375, 0.765167236328125, 0.8116455078125, 0.858123779296875, 0.90460205078125, 0.951080322265625, 0.99755859375, 1.044036865234375, 1.09051513671875, 1.136993408203125, 1.1834716796875, 1.229949951171875, 1.27642822265625, 1.322906494140625, 1.369384765625, 1.415863037109375, 1.46234130859375, 1.508819580078125, 1.5552978515625, 1.601776123046875, 1.64825439453125, 1.694732666015625, 1.7412109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 10.0, 6.0, 11.0, 20.0, 12.0, 21.0, 26.0, 25.0, 22.0, 22.0, 30.0, 33.0, 44.0, 53.0, 42.0, 42.0, 44.0, 43.0, 40.0, 43.0, 44.0, 35.0, 39.0, 29.0, 32.0, 21.0, 29.0, 24.0, 28.0, 19.0, 20.0, 16.0, 8.0, 12.0, 14.0, 10.0, 9.0, 13.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.12518310546875, -3.9691162109375, -3.81304931640625, -3.656982421875, -3.50091552734375, -3.3448486328125, -3.18878173828125, -3.03271484375, -2.87664794921875, -2.7205810546875, -2.56451416015625, -2.408447265625, -2.25238037109375, -2.0963134765625, -1.94024658203125, -1.7841796875, -1.62811279296875, -1.4720458984375, -1.31597900390625, -1.159912109375, -1.00384521484375, -0.8477783203125, -0.69171142578125, -0.53564453125, -0.37957763671875, -0.2235107421875, -0.06744384765625, 0.088623046875, 0.24468994140625, 0.4007568359375, 0.55682373046875, 0.712890625, 0.86895751953125, 1.0250244140625, 1.18109130859375, 1.337158203125, 1.49322509765625, 1.6492919921875, 1.80535888671875, 1.96142578125, 2.11749267578125, 2.2735595703125, 2.42962646484375, 2.585693359375, 2.74176025390625, 2.8978271484375, 3.05389404296875, 3.2099609375, 3.36602783203125, 3.5220947265625, 3.67816162109375, 3.834228515625, 3.99029541015625, 4.1463623046875, 4.30242919921875, 4.45849609375, 4.61456298828125, 4.7706298828125, 4.92669677734375, 5.082763671875, 5.23883056640625, 5.3948974609375, 5.55096435546875, 5.70703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 2.0, 10.0, 5.0, 13.0, 12.0, 26.0, 28.0, 41.0, 52.0, 70.0, 109.0, 148.0, 210.0, 320.0, 502.0, 721.0, 1162.0, 1777.0, 3040.0, 5326.0, 9684.0, 20313.0, 66851.0, 844900.0, 52989.0, 18508.0, 9193.0, 4920.0, 2712.0, 1725.0, 1077.0, 700.0, 473.0, 259.0, 200.0, 126.0, 108.0, 64.0, 38.0, 30.0, 25.0, 16.0, 15.0, 10.0, 11.0, 8.0, 10.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -2.997802734375, -2.89599609375, -2.794189453125, -2.6923828125, -2.590576171875, -2.48876953125, -2.386962890625, -2.28515625, -2.183349609375, -2.08154296875, -1.979736328125, -1.8779296875, -1.776123046875, -1.67431640625, -1.572509765625, -1.470703125, -1.368896484375, -1.26708984375, -1.165283203125, -1.0634765625, -0.961669921875, -0.85986328125, -0.758056640625, -0.65625, -0.554443359375, -0.45263671875, -0.350830078125, -0.2490234375, -0.147216796875, -0.04541015625, 0.056396484375, 0.158203125, 0.260009765625, 0.36181640625, 0.463623046875, 0.5654296875, 0.667236328125, 0.76904296875, 0.870849609375, 0.97265625, 1.074462890625, 1.17626953125, 1.278076171875, 1.3798828125, 1.481689453125, 1.58349609375, 1.685302734375, 1.787109375, 1.888916015625, 1.99072265625, 2.092529296875, 2.1943359375, 2.296142578125, 2.39794921875, 2.499755859375, 2.6015625, 2.703369140625, 2.80517578125, 2.906982421875, 3.0087890625, 3.110595703125, 3.21240234375, 3.314208984375, 3.416015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 13.0, 15.0, 14.0, 16.0, 27.0, 30.0, 28.0, 28.0, 29.0, 34.0, 38.0, 42.0, 50.0, 53.0, 53.0, 44.0, 54.0, 55.0, 46.0, 41.0, 44.0, 29.0, 35.0, 33.0, 17.0, 29.0, 25.0, 14.0, 9.0, 11.0, 9.0, 7.0, 2.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.0892333984375, -4.897216796875, -4.7052001953125, -4.51318359375, -4.3211669921875, -4.129150390625, -3.9371337890625, -3.7451171875, -3.5531005859375, -3.361083984375, -3.1690673828125, -2.97705078125, -2.7850341796875, -2.593017578125, -2.4010009765625, -2.208984375, -2.0169677734375, -1.824951171875, -1.6329345703125, -1.44091796875, -1.2489013671875, -1.056884765625, -0.8648681640625, -0.6728515625, -0.4808349609375, -0.288818359375, -0.0968017578125, 0.09521484375, 0.2872314453125, 0.479248046875, 0.6712646484375, 0.86328125, 1.0552978515625, 1.247314453125, 1.4393310546875, 1.63134765625, 1.8233642578125, 2.015380859375, 2.2073974609375, 2.3994140625, 2.5914306640625, 2.783447265625, 2.9754638671875, 3.16748046875, 3.3594970703125, 3.551513671875, 3.7435302734375, 3.935546875, 4.1275634765625, 4.319580078125, 4.5115966796875, 4.70361328125, 4.8956298828125, 5.087646484375, 5.2796630859375, 5.4716796875, 5.6636962890625, 5.855712890625, 6.0477294921875, 6.23974609375, 6.4317626953125, 6.623779296875, 6.8157958984375, 7.0078125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 4.0, 14.0, 16.0, 26.0, 24.0, 43.0, 56.0, 91.0, 129.0, 218.0, 322.0, 539.0, 899.0, 1573.0, 2909.0, 5476.0, 12350.0, 32948.0, 892365.0, 63667.0, 18175.0, 7762.0, 3838.0, 2051.0, 1173.0, 661.0, 405.0, 244.0, 179.0, 131.0, 83.0, 40.0, 37.0, 38.0, 16.0, 12.0, 13.0, 2.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.69140625, -1.6380615234375, -1.584716796875, -1.5313720703125, -1.47802734375, -1.4246826171875, -1.371337890625, -1.3179931640625, -1.2646484375, -1.2113037109375, -1.157958984375, -1.1046142578125, -1.05126953125, -0.9979248046875, -0.944580078125, -0.8912353515625, -0.837890625, -0.7845458984375, -0.731201171875, -0.6778564453125, -0.62451171875, -0.5711669921875, -0.517822265625, -0.4644775390625, -0.4111328125, -0.3577880859375, -0.304443359375, -0.2510986328125, -0.19775390625, -0.1444091796875, -0.091064453125, -0.0377197265625, 0.015625, 0.0689697265625, 0.122314453125, 0.1756591796875, 0.22900390625, 0.2823486328125, 0.335693359375, 0.3890380859375, 0.4423828125, 0.4957275390625, 0.549072265625, 0.6024169921875, 0.65576171875, 0.7091064453125, 0.762451171875, 0.8157958984375, 0.869140625, 0.9224853515625, 0.975830078125, 1.0291748046875, 1.08251953125, 1.1358642578125, 1.189208984375, 1.2425537109375, 1.2958984375, 1.3492431640625, 1.402587890625, 1.4559326171875, 1.50927734375, 1.5626220703125, 1.615966796875, 1.6693115234375, 1.72265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 14.0, 18.0, 21.0, 29.0, 37.0, 44.0, 47.0, 54.0, 64.0, 59.0, 57.0, 58.0, 78.0, 56.0, 39.0, 47.0, 35.0, 29.0, 26.0, 23.0, 21.0, 12.0, 15.0, 8.0, 7.0, 3.0, 5.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.8041343688964844e-05, -4.650000482797623e-05, -4.495866596698761e-05, -4.341732710599899e-05, -4.1875988245010376e-05, -4.033464938402176e-05, -3.879331052303314e-05, -3.7251971662044525e-05, -3.571063280105591e-05, -3.416929394006729e-05, -3.2627955079078674e-05, -3.108661621809006e-05, -2.954527735710144e-05, -2.8003938496112823e-05, -2.6462599635124207e-05, -2.492126077413559e-05, -2.3379921913146973e-05, -2.1838583052158356e-05, -2.029724419116974e-05, -1.8755905330181122e-05, -1.7214566469192505e-05, -1.5673227608203888e-05, -1.4131888747215271e-05, -1.2590549886226654e-05, -1.1049211025238037e-05, -9.50787216424942e-06, -7.966533303260803e-06, -6.425194442272186e-06, -4.883855581283569e-06, -3.3425167202949524e-06, -1.8011778593063354e-06, -2.598389983177185e-07, 1.2814998626708984e-06, 2.8228387236595154e-06, 4.364177584648132e-06, 5.905516445636749e-06, 7.446855306625366e-06, 8.988194167613983e-06, 1.05295330286026e-05, 1.2070871889591217e-05, 1.3612210750579834e-05, 1.5153549611568451e-05, 1.6694888472557068e-05, 1.8236227333545685e-05, 1.9777566194534302e-05, 2.131890505552292e-05, 2.2860243916511536e-05, 2.4401582777500153e-05, 2.594292163848877e-05, 2.7484260499477386e-05, 2.9025599360466003e-05, 3.056693822145462e-05, 3.210827708244324e-05, 3.3649615943431854e-05, 3.519095480442047e-05, 3.673229366540909e-05, 3.8273632526397705e-05, 3.981497138738632e-05, 4.135631024837494e-05, 4.2897649109363556e-05, 4.443898797035217e-05, 4.598032683134079e-05, 4.752166569232941e-05, 4.9063004553318024e-05, 5.060434341430664e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 2.0, 9.0, 10.0, 17.0, 27.0, 46.0, 40.0, 73.0, 112.0, 149.0, 236.0, 333.0, 491.0, 676.0, 1048.0, 1698.0, 2533.0, 3938.0, 6196.0, 10152.0, 17297.0, 29049.0, 52089.0, 95094.0, 173293.0, 244294.0, 179787.0, 99015.0, 54012.0, 30464.0, 17699.0, 10559.0, 6479.0, 4008.0, 2544.0, 1666.0, 1089.0, 737.0, 506.0, 373.0, 240.0, 141.0, 90.0, 88.0, 43.0, 42.0, 29.0, 20.0, 9.0, 7.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.53955078125, -0.5234603881835938, -0.5073699951171875, -0.49127960205078125, -0.475189208984375, -0.45909881591796875, -0.4430084228515625, -0.42691802978515625, -0.41082763671875, -0.39473724365234375, -0.3786468505859375, -0.36255645751953125, -0.346466064453125, -0.33037567138671875, -0.3142852783203125, -0.29819488525390625, -0.2821044921875, -0.26601409912109375, -0.2499237060546875, -0.23383331298828125, -0.217742919921875, -0.20165252685546875, -0.1855621337890625, -0.16947174072265625, -0.15338134765625, -0.13729095458984375, -0.1212005615234375, -0.10511016845703125, -0.089019775390625, -0.07292938232421875, -0.0568389892578125, -0.04074859619140625, -0.024658203125, -0.00856781005859375, 0.0075225830078125, 0.02361297607421875, 0.039703369140625, 0.05579376220703125, 0.0718841552734375, 0.08797454833984375, 0.10406494140625, 0.12015533447265625, 0.1362457275390625, 0.15233612060546875, 0.168426513671875, 0.18451690673828125, 0.2006072998046875, 0.21669769287109375, 0.2327880859375, 0.24887847900390625, 0.2649688720703125, 0.28105926513671875, 0.297149658203125, 0.31324005126953125, 0.3293304443359375, 0.34542083740234375, 0.36151123046875, 0.37760162353515625, 0.3936920166015625, 0.40978240966796875, 0.425872802734375, 0.44196319580078125, 0.4580535888671875, 0.47414398193359375, 0.490234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 12.0, 7.0, 19.0, 17.0, 22.0, 30.0, 18.0, 41.0, 37.0, 56.0, 51.0, 54.0, 88.0, 65.0, 73.0, 65.0, 68.0, 44.0, 42.0, 27.0, 28.0, 23.0, 21.0, 11.0, 12.0, 15.0, 7.0, 8.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2783203125, -0.2678680419921875, -0.257415771484375, -0.2469635009765625, -0.23651123046875, -0.2260589599609375, -0.215606689453125, -0.2051544189453125, -0.1947021484375, -0.1842498779296875, -0.173797607421875, -0.1633453369140625, -0.15289306640625, -0.1424407958984375, -0.131988525390625, -0.1215362548828125, -0.111083984375, -0.1006317138671875, -0.090179443359375, -0.0797271728515625, -0.06927490234375, -0.0588226318359375, -0.048370361328125, -0.0379180908203125, -0.0274658203125, -0.0170135498046875, -0.006561279296875, 0.0038909912109375, 0.01434326171875, 0.0247955322265625, 0.035247802734375, 0.0457000732421875, 0.05615234375, 0.0666046142578125, 0.077056884765625, 0.0875091552734375, 0.09796142578125, 0.1084136962890625, 0.118865966796875, 0.1293182373046875, 0.1397705078125, 0.1502227783203125, 0.160675048828125, 0.1711273193359375, 0.18157958984375, 0.1920318603515625, 0.202484130859375, 0.2129364013671875, 0.223388671875, 0.2338409423828125, 0.244293212890625, 0.2547454833984375, 0.26519775390625, 0.2756500244140625, 0.286102294921875, 0.2965545654296875, 0.3070068359375, 0.3174591064453125, 0.327911376953125, 0.3383636474609375, 0.34881591796875, 0.3592681884765625, 0.369720458984375, 0.3801727294921875, 0.390625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 7.0, 18.0, 16.0, 26.0, 31.0, 46.0, 49.0, 48.0, 80.0, 70.0, 65.0, 74.0, 72.0, 72.0, 72.0, 52.0, 49.0, 30.0, 30.0, 19.0, 13.0, 16.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2333083152771, -5.998308181762695, -5.763307571411133, -5.52830696105957, -5.293306827545166, -5.058306694030762, -4.823306083679199, -4.588305473327637, -4.353305339813232, -4.118305206298828, -3.8833045959472656, -3.6483042240142822, -3.413303852081299, -3.1783034801483154, -2.943303108215332, -2.7083027362823486, -2.4733023643493652, -2.238301992416382, -2.0033016204833984, -1.768301248550415, -1.5333008766174316, -1.2983005046844482, -1.0633001327514648, -0.8282997608184814, -0.593299388885498, -0.35829901695251465, -0.12329864501953125, 0.11170172691345215, 0.34670209884643555, 0.581702470779419, 0.8167028427124023, 1.0517032146453857, 1.286703109741211, 1.5217034816741943, 1.7567038536071777, 1.9917042255401611, 2.2267045974731445, 2.461704969406128, 2.6967053413391113, 2.9317057132720947, 3.166706085205078, 3.4017064571380615, 3.636706829071045, 3.8717072010040283, 4.106707572937012, 4.341708183288574, 4.5767083168029785, 4.811708450317383, 5.046709060668945, 5.281709671020508, 5.516709804534912, 5.751709938049316, 5.986710548400879, 6.221711158752441, 6.456711292266846, 6.69171142578125, 6.9267120361328125, 7.161712646484375, 7.396712779998779, 7.631712913513184, 7.866713523864746, 8.101714134216309, 8.336713790893555, 8.571714401245117, 8.80671501159668]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 13.0, 19.0, 33.0, 29.0, 33.0, 24.0, 41.0, 39.0, 55.0, 38.0, 49.0, 39.0, 47.0, 40.0, 50.0, 29.0, 44.0, 35.0, 35.0, 24.0, 32.0, 32.0, 27.0, 27.0, 17.0, 20.0, 13.0, 8.0, 19.0, 7.0, 12.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.304595470428467, -4.1580305099487305, -4.011465072631836, -3.8649001121520996, -3.7183351516723633, -3.571769952774048, -3.4252047538757324, -3.278639793395996, -3.1320745944976807, -2.9855093955993652, -2.838944435119629, -2.6923792362213135, -2.545814037322998, -2.3992490768432617, -2.2526838779449463, -2.106118679046631, -1.9595537185668945, -1.8129886388778687, -1.6664235591888428, -1.5198583602905273, -1.3732932806015015, -1.2267282009124756, -1.0801630020141602, -0.9335979223251343, -0.7870328426361084, -0.6404677629470825, -0.49390262365341187, -0.3473375141620636, -0.20077240467071533, -0.05420732498168945, 0.0923578143119812, 0.23892295360565186, 0.38548755645751953, 0.5320526361465454, 0.6786177754402161, 0.8251829147338867, 0.9717479944229126, 1.1183130741119385, 1.264878273010254, 1.4114433526992798, 1.5580084323883057, 1.7045735120773315, 1.8511385917663574, 1.9977037906646729, 2.1442689895629883, 2.2908339500427246, 2.43739914894104, 2.5839643478393555, 2.730529308319092, 2.8770945072174072, 3.0236594676971436, 3.170224666595459, 3.3167896270751953, 3.4633548259735107, 3.609920024871826, 3.7564849853515625, 3.903050184249878, 4.049615383148193, 4.19618034362793, 4.342745304107666, 4.4893107414245605, 4.635875701904297, 4.782440662384033, 4.929006099700928, 5.075571060180664]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 16.0, 19.0, 31.0, 39.0, 76.0, 99.0, 154.0, 227.0, 352.0, 539.0, 796.0, 1295.0, 1919.0, 2953.0, 4726.0, 7163.0, 11233.0, 17176.0, 26680.0, 40126.0, 58488.0, 82887.0, 108401.0, 127656.0, 131114.0, 118378.0, 94883.0, 69800.0, 48561.0, 32503.0, 21137.0, 13791.0, 8782.0, 5722.0, 3807.0, 2408.0, 1656.0, 1032.0, 687.0, 424.0, 285.0, 173.0, 127.0, 77.0, 62.0, 36.0, 19.0, 15.0, 5.0, 10.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.76171875, -3.65185546875, -3.5419921875, -3.43212890625, -3.322265625, -3.21240234375, -3.1025390625, -2.99267578125, -2.8828125, -2.77294921875, -2.6630859375, -2.55322265625, -2.443359375, -2.33349609375, -2.2236328125, -2.11376953125, -2.00390625, -1.89404296875, -1.7841796875, -1.67431640625, -1.564453125, -1.45458984375, -1.3447265625, -1.23486328125, -1.125, -1.01513671875, -0.9052734375, -0.79541015625, -0.685546875, -0.57568359375, -0.4658203125, -0.35595703125, -0.24609375, -0.13623046875, -0.0263671875, 0.08349609375, 0.193359375, 0.30322265625, 0.4130859375, 0.52294921875, 0.6328125, 0.74267578125, 0.8525390625, 0.96240234375, 1.072265625, 1.18212890625, 1.2919921875, 1.40185546875, 1.51171875, 1.62158203125, 1.7314453125, 1.84130859375, 1.951171875, 2.06103515625, 2.1708984375, 2.28076171875, 2.390625, 2.50048828125, 2.6103515625, 2.72021484375, 2.830078125, 2.93994140625, 3.0498046875, 3.15966796875, 3.26953125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 10.0, 9.0, 17.0, 21.0, 18.0, 25.0, 48.0, 39.0, 34.0, 35.0, 36.0, 42.0, 35.0, 51.0, 53.0, 50.0, 41.0, 45.0, 32.0, 42.0, 32.0, 24.0, 33.0, 39.0, 23.0, 20.0, 19.0, 16.0, 13.0, 12.0, 17.0, 9.0, 7.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.2835693359375, -4.137451171875, -3.9913330078125, -3.84521484375, -3.6990966796875, -3.552978515625, -3.4068603515625, -3.2607421875, -3.1146240234375, -2.968505859375, -2.8223876953125, -2.67626953125, -2.5301513671875, -2.384033203125, -2.2379150390625, -2.091796875, -1.9456787109375, -1.799560546875, -1.6534423828125, -1.50732421875, -1.3612060546875, -1.215087890625, -1.0689697265625, -0.9228515625, -0.7767333984375, -0.630615234375, -0.4844970703125, -0.33837890625, -0.1922607421875, -0.046142578125, 0.0999755859375, 0.24609375, 0.3922119140625, 0.538330078125, 0.6844482421875, 0.83056640625, 0.9766845703125, 1.122802734375, 1.2689208984375, 1.4150390625, 1.5611572265625, 1.707275390625, 1.8533935546875, 1.99951171875, 2.1456298828125, 2.291748046875, 2.4378662109375, 2.583984375, 2.7301025390625, 2.876220703125, 3.0223388671875, 3.16845703125, 3.3145751953125, 3.460693359375, 3.6068115234375, 3.7529296875, 3.8990478515625, 4.045166015625, 4.1912841796875, 4.33740234375, 4.4835205078125, 4.629638671875, 4.7757568359375, 4.921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 7.0, 8.0, 18.0, 26.0, 33.0, 77.0, 99.0, 142.0, 220.0, 307.0, 549.0, 767.0, 1168.0, 2005.0, 3197.0, 5069.0, 8030.0, 13053.0, 21199.0, 34063.0, 54207.0, 80869.0, 113051.0, 140179.0, 147682.0, 131324.0, 100960.0, 69943.0, 45153.0, 28328.0, 17684.0, 11034.0, 6712.0, 4079.0, 2599.0, 1741.0, 1037.0, 676.0, 406.0, 306.0, 176.0, 129.0, 73.0, 54.0, 49.0, 15.0, 14.0, 12.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.83203125, -3.7203369140625, -3.608642578125, -3.4969482421875, -3.38525390625, -3.2735595703125, -3.161865234375, -3.0501708984375, -2.9384765625, -2.8267822265625, -2.715087890625, -2.6033935546875, -2.49169921875, -2.3800048828125, -2.268310546875, -2.1566162109375, -2.044921875, -1.9332275390625, -1.821533203125, -1.7098388671875, -1.59814453125, -1.4864501953125, -1.374755859375, -1.2630615234375, -1.1513671875, -1.0396728515625, -0.927978515625, -0.8162841796875, -0.70458984375, -0.5928955078125, -0.481201171875, -0.3695068359375, -0.2578125, -0.1461181640625, -0.034423828125, 0.0772705078125, 0.18896484375, 0.3006591796875, 0.412353515625, 0.5240478515625, 0.6357421875, 0.7474365234375, 0.859130859375, 0.9708251953125, 1.08251953125, 1.1942138671875, 1.305908203125, 1.4176025390625, 1.529296875, 1.6409912109375, 1.752685546875, 1.8643798828125, 1.97607421875, 2.0877685546875, 2.199462890625, 2.3111572265625, 2.4228515625, 2.5345458984375, 2.646240234375, 2.7579345703125, 2.86962890625, 2.9813232421875, 3.093017578125, 3.2047119140625, 3.31640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 6.0, 5.0, 8.0, 9.0, 17.0, 12.0, 8.0, 18.0, 20.0, 32.0, 28.0, 27.0, 45.0, 33.0, 27.0, 29.0, 35.0, 45.0, 43.0, 50.0, 36.0, 41.0, 55.0, 39.0, 44.0, 32.0, 29.0, 26.0, 31.0, 24.0, 24.0, 23.0, 15.0, 10.0, 15.0, 10.0, 7.0, 9.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.33203125, -4.212890625, -4.09375, -3.974609375, -3.85546875, -3.736328125, -3.6171875, -3.498046875, -3.37890625, -3.259765625, -3.140625, -3.021484375, -2.90234375, -2.783203125, -2.6640625, -2.544921875, -2.42578125, -2.306640625, -2.1875, -2.068359375, -1.94921875, -1.830078125, -1.7109375, -1.591796875, -1.47265625, -1.353515625, -1.234375, -1.115234375, -0.99609375, -0.876953125, -0.7578125, -0.638671875, -0.51953125, -0.400390625, -0.28125, -0.162109375, -0.04296875, 0.076171875, 0.1953125, 0.314453125, 0.43359375, 0.552734375, 0.671875, 0.791015625, 0.91015625, 1.029296875, 1.1484375, 1.267578125, 1.38671875, 1.505859375, 1.625, 1.744140625, 1.86328125, 1.982421875, 2.1015625, 2.220703125, 2.33984375, 2.458984375, 2.578125, 2.697265625, 2.81640625, 2.935546875, 3.0546875, 3.173828125, 3.29296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 17.0, 25.0, 27.0, 45.0, 72.0, 115.0, 161.0, 238.0, 433.0, 642.0, 1093.0, 1968.0, 3548.0, 7078.0, 15768.0, 40082.0, 113649.0, 311182.0, 338553.0, 133093.0, 46091.0, 17663.0, 7941.0, 3892.0, 2098.0, 1194.0, 708.0, 431.0, 267.0, 152.0, 112.0, 55.0, 39.0, 34.0, 25.0, 15.0, 11.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.0390625, -8.78131103515625, -8.5235595703125, -8.26580810546875, -8.008056640625, -7.75030517578125, -7.4925537109375, -7.23480224609375, -6.97705078125, -6.71929931640625, -6.4615478515625, -6.20379638671875, -5.946044921875, -5.68829345703125, -5.4305419921875, -5.17279052734375, -4.9150390625, -4.65728759765625, -4.3995361328125, -4.14178466796875, -3.884033203125, -3.62628173828125, -3.3685302734375, -3.11077880859375, -2.85302734375, -2.59527587890625, -2.3375244140625, -2.07977294921875, -1.822021484375, -1.56427001953125, -1.3065185546875, -1.04876708984375, -0.791015625, -0.53326416015625, -0.2755126953125, -0.01776123046875, 0.239990234375, 0.49774169921875, 0.7554931640625, 1.01324462890625, 1.27099609375, 1.52874755859375, 1.7864990234375, 2.04425048828125, 2.302001953125, 2.55975341796875, 2.8175048828125, 3.07525634765625, 3.3330078125, 3.59075927734375, 3.8485107421875, 4.10626220703125, 4.364013671875, 4.62176513671875, 4.8795166015625, 5.13726806640625, 5.39501953125, 5.65277099609375, 5.9105224609375, 6.16827392578125, 6.426025390625, 6.68377685546875, 6.9415283203125, 7.19927978515625, 7.45703125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 12.0, 8.0, 21.0, 15.0, 26.0, 31.0, 33.0, 47.0, 50.0, 54.0, 61.0, 60.0, 81.0, 68.0, 73.0, 67.0, 71.0, 52.0, 45.0, 28.0, 23.0, 22.0, 14.0, 13.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.000514984130859375, -0.0005029588937759399, -0.0004909336566925049, -0.0004789084196090698, -0.00046688318252563477, -0.0004548579454421997, -0.00044283270835876465, -0.0004308074712753296, -0.00041878223419189453, -0.00040675699710845947, -0.0003947317600250244, -0.00038270652294158936, -0.0003706812858581543, -0.00035865604877471924, -0.0003466308116912842, -0.0003346055746078491, -0.00032258033752441406, -0.000310555100440979, -0.00029852986335754395, -0.0002865046262741089, -0.00027447938919067383, -0.00026245415210723877, -0.0002504289150238037, -0.00023840367794036865, -0.0002263784408569336, -0.00021435320377349854, -0.00020232796669006348, -0.00019030272960662842, -0.00017827749252319336, -0.0001662522554397583, -0.00015422701835632324, -0.00014220178127288818, -0.00013017654418945312, -0.00011815130710601807, -0.00010612607002258301, -9.410083293914795e-05, -8.207559585571289e-05, -7.005035877227783e-05, -5.8025121688842773e-05, -4.5999884605407715e-05, -3.3974647521972656e-05, -2.1949410438537598e-05, -9.924173355102539e-06, 2.1010637283325195e-06, 1.4126300811767578e-05, 2.6151537895202637e-05, 3.8176774978637695e-05, 5.0202012062072754e-05, 6.222724914550781e-05, 7.425248622894287e-05, 8.627772331237793e-05, 9.830296039581299e-05, 0.00011032819747924805, 0.0001223534345626831, 0.00013437867164611816, 0.00014640390872955322, 0.00015842914581298828, 0.00017045438289642334, 0.0001824796199798584, 0.00019450485706329346, 0.00020653009414672852, 0.00021855533123016357, 0.00023058056831359863, 0.0002426058053970337, 0.00025463104248046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 17.0, 18.0, 23.0, 41.0, 62.0, 79.0, 117.0, 153.0, 227.0, 392.0, 591.0, 964.0, 1647.0, 3026.0, 6058.0, 13460.0, 34626.0, 99420.0, 255053.0, 342844.0, 181911.0, 64687.0, 23213.0, 9450.0, 4447.0, 2332.0, 1322.0, 811.0, 507.0, 312.0, 208.0, 149.0, 97.0, 84.0, 55.0, 48.0, 29.0, 18.0, 12.0, 10.0, 7.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0], "bins": [-7.71875, -7.506103515625, -7.29345703125, -7.080810546875, -6.8681640625, -6.655517578125, -6.44287109375, -6.230224609375, -6.017578125, -5.804931640625, -5.59228515625, -5.379638671875, -5.1669921875, -4.954345703125, -4.74169921875, -4.529052734375, -4.31640625, -4.103759765625, -3.89111328125, -3.678466796875, -3.4658203125, -3.253173828125, -3.04052734375, -2.827880859375, -2.615234375, -2.402587890625, -2.18994140625, -1.977294921875, -1.7646484375, -1.552001953125, -1.33935546875, -1.126708984375, -0.9140625, -0.701416015625, -0.48876953125, -0.276123046875, -0.0634765625, 0.149169921875, 0.36181640625, 0.574462890625, 0.787109375, 0.999755859375, 1.21240234375, 1.425048828125, 1.6376953125, 1.850341796875, 2.06298828125, 2.275634765625, 2.48828125, 2.700927734375, 2.91357421875, 3.126220703125, 3.3388671875, 3.551513671875, 3.76416015625, 3.976806640625, 4.189453125, 4.402099609375, 4.61474609375, 4.827392578125, 5.0400390625, 5.252685546875, 5.46533203125, 5.677978515625, 5.890625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 9.0, 4.0, 7.0, 4.0, 11.0, 12.0, 18.0, 25.0, 40.0, 61.0, 76.0, 108.0, 124.0, 110.0, 96.0, 82.0, 52.0, 42.0, 31.0, 18.0, 18.0, 7.0, 5.0, 6.0, 9.0, 2.0, 2.0, 1.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.99114990234375, -3.8533935546875, -3.71563720703125, -3.577880859375, -3.44012451171875, -3.3023681640625, -3.16461181640625, -3.02685546875, -2.88909912109375, -2.7513427734375, -2.61358642578125, -2.475830078125, -2.33807373046875, -2.2003173828125, -2.06256103515625, -1.9248046875, -1.78704833984375, -1.6492919921875, -1.51153564453125, -1.373779296875, -1.23602294921875, -1.0982666015625, -0.96051025390625, -0.82275390625, -0.68499755859375, -0.5472412109375, -0.40948486328125, -0.271728515625, -0.13397216796875, 0.0037841796875, 0.14154052734375, 0.279296875, 0.41705322265625, 0.5548095703125, 0.69256591796875, 0.830322265625, 0.96807861328125, 1.1058349609375, 1.24359130859375, 1.38134765625, 1.51910400390625, 1.6568603515625, 1.79461669921875, 1.932373046875, 2.07012939453125, 2.2078857421875, 2.34564208984375, 2.4833984375, 2.62115478515625, 2.7589111328125, 2.89666748046875, 3.034423828125, 3.17218017578125, 3.3099365234375, 3.44769287109375, 3.58544921875, 3.72320556640625, 3.8609619140625, 3.99871826171875, 4.136474609375, 4.27423095703125, 4.4119873046875, 4.54974365234375, 4.6875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 15.0, 9.0, 20.0, 21.0, 28.0, 22.0, 44.0, 51.0, 61.0, 61.0, 59.0, 61.0, 68.0, 77.0, 71.0, 60.0, 51.0, 47.0, 34.0, 20.0, 29.0, 17.0, 13.0, 14.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9219207763671875, -5.702857494354248, -5.48379373550415, -5.264730453491211, -5.0456671714782715, -4.826603889465332, -4.607540130615234, -4.388476848602295, -4.1694135665893555, -3.950350046157837, -3.7312867641448975, -3.512223243713379, -3.2931599617004395, -3.074096441268921, -2.8550329208374023, -2.635969638824463, -2.4169058799743652, -2.1978423595428467, -1.9787790775299072, -1.7597155570983887, -1.5406521558761597, -1.3215887546539307, -1.102525234222412, -0.8834618330001831, -0.6643984317779541, -0.4453350007534027, -0.22627156972885132, -0.007208108901977539, 0.21185529232025146, 0.43091869354248047, 0.649982213973999, 0.869045615196228, 1.088109016418457, 1.307172417640686, 1.526235818862915, 1.7452993392944336, 1.9643627405166626, 2.1834261417388916, 2.40248966217041, 2.6215529441833496, 2.840616464614868, 3.0596799850463867, 3.278743267059326, 3.4978067874908447, 3.7168703079223633, 3.9359335899353027, 4.154996871948242, 4.37406063079834, 4.593123912811279, 4.812187194824219, 5.031250953674316, 5.250314235687256, 5.469377517700195, 5.688441276550293, 5.907504558563232, 6.126567840576172, 6.3456315994262695, 6.564694881439209, 6.783758640289307, 7.002821922302246, 7.2218852043151855, 7.440948486328125, 7.660012245178223, 7.879075527191162, 8.098138809204102]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 6.0, 14.0, 14.0, 12.0, 23.0, 23.0, 23.0, 27.0, 30.0, 25.0, 29.0, 35.0, 29.0, 48.0, 23.0, 58.0, 35.0, 41.0, 46.0, 43.0, 46.0, 34.0, 32.0, 24.0, 31.0, 22.0, 26.0, 26.0, 26.0, 16.0, 16.0, 21.0, 10.0, 11.0, 12.0, 7.0, 8.0, 7.0, 4.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.201750755310059, -4.0681376457214355, -3.9345247745513916, -3.8009116649627686, -3.6672987937927246, -3.5336856842041016, -3.4000725746154785, -3.2664594650268555, -3.1328465938568115, -2.9992334842681885, -2.8656206130981445, -2.7320075035095215, -2.5983943939208984, -2.4647815227508545, -2.3311684131622314, -2.1975555419921875, -2.0639424324035645, -1.930329442024231, -1.7967164516448975, -1.6631033420562744, -1.529490351676941, -1.3958773612976074, -1.2622642517089844, -1.1286512613296509, -0.9950382709503174, -0.8614252805709839, -0.7278122305870056, -0.5941991806030273, -0.46058619022369385, -0.32697319984436035, -0.19336014986038208, -0.05974709987640381, 0.07386636734008789, 0.20747938752174377, 0.34109240770339966, 0.47470542788505554, 0.6083184480667114, 0.7419314384460449, 0.8755444884300232, 1.0091575384140015, 1.142770528793335, 1.2763835191726685, 1.409996509552002, 1.543609619140625, 1.6772226095199585, 1.810835599899292, 1.944448709487915, 2.078061580657959, 2.211674690246582, 2.345287799835205, 2.478900671005249, 2.612513780593872, 2.746126651763916, 2.879739761352539, 3.013352870941162, 3.146965980529785, 3.280578851699829, 3.414191961288452, 3.547804832458496, 3.681417942047119, 3.815031051635742, 3.948643922805786, 4.08225679397583, 4.215869903564453, 4.349483013153076]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 10.0, 12.0, 16.0, 22.0, 37.0, 59.0, 89.0, 121.0, 167.0, 238.0, 391.0, 587.0, 908.0, 1377.0, 2223.0, 3708.0, 6034.0, 10597.0, 18808.0, 35303.0, 69897.0, 148690.0, 331050.0, 717269.0, 1103106.0, 897387.0, 449642.0, 200628.0, 94093.0, 45803.0, 24388.0, 13014.0, 7266.0, 4379.0, 2643.0, 1582.0, 974.0, 599.0, 412.0, 275.0, 159.0, 113.0, 70.0, 48.0, 30.0, 18.0, 15.0, 13.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.39453125, -5.22430419921875, -5.0540771484375, -4.88385009765625, -4.713623046875, -4.54339599609375, -4.3731689453125, -4.20294189453125, -4.03271484375, -3.86248779296875, -3.6922607421875, -3.52203369140625, -3.351806640625, -3.18157958984375, -3.0113525390625, -2.84112548828125, -2.6708984375, -2.50067138671875, -2.3304443359375, -2.16021728515625, -1.989990234375, -1.81976318359375, -1.6495361328125, -1.47930908203125, -1.30908203125, -1.13885498046875, -0.9686279296875, -0.79840087890625, -0.628173828125, -0.45794677734375, -0.2877197265625, -0.11749267578125, 0.052734375, 0.22296142578125, 0.3931884765625, 0.56341552734375, 0.733642578125, 0.90386962890625, 1.0740966796875, 1.24432373046875, 1.41455078125, 1.58477783203125, 1.7550048828125, 1.92523193359375, 2.095458984375, 2.26568603515625, 2.4359130859375, 2.60614013671875, 2.7763671875, 2.94659423828125, 3.1168212890625, 3.28704833984375, 3.457275390625, 3.62750244140625, 3.7977294921875, 3.96795654296875, 4.13818359375, 4.30841064453125, 4.4786376953125, 4.64886474609375, 4.819091796875, 4.98931884765625, 5.1595458984375, 5.32977294921875, 5.5]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 11.0, 10.0, 13.0, 7.0, 14.0, 14.0, 21.0, 28.0, 27.0, 26.0, 31.0, 29.0, 35.0, 36.0, 28.0, 46.0, 29.0, 33.0, 40.0, 37.0, 36.0, 40.0, 33.0, 36.0, 29.0, 22.0, 29.0, 28.0, 30.0, 18.0, 16.0, 20.0, 16.0, 15.0, 23.0, 11.0, 14.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.49609375, -2.417938232421875, -2.33978271484375, -2.261627197265625, -2.1834716796875, -2.105316162109375, -2.02716064453125, -1.949005126953125, -1.870849609375, -1.792694091796875, -1.71453857421875, -1.636383056640625, -1.5582275390625, -1.480072021484375, -1.40191650390625, -1.323760986328125, -1.24560546875, -1.167449951171875, -1.08929443359375, -1.011138916015625, -0.9329833984375, -0.854827880859375, -0.77667236328125, -0.698516845703125, -0.620361328125, -0.542205810546875, -0.46405029296875, -0.385894775390625, -0.3077392578125, -0.229583740234375, -0.15142822265625, -0.073272705078125, 0.0048828125, 0.083038330078125, 0.16119384765625, 0.239349365234375, 0.3175048828125, 0.395660400390625, 0.47381591796875, 0.551971435546875, 0.630126953125, 0.708282470703125, 0.78643798828125, 0.864593505859375, 0.9427490234375, 1.020904541015625, 1.09906005859375, 1.177215576171875, 1.25537109375, 1.333526611328125, 1.41168212890625, 1.489837646484375, 1.5679931640625, 1.646148681640625, 1.72430419921875, 1.802459716796875, 1.880615234375, 1.958770751953125, 2.03692626953125, 2.115081787109375, 2.1932373046875, 2.271392822265625, 2.34954833984375, 2.427703857421875, 2.505859375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 12.0, 9.0, 20.0, 22.0, 38.0, 46.0, 54.0, 99.0, 161.0, 229.0, 346.0, 554.0, 899.0, 1479.0, 2338.0, 3986.0, 6904.0, 11790.0, 20967.0, 37055.0, 67625.0, 127072.0, 240662.0, 446529.0, 745203.0, 907245.0, 695983.0, 405284.0, 215979.0, 114646.0, 61573.0, 33689.0, 18992.0, 10794.0, 6277.0, 3759.0, 2219.0, 1406.0, 789.0, 553.0, 343.0, 220.0, 113.0, 98.0, 77.0, 48.0, 21.0, 14.0, 16.0, 11.0, 8.0, 9.0, 6.0, 7.0, 1.0, 4.0], "bins": [-5.015625, -4.86553955078125, -4.7154541015625, -4.56536865234375, -4.415283203125, -4.26519775390625, -4.1151123046875, -3.96502685546875, -3.81494140625, -3.66485595703125, -3.5147705078125, -3.36468505859375, -3.214599609375, -3.06451416015625, -2.9144287109375, -2.76434326171875, -2.6142578125, -2.46417236328125, -2.3140869140625, -2.16400146484375, -2.013916015625, -1.86383056640625, -1.7137451171875, -1.56365966796875, -1.41357421875, -1.26348876953125, -1.1134033203125, -0.96331787109375, -0.813232421875, -0.66314697265625, -0.5130615234375, -0.36297607421875, -0.212890625, -0.06280517578125, 0.0872802734375, 0.23736572265625, 0.387451171875, 0.53753662109375, 0.6876220703125, 0.83770751953125, 0.98779296875, 1.13787841796875, 1.2879638671875, 1.43804931640625, 1.588134765625, 1.73822021484375, 1.8883056640625, 2.03839111328125, 2.1884765625, 2.33856201171875, 2.4886474609375, 2.63873291015625, 2.788818359375, 2.93890380859375, 3.0889892578125, 3.23907470703125, 3.38916015625, 3.53924560546875, 3.6893310546875, 3.83941650390625, 3.989501953125, 4.13958740234375, 4.2896728515625, 4.43975830078125, 4.58984375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 8.0, 6.0, 4.0, 8.0, 15.0, 18.0, 18.0, 27.0, 50.0, 43.0, 51.0, 65.0, 76.0, 93.0, 90.0, 140.0, 177.0, 189.0, 201.0, 259.0, 242.0, 290.0, 265.0, 240.0, 219.0, 193.0, 201.0, 164.0, 132.0, 123.0, 101.0, 73.0, 74.0, 56.0, 44.0, 31.0, 27.0, 17.0, 18.0, 10.0, 4.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4921875, -1.444854736328125, -1.39752197265625, -1.350189208984375, -1.3028564453125, -1.255523681640625, -1.20819091796875, -1.160858154296875, -1.113525390625, -1.066192626953125, -1.01885986328125, -0.971527099609375, -0.9241943359375, -0.876861572265625, -0.82952880859375, -0.782196044921875, -0.73486328125, -0.687530517578125, -0.64019775390625, -0.592864990234375, -0.5455322265625, -0.498199462890625, -0.45086669921875, -0.403533935546875, -0.356201171875, -0.308868408203125, -0.26153564453125, -0.214202880859375, -0.1668701171875, -0.119537353515625, -0.07220458984375, -0.024871826171875, 0.0224609375, 0.069793701171875, 0.11712646484375, 0.164459228515625, 0.2117919921875, 0.259124755859375, 0.30645751953125, 0.353790283203125, 0.401123046875, 0.448455810546875, 0.49578857421875, 0.543121337890625, 0.5904541015625, 0.637786865234375, 0.68511962890625, 0.732452392578125, 0.77978515625, 0.827117919921875, 0.87445068359375, 0.921783447265625, 0.9691162109375, 1.016448974609375, 1.06378173828125, 1.111114501953125, 1.158447265625, 1.205780029296875, 1.25311279296875, 1.300445556640625, 1.3477783203125, 1.395111083984375, 1.44244384765625, 1.489776611328125, 1.537109375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 8.0, 14.0, 15.0, 27.0, 36.0, 30.0, 42.0, 55.0, 63.0, 65.0, 84.0, 81.0, 68.0, 54.0, 62.0, 52.0, 38.0, 35.0, 31.0, 29.0, 21.0, 15.0, 16.0, 15.0, 11.0, 3.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.318307876586914, -5.1266021728515625, -4.934896469116211, -4.743190765380859, -4.55148458480835, -4.359778881072998, -4.1680731773376465, -3.976367473602295, -3.7846615314483643, -3.5929558277130127, -3.401249885559082, -3.2095441818237305, -3.017838478088379, -2.8261325359344482, -2.6344268321990967, -2.442720890045166, -2.2510151863098145, -2.059309482574463, -1.8676035404205322, -1.6758978366851807, -1.4841920137405396, -1.2924861907958984, -1.1007804870605469, -0.9090746641159058, -0.7173688411712646, -0.5256630182266235, -0.3339572548866272, -0.14225149154663086, 0.049454331398010254, 0.24116015434265137, 0.43286585807800293, 0.624571681022644, 0.8162775039672852, 1.0079833269119263, 1.1996891498565674, 1.391394853591919, 1.58310067653656, 1.7748064994812012, 1.9665122032165527, 2.1582179069519043, 2.349923849105835, 2.5416295528411865, 2.733335494995117, 2.9250411987304688, 3.1167469024658203, 3.308452844619751, 3.5001585483551025, 3.691864490509033, 3.8835701942443848, 4.075275897979736, 4.266981601715088, 4.458687782287598, 4.650393486022949, 4.842099189758301, 5.033804893493652, 5.225510597229004, 5.4172163009643555, 5.608922004699707, 5.800627708435059, 5.99233341217041, 6.18403959274292, 6.3757452964782715, 6.567451000213623, 6.759156703948975, 6.950862884521484]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 2.0, 8.0, 5.0, 7.0, 19.0, 11.0, 18.0, 12.0, 20.0, 17.0, 32.0, 34.0, 19.0, 28.0, 31.0, 32.0, 42.0, 29.0, 37.0, 24.0, 45.0, 36.0, 24.0, 33.0, 36.0, 37.0, 43.0, 32.0, 34.0, 23.0, 28.0, 20.0, 21.0, 15.0, 24.0, 19.0, 11.0, 15.0, 9.0, 10.0, 12.0, 5.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.2040908336639404, -3.1065220832824707, -3.008953332901001, -2.9113845825195312, -2.8138160705566406, -2.716247320175171, -2.618678569793701, -2.5211098194122314, -2.4235410690307617, -2.325972318649292, -2.2284035682678223, -2.1308350563049316, -2.033266305923462, -1.9356975555419922, -1.8381288051605225, -1.7405600547790527, -1.642991542816162, -1.5454227924346924, -1.4478541612625122, -1.3502854108810425, -1.2527167797088623, -1.1551480293273926, -1.0575792789459229, -0.9600105881690979, -0.862441897392273, -0.764873206615448, -0.667304515838623, -0.5697357654571533, -0.47216707468032837, -0.3745983839035034, -0.2770296335220337, -0.17946094274520874, -0.08189201354980469, 0.015676692128181458, 0.1132453978061676, 0.21081411838531494, 0.3083828091621399, 0.40595149993896484, 0.5035202503204346, 0.6010889410972595, 0.6986576318740845, 0.7962263226509094, 0.8937950134277344, 0.9913637638092041, 1.0889325141906738, 1.186501145362854, 1.2840698957443237, 1.381638526916504, 1.4792072772979736, 1.5767760276794434, 1.6743446588516235, 1.7719134092330933, 1.8694820404052734, 1.9670507907867432, 2.064619541168213, 2.1621882915496826, 2.2597570419311523, 2.357325792312622, 2.454894542694092, 2.5524630546569824, 2.650031805038452, 2.747600555419922, 2.8451693058013916, 2.9427380561828613, 3.040306568145752]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 26.0, 19.0, 39.0, 73.0, 119.0, 184.0, 316.0, 499.0, 846.0, 1528.0, 2853.0, 5200.0, 9820.0, 19282.0, 39256.0, 78906.0, 152554.0, 239338.0, 225355.0, 134413.0, 68508.0, 33800.0, 16820.0, 8670.0, 4400.0, 2448.0, 1355.0, 768.0, 458.0, 257.0, 138.0, 92.0, 68.0, 50.0, 24.0, 18.0, 11.0, 13.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8952713012695312, -0.8672027587890625, -0.8391342163085938, -0.811065673828125, -0.7829971313476562, -0.7549285888671875, -0.7268600463867188, -0.69879150390625, -0.6707229614257812, -0.6426544189453125, -0.6145858764648438, -0.586517333984375, -0.5584487915039062, -0.5303802490234375, -0.5023117065429688, -0.4742431640625, -0.44617462158203125, -0.4181060791015625, -0.39003753662109375, -0.361968994140625, -0.33390045166015625, -0.3058319091796875, -0.27776336669921875, -0.24969482421875, -0.22162628173828125, -0.1935577392578125, -0.16548919677734375, -0.137420654296875, -0.10935211181640625, -0.0812835693359375, -0.05321502685546875, -0.025146484375, 0.00292205810546875, 0.0309906005859375, 0.05905914306640625, 0.087127685546875, 0.11519622802734375, 0.1432647705078125, 0.17133331298828125, 0.19940185546875, 0.22747039794921875, 0.2555389404296875, 0.28360748291015625, 0.311676025390625, 0.33974456787109375, 0.3678131103515625, 0.39588165283203125, 0.4239501953125, 0.45201873779296875, 0.4800872802734375, 0.5081558227539062, 0.536224365234375, 0.5642929077148438, 0.5923614501953125, 0.6204299926757812, 0.64849853515625, 0.6765670776367188, 0.7046356201171875, 0.7327041625976562, 0.760772705078125, 0.7888412475585938, 0.8169097900390625, 0.8449783325195312, 0.873046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 9.0, 11.0, 13.0, 17.0, 28.0, 19.0, 10.0, 23.0, 20.0, 20.0, 37.0, 40.0, 31.0, 33.0, 22.0, 32.0, 38.0, 34.0, 34.0, 40.0, 31.0, 40.0, 27.0, 34.0, 36.0, 23.0, 34.0, 23.0, 39.0, 20.0, 30.0, 23.0, 8.0, 14.0, 11.0, 16.0, 5.0, 12.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.197265625, -3.09100341796875, -2.9847412109375, -2.87847900390625, -2.772216796875, -2.66595458984375, -2.5596923828125, -2.45343017578125, -2.34716796875, -2.24090576171875, -2.1346435546875, -2.02838134765625, -1.922119140625, -1.81585693359375, -1.7095947265625, -1.60333251953125, -1.4970703125, -1.39080810546875, -1.2845458984375, -1.17828369140625, -1.072021484375, -0.96575927734375, -0.8594970703125, -0.75323486328125, -0.64697265625, -0.54071044921875, -0.4344482421875, -0.32818603515625, -0.221923828125, -0.11566162109375, -0.0093994140625, 0.09686279296875, 0.203125, 0.30938720703125, 0.4156494140625, 0.52191162109375, 0.628173828125, 0.73443603515625, 0.8406982421875, 0.94696044921875, 1.05322265625, 1.15948486328125, 1.2657470703125, 1.37200927734375, 1.478271484375, 1.58453369140625, 1.6907958984375, 1.79705810546875, 1.9033203125, 2.00958251953125, 2.1158447265625, 2.22210693359375, 2.328369140625, 2.43463134765625, 2.5408935546875, 2.64715576171875, 2.75341796875, 2.85968017578125, 2.9659423828125, 3.07220458984375, 3.178466796875, 3.28472900390625, 3.3909912109375, 3.49725341796875, 3.603515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 11.0, 13.0, 11.0, 27.0, 27.0, 41.0, 62.0, 87.0, 120.0, 204.0, 284.0, 429.0, 727.0, 1165.0, 2045.0, 4039.0, 8765.0, 21462.0, 107276.0, 835929.0, 39045.0, 13580.0, 6064.0, 2930.0, 1614.0, 955.0, 513.0, 345.0, 222.0, 142.0, 117.0, 80.0, 54.0, 32.0, 34.0, 34.0, 16.0, 11.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.708984375, -2.632171630859375, -2.55535888671875, -2.478546142578125, -2.4017333984375, -2.324920654296875, -2.24810791015625, -2.171295166015625, -2.094482421875, -2.017669677734375, -1.94085693359375, -1.864044189453125, -1.7872314453125, -1.710418701171875, -1.63360595703125, -1.556793212890625, -1.47998046875, -1.403167724609375, -1.32635498046875, -1.249542236328125, -1.1727294921875, -1.095916748046875, -1.01910400390625, -0.942291259765625, -0.865478515625, -0.788665771484375, -0.71185302734375, -0.635040283203125, -0.5582275390625, -0.481414794921875, -0.40460205078125, -0.327789306640625, -0.2509765625, -0.174163818359375, -0.09735107421875, -0.020538330078125, 0.0562744140625, 0.133087158203125, 0.20989990234375, 0.286712646484375, 0.363525390625, 0.440338134765625, 0.51715087890625, 0.593963623046875, 0.6707763671875, 0.747589111328125, 0.82440185546875, 0.901214599609375, 0.97802734375, 1.054840087890625, 1.13165283203125, 1.208465576171875, 1.2852783203125, 1.362091064453125, 1.43890380859375, 1.515716552734375, 1.592529296875, 1.669342041015625, 1.74615478515625, 1.822967529296875, 1.8997802734375, 1.976593017578125, 2.05340576171875, 2.130218505859375, 2.20703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 7.0, 6.0, 10.0, 10.0, 8.0, 17.0, 18.0, 20.0, 19.0, 24.0, 32.0, 36.0, 40.0, 42.0, 41.0, 39.0, 55.0, 49.0, 45.0, 47.0, 49.0, 50.0, 40.0, 44.0, 37.0, 36.0, 30.0, 34.0, 13.0, 20.0, 10.0, 16.0, 16.0, 11.0, 4.0, 5.0, 2.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.467315673828125, -4.33306884765625, -4.198822021484375, -4.0645751953125, -3.930328369140625, -3.79608154296875, -3.661834716796875, -3.527587890625, -3.393341064453125, -3.25909423828125, -3.124847412109375, -2.9906005859375, -2.856353759765625, -2.72210693359375, -2.587860107421875, -2.45361328125, -2.319366455078125, -2.18511962890625, -2.050872802734375, -1.9166259765625, -1.782379150390625, -1.64813232421875, -1.513885498046875, -1.379638671875, -1.245391845703125, -1.11114501953125, -0.976898193359375, -0.8426513671875, -0.708404541015625, -0.57415771484375, -0.439910888671875, -0.3056640625, -0.171417236328125, -0.03717041015625, 0.097076416015625, 0.2313232421875, 0.365570068359375, 0.49981689453125, 0.634063720703125, 0.768310546875, 0.902557373046875, 1.03680419921875, 1.171051025390625, 1.3052978515625, 1.439544677734375, 1.57379150390625, 1.708038330078125, 1.84228515625, 1.976531982421875, 2.11077880859375, 2.245025634765625, 2.3792724609375, 2.513519287109375, 2.64776611328125, 2.782012939453125, 2.916259765625, 3.050506591796875, 3.18475341796875, 3.319000244140625, 3.4532470703125, 3.587493896484375, 3.72174072265625, 3.855987548828125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 10.0, 9.0, 15.0, 24.0, 29.0, 34.0, 46.0, 76.0, 119.0, 184.0, 270.0, 432.0, 632.0, 942.0, 1477.0, 2401.0, 3956.0, 6728.0, 12622.0, 28406.0, 787769.0, 152518.0, 22975.0, 10927.0, 5982.0, 3704.0, 2201.0, 1322.0, 894.0, 617.0, 397.0, 280.0, 168.0, 117.0, 87.0, 48.0, 35.0, 32.0, 27.0, 14.0, 9.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03515625, -1.0016326904296875, -0.968109130859375, -0.9345855712890625, -0.90106201171875, -0.8675384521484375, -0.834014892578125, -0.8004913330078125, -0.7669677734375, -0.7334442138671875, -0.699920654296875, -0.6663970947265625, -0.63287353515625, -0.5993499755859375, -0.565826416015625, -0.5323028564453125, -0.498779296875, -0.4652557373046875, -0.431732177734375, -0.3982086181640625, -0.36468505859375, -0.3311614990234375, -0.297637939453125, -0.2641143798828125, -0.2305908203125, -0.1970672607421875, -0.163543701171875, -0.1300201416015625, -0.09649658203125, -0.0629730224609375, -0.029449462890625, 0.0040740966796875, 0.03759765625, 0.0711212158203125, 0.104644775390625, 0.1381683349609375, 0.17169189453125, 0.2052154541015625, 0.238739013671875, 0.2722625732421875, 0.3057861328125, 0.3393096923828125, 0.372833251953125, 0.4063568115234375, 0.43988037109375, 0.4734039306640625, 0.506927490234375, 0.5404510498046875, 0.573974609375, 0.6074981689453125, 0.641021728515625, 0.6745452880859375, 0.70806884765625, 0.7415924072265625, 0.775115966796875, 0.8086395263671875, 0.8421630859375, 0.8756866455078125, 0.909210205078125, 0.9427337646484375, 0.97625732421875, 1.0097808837890625, 1.043304443359375, 1.0768280029296875, 1.1103515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 6.0, 5.0, 6.0, 4.0, 12.0, 15.0, 24.0, 38.0, 66.0, 93.0, 110.0, 115.0, 130.0, 110.0, 95.0, 52.0, 37.0, 24.0, 14.0, 7.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.7738037109375e-05, -8.535012602806091e-05, -8.296221494674683e-05, -8.057430386543274e-05, -7.818639278411865e-05, -7.579848170280457e-05, -7.341057062149048e-05, -7.102265954017639e-05, -6.86347484588623e-05, -6.624683737754822e-05, -6.385892629623413e-05, -6.147101521492004e-05, -5.908310413360596e-05, -5.669519305229187e-05, -5.430728197097778e-05, -5.1919370889663696e-05, -4.953145980834961e-05, -4.714354872703552e-05, -4.4755637645721436e-05, -4.236772656440735e-05, -3.997981548309326e-05, -3.7591904401779175e-05, -3.520399332046509e-05, -3.2816082239151e-05, -3.0428171157836914e-05, -2.8040260076522827e-05, -2.565234899520874e-05, -2.3264437913894653e-05, -2.0876526832580566e-05, -1.848861575126648e-05, -1.6100704669952393e-05, -1.3712793588638306e-05, -1.1324882507324219e-05, -8.936971426010132e-06, -6.549060344696045e-06, -4.161149263381958e-06, -1.773238182067871e-06, 6.146728992462158e-07, 3.0025839805603027e-06, 5.39049506187439e-06, 7.778406143188477e-06, 1.0166317224502563e-05, 1.255422830581665e-05, 1.4942139387130737e-05, 1.7330050468444824e-05, 1.971796154975891e-05, 2.2105872631072998e-05, 2.4493783712387085e-05, 2.6881694793701172e-05, 2.926960587501526e-05, 3.1657516956329346e-05, 3.404542803764343e-05, 3.643333911895752e-05, 3.8821250200271606e-05, 4.120916128158569e-05, 4.359707236289978e-05, 4.598498344421387e-05, 4.8372894525527954e-05, 5.076080560684204e-05, 5.314871668815613e-05, 5.5536627769470215e-05, 5.79245388507843e-05, 6.031244993209839e-05, 6.270036101341248e-05, 6.508827209472656e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 8.0, 9.0, 14.0, 18.0, 19.0, 27.0, 50.0, 61.0, 84.0, 105.0, 184.0, 228.0, 347.0, 530.0, 720.0, 1107.0, 1709.0, 2713.0, 4352.0, 7331.0, 12446.0, 22368.0, 42006.0, 84907.0, 178772.0, 292808.0, 197128.0, 93713.0, 46410.0, 24195.0, 13353.0, 7757.0, 4615.0, 2877.0, 1828.0, 1177.0, 766.0, 532.0, 375.0, 269.0, 177.0, 120.0, 90.0, 74.0, 51.0, 42.0, 28.0, 9.0, 17.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0], "bins": [-0.356689453125, -0.34539031982421875, -0.3340911865234375, -0.32279205322265625, -0.311492919921875, -0.30019378662109375, -0.2888946533203125, -0.27759552001953125, -0.26629638671875, -0.25499725341796875, -0.2436981201171875, -0.23239898681640625, -0.221099853515625, -0.20980072021484375, -0.1985015869140625, -0.18720245361328125, -0.1759033203125, -0.16460418701171875, -0.1533050537109375, -0.14200592041015625, -0.130706787109375, -0.11940765380859375, -0.1081085205078125, -0.09680938720703125, -0.08551025390625, -0.07421112060546875, -0.0629119873046875, -0.05161285400390625, -0.040313720703125, -0.02901458740234375, -0.0177154541015625, -0.00641632080078125, 0.0048828125, 0.01618194580078125, 0.0274810791015625, 0.03878021240234375, 0.050079345703125, 0.06137847900390625, 0.0726776123046875, 0.08397674560546875, 0.09527587890625, 0.10657501220703125, 0.1178741455078125, 0.12917327880859375, 0.140472412109375, 0.15177154541015625, 0.1630706787109375, 0.17436981201171875, 0.1856689453125, 0.19696807861328125, 0.2082672119140625, 0.21956634521484375, 0.230865478515625, 0.24216461181640625, 0.2534637451171875, 0.26476287841796875, 0.27606201171875, 0.28736114501953125, 0.2986602783203125, 0.30995941162109375, 0.321258544921875, 0.33255767822265625, 0.3438568115234375, 0.35515594482421875, 0.366455078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 4.0, 5.0, 9.0, 8.0, 9.0, 7.0, 12.0, 13.0, 32.0, 21.0, 23.0, 38.0, 30.0, 56.0, 76.0, 85.0, 85.0, 89.0, 64.0, 69.0, 43.0, 34.0, 27.0, 28.0, 26.0, 28.0, 17.0, 13.0, 5.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24890899658203125, -0.2402496337890625, -0.23159027099609375, -0.222930908203125, -0.21427154541015625, -0.2056121826171875, -0.19695281982421875, -0.18829345703125, -0.17963409423828125, -0.1709747314453125, -0.16231536865234375, -0.153656005859375, -0.14499664306640625, -0.1363372802734375, -0.12767791748046875, -0.1190185546875, -0.11035919189453125, -0.1016998291015625, -0.09304046630859375, -0.084381103515625, -0.07572174072265625, -0.0670623779296875, -0.05840301513671875, -0.04974365234375, -0.04108428955078125, -0.0324249267578125, -0.02376556396484375, -0.015106201171875, -0.00644683837890625, 0.0022125244140625, 0.01087188720703125, 0.01953125, 0.02819061279296875, 0.0368499755859375, 0.04550933837890625, 0.054168701171875, 0.06282806396484375, 0.0714874267578125, 0.08014678955078125, 0.08880615234375, 0.09746551513671875, 0.1061248779296875, 0.11478424072265625, 0.123443603515625, 0.13210296630859375, 0.1407623291015625, 0.14942169189453125, 0.1580810546875, 0.16674041748046875, 0.1753997802734375, 0.18405914306640625, 0.192718505859375, 0.20137786865234375, 0.2100372314453125, 0.21869659423828125, 0.22735595703125, 0.23601531982421875, 0.2446746826171875, 0.25333404541015625, 0.261993408203125, 0.27065277099609375, 0.2793121337890625, 0.28797149658203125, 0.296630859375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 6.0, 5.0, 16.0, 14.0, 20.0, 28.0, 37.0, 32.0, 55.0, 52.0, 71.0, 84.0, 64.0, 84.0, 53.0, 65.0, 56.0, 40.0, 37.0, 39.0, 27.0, 21.0, 23.0, 10.0, 17.0, 13.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.360625743865967, -5.171506881713867, -4.982387542724609, -4.79326868057251, -4.60414981842041, -4.4150309562683105, -4.225912094116211, -4.036792755126953, -3.8476738929748535, -3.658555030822754, -3.469435930252075, -3.2803168296813965, -3.091197967529297, -2.9020791053771973, -2.7129600048065186, -2.52384090423584, -2.3347220420837402, -2.1456031799316406, -1.956484079360962, -1.7673650979995728, -1.5782461166381836, -1.3891271352767944, -1.2000081539154053, -1.0108891725540161, -0.821770191192627, -0.6326512098312378, -0.44353222846984863, -0.2544132471084595, -0.06529426574707031, 0.12382471561431885, 0.312943696975708, 0.5020626783370972, 0.6911821365356445, 0.8803011178970337, 1.0694200992584229, 1.258539080619812, 1.4476580619812012, 1.6367770433425903, 1.8258960247039795, 2.015015125274658, 2.204133987426758, 2.3932528495788574, 2.582371950149536, 2.771491050720215, 2.9606099128723145, 3.149728775024414, 3.3388478755950928, 3.5279669761657715, 3.717085838317871, 3.9062047004699707, 4.09532356262207, 4.284442901611328, 4.473561763763428, 4.662680625915527, 4.851799964904785, 5.040918827056885, 5.230037689208984, 5.419156551361084, 5.608275413513184, 5.797394752502441, 5.986513614654541, 6.175632476806641, 6.364751815795898, 6.553870677947998, 6.742989540100098]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 2.0, 8.0, 5.0, 7.0, 10.0, 12.0, 16.0, 11.0, 24.0, 20.0, 27.0, 23.0, 33.0, 31.0, 21.0, 35.0, 31.0, 31.0, 25.0, 35.0, 44.0, 32.0, 35.0, 34.0, 28.0, 37.0, 38.0, 36.0, 36.0, 34.0, 19.0, 24.0, 28.0, 19.0, 21.0, 16.0, 18.0, 12.0, 14.0, 6.0, 14.0, 10.0, 3.0, 7.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-3.0880866050720215, -2.992785692214966, -2.8974850177764893, -2.8021841049194336, -2.706883192062378, -2.6115822792053223, -2.5162816047668457, -2.42098069190979, -2.3256797790527344, -2.2303788661956787, -2.135078191757202, -2.0397772789001465, -1.9444763660430908, -1.8491755723953247, -1.7538747787475586, -1.658573865890503, -1.5632731914520264, -1.4679723978042603, -1.3726714849472046, -1.2773706912994385, -1.1820697784423828, -1.0867689847946167, -0.9914681911468506, -0.8961673378944397, -0.8008664846420288, -0.7055656313896179, -0.610264778137207, -0.5149639844894409, -0.41966313123703003, -0.32436227798461914, -0.22906148433685303, -0.13376063108444214, -0.03845977783203125, 0.056841060519218445, 0.15214189887046814, 0.24744272232055664, 0.34274357557296753, 0.4380444288253784, 0.5333452224731445, 0.6286460757255554, 0.7239469289779663, 0.8192477822303772, 0.9145486354827881, 1.0098494291305542, 1.1051502227783203, 1.200451135635376, 1.295751929283142, 1.3910527229309082, 1.4863536357879639, 1.58165442943573, 1.6769553422927856, 1.7722561359405518, 1.8675570487976074, 1.9628578424453735, 2.0581586360931396, 2.1534595489501953, 2.248760223388672, 2.3440611362457275, 2.439361810684204, 2.5346627235412598, 2.6299636363983154, 2.725264549255371, 2.8205652236938477, 2.9158661365509033, 3.011167049407959]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 0.0, 6.0, 11.0, 13.0, 22.0, 22.0, 47.0, 81.0, 110.0, 171.0, 302.0, 524.0, 936.0, 1580.0, 3029.0, 5480.0, 10103.0, 19143.0, 35976.0, 65418.0, 112024.0, 165511.0, 192244.0, 169839.0, 116472.0, 68522.0, 37525.0, 19848.0, 10635.0, 5743.0, 3177.0, 1670.0, 959.0, 541.0, 312.0, 188.0, 136.0, 87.0, 47.0, 32.0, 23.0, 13.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.2421875, -4.09857177734375, -3.9549560546875, -3.81134033203125, -3.667724609375, -3.52410888671875, -3.3804931640625, -3.23687744140625, -3.09326171875, -2.94964599609375, -2.8060302734375, -2.66241455078125, -2.518798828125, -2.37518310546875, -2.2315673828125, -2.08795166015625, -1.9443359375, -1.80072021484375, -1.6571044921875, -1.51348876953125, -1.369873046875, -1.22625732421875, -1.0826416015625, -0.93902587890625, -0.79541015625, -0.65179443359375, -0.5081787109375, -0.36456298828125, -0.220947265625, -0.07733154296875, 0.0662841796875, 0.20989990234375, 0.353515625, 0.49713134765625, 0.6407470703125, 0.78436279296875, 0.927978515625, 1.07159423828125, 1.2152099609375, 1.35882568359375, 1.50244140625, 1.64605712890625, 1.7896728515625, 1.93328857421875, 2.076904296875, 2.22052001953125, 2.3641357421875, 2.50775146484375, 2.6513671875, 2.79498291015625, 2.9385986328125, 3.08221435546875, 3.225830078125, 3.36944580078125, 3.5130615234375, 3.65667724609375, 3.80029296875, 3.94390869140625, 4.0875244140625, 4.23114013671875, 4.374755859375, 4.51837158203125, 4.6619873046875, 4.80560302734375, 4.94921875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 12.0, 7.0, 17.0, 12.0, 22.0, 19.0, 22.0, 19.0, 28.0, 37.0, 29.0, 34.0, 47.0, 46.0, 32.0, 40.0, 34.0, 34.0, 40.0, 48.0, 40.0, 42.0, 46.0, 37.0, 41.0, 24.0, 25.0, 22.0, 20.0, 20.0, 19.0, 12.0, 15.0, 9.0, 6.0, 10.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.125, -3.00823974609375, -2.8914794921875, -2.77471923828125, -2.657958984375, -2.54119873046875, -2.4244384765625, -2.30767822265625, -2.19091796875, -2.07415771484375, -1.9573974609375, -1.84063720703125, -1.723876953125, -1.60711669921875, -1.4903564453125, -1.37359619140625, -1.2568359375, -1.14007568359375, -1.0233154296875, -0.90655517578125, -0.789794921875, -0.67303466796875, -0.5562744140625, -0.43951416015625, -0.32275390625, -0.20599365234375, -0.0892333984375, 0.02752685546875, 0.144287109375, 0.26104736328125, 0.3778076171875, 0.49456787109375, 0.611328125, 0.72808837890625, 0.8448486328125, 0.96160888671875, 1.078369140625, 1.19512939453125, 1.3118896484375, 1.42864990234375, 1.54541015625, 1.66217041015625, 1.7789306640625, 1.89569091796875, 2.012451171875, 2.12921142578125, 2.2459716796875, 2.36273193359375, 2.4794921875, 2.59625244140625, 2.7130126953125, 2.82977294921875, 2.946533203125, 3.06329345703125, 3.1800537109375, 3.29681396484375, 3.41357421875, 3.53033447265625, 3.6470947265625, 3.76385498046875, 3.880615234375, 3.99737548828125, 4.1141357421875, 4.23089599609375, 4.34765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 12.0, 13.0, 22.0, 35.0, 35.0, 68.0, 101.0, 170.0, 219.0, 366.0, 573.0, 858.0, 1310.0, 2150.0, 3342.0, 5456.0, 8890.0, 15337.0, 26202.0, 44065.0, 72350.0, 110534.0, 149037.0, 166005.0, 149346.0, 110605.0, 72066.0, 43999.0, 26066.0, 15193.0, 9332.0, 5405.0, 3574.0, 2133.0, 1273.0, 851.0, 529.0, 320.0, 246.0, 146.0, 91.0, 65.0, 40.0, 43.0, 24.0, 15.0, 15.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.521270751953125, -3.40582275390625, -3.290374755859375, -3.1749267578125, -3.059478759765625, -2.94403076171875, -2.828582763671875, -2.713134765625, -2.597686767578125, -2.48223876953125, -2.366790771484375, -2.2513427734375, -2.135894775390625, -2.02044677734375, -1.904998779296875, -1.78955078125, -1.674102783203125, -1.55865478515625, -1.443206787109375, -1.3277587890625, -1.212310791015625, -1.09686279296875, -0.981414794921875, -0.865966796875, -0.750518798828125, -0.63507080078125, -0.519622802734375, -0.4041748046875, -0.288726806640625, -0.17327880859375, -0.057830810546875, 0.0576171875, 0.173065185546875, 0.28851318359375, 0.403961181640625, 0.5194091796875, 0.634857177734375, 0.75030517578125, 0.865753173828125, 0.981201171875, 1.096649169921875, 1.21209716796875, 1.327545166015625, 1.4429931640625, 1.558441162109375, 1.67388916015625, 1.789337158203125, 1.90478515625, 2.020233154296875, 2.13568115234375, 2.251129150390625, 2.3665771484375, 2.482025146484375, 2.59747314453125, 2.712921142578125, 2.828369140625, 2.943817138671875, 3.05926513671875, 3.174713134765625, 3.2901611328125, 3.405609130859375, 3.52105712890625, 3.636505126953125, 3.751953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 14.0, 13.0, 8.0, 15.0, 16.0, 24.0, 13.0, 26.0, 29.0, 23.0, 25.0, 31.0, 26.0, 36.0, 41.0, 41.0, 37.0, 35.0, 36.0, 47.0, 37.0, 37.0, 38.0, 35.0, 37.0, 37.0, 34.0, 27.0, 26.0, 31.0, 20.0, 16.0, 15.0, 7.0, 16.0, 13.0, 10.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.383148193359375, -2.30340576171875, -2.223663330078125, -2.1439208984375, -2.064178466796875, -1.98443603515625, -1.904693603515625, -1.824951171875, -1.745208740234375, -1.66546630859375, -1.585723876953125, -1.5059814453125, -1.426239013671875, -1.34649658203125, -1.266754150390625, -1.18701171875, -1.107269287109375, -1.02752685546875, -0.947784423828125, -0.8680419921875, -0.788299560546875, -0.70855712890625, -0.628814697265625, -0.549072265625, -0.469329833984375, -0.38958740234375, -0.309844970703125, -0.2301025390625, -0.150360107421875, -0.07061767578125, 0.009124755859375, 0.0888671875, 0.168609619140625, 0.24835205078125, 0.328094482421875, 0.4078369140625, 0.487579345703125, 0.56732177734375, 0.647064208984375, 0.726806640625, 0.806549072265625, 0.88629150390625, 0.966033935546875, 1.0457763671875, 1.125518798828125, 1.20526123046875, 1.285003662109375, 1.36474609375, 1.444488525390625, 1.52423095703125, 1.603973388671875, 1.6837158203125, 1.763458251953125, 1.84320068359375, 1.922943115234375, 2.002685546875, 2.082427978515625, 2.16217041015625, 2.241912841796875, 2.3216552734375, 2.401397705078125, 2.48114013671875, 2.560882568359375, 2.640625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 10.0, 12.0, 5.0, 16.0, 27.0, 38.0, 49.0, 108.0, 120.0, 193.0, 252.0, 409.0, 656.0, 1085.0, 1909.0, 3168.0, 5830.0, 11121.0, 23458.0, 49758.0, 105314.0, 203392.0, 265370.0, 190279.0, 96457.0, 44835.0, 21162.0, 10466.0, 5481.0, 3107.0, 1652.0, 998.0, 633.0, 388.0, 275.0, 169.0, 120.0, 71.0, 42.0, 33.0, 23.0, 16.0, 12.0, 16.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.748046875, -3.624908447265625, -3.50177001953125, -3.378631591796875, -3.2554931640625, -3.132354736328125, -3.00921630859375, -2.886077880859375, -2.762939453125, -2.639801025390625, -2.51666259765625, -2.393524169921875, -2.2703857421875, -2.147247314453125, -2.02410888671875, -1.900970458984375, -1.77783203125, -1.654693603515625, -1.53155517578125, -1.408416748046875, -1.2852783203125, -1.162139892578125, -1.03900146484375, -0.915863037109375, -0.792724609375, -0.669586181640625, -0.54644775390625, -0.423309326171875, -0.3001708984375, -0.177032470703125, -0.05389404296875, 0.069244384765625, 0.1923828125, 0.315521240234375, 0.43865966796875, 0.561798095703125, 0.6849365234375, 0.808074951171875, 0.93121337890625, 1.054351806640625, 1.177490234375, 1.300628662109375, 1.42376708984375, 1.546905517578125, 1.6700439453125, 1.793182373046875, 1.91632080078125, 2.039459228515625, 2.16259765625, 2.285736083984375, 2.40887451171875, 2.532012939453125, 2.6551513671875, 2.778289794921875, 2.90142822265625, 3.024566650390625, 3.147705078125, 3.270843505859375, 3.39398193359375, 3.517120361328125, 3.6402587890625, 3.763397216796875, 3.88653564453125, 4.009674072265625, 4.1328125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 4.0, 12.0, 13.0, 12.0, 17.0, 15.0, 26.0, 22.0, 25.0, 34.0, 35.0, 47.0, 36.0, 57.0, 58.0, 52.0, 47.0, 72.0, 48.0, 60.0, 47.0, 33.0, 46.0, 34.0, 23.0, 23.0, 22.0, 12.0, 16.0, 5.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.000209808349609375, -0.00020260736346244812, -0.00019540637731552124, -0.00018820539116859436, -0.00018100440502166748, -0.0001738034188747406, -0.00016660243272781372, -0.00015940144658088684, -0.00015220046043395996, -0.00014499947428703308, -0.0001377984881401062, -0.00013059750199317932, -0.00012339651584625244, -0.00011619552969932556, -0.00010899454355239868, -0.0001017935574054718, -9.459257125854492e-05, -8.739158511161804e-05, -8.019059896469116e-05, -7.298961281776428e-05, -6.57886266708374e-05, -5.858764052391052e-05, -5.138665437698364e-05, -4.418566823005676e-05, -3.698468208312988e-05, -2.9783695936203003e-05, -2.2582709789276123e-05, -1.5381723642349243e-05, -8.180737495422363e-06, -9.797513484954834e-07, 6.2212347984313965e-06, 1.3422220945358276e-05, 2.0623207092285156e-05, 2.7824193239212036e-05, 3.5025179386138916e-05, 4.2226165533065796e-05, 4.9427151679992676e-05, 5.6628137826919556e-05, 6.382912397384644e-05, 7.103011012077332e-05, 7.82310962677002e-05, 8.543208241462708e-05, 9.263306856155396e-05, 9.983405470848083e-05, 0.00010703504085540771, 0.0001142360270023346, 0.00012143701314926147, 0.00012863799929618835, 0.00013583898544311523, 0.00014303997159004211, 0.000150240957736969, 0.00015744194388389587, 0.00016464293003082275, 0.00017184391617774963, 0.00017904490232467651, 0.0001862458884716034, 0.00019344687461853027, 0.00020064786076545715, 0.00020784884691238403, 0.0002150498330593109, 0.0002222508192062378, 0.00022945180535316467, 0.00023665279150009155, 0.00024385377764701843, 0.0002510547637939453]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 14.0, 23.0, 34.0, 46.0, 46.0, 68.0, 98.0, 123.0, 197.0, 267.0, 379.0, 616.0, 872.0, 1345.0, 2105.0, 3591.0, 6139.0, 10970.0, 20373.0, 39507.0, 76686.0, 140605.0, 213647.0, 216364.0, 145298.0, 79573.0, 40885.0, 21268.0, 11206.0, 6129.0, 3663.0, 2136.0, 1379.0, 905.0, 598.0, 435.0, 286.0, 173.0, 127.0, 98.0, 69.0, 56.0, 38.0, 34.0, 20.0, 15.0, 11.0, 12.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.771697998046875, -2.67620849609375, -2.580718994140625, -2.4852294921875, -2.389739990234375, -2.29425048828125, -2.198760986328125, -2.103271484375, -2.007781982421875, -1.91229248046875, -1.816802978515625, -1.7213134765625, -1.625823974609375, -1.53033447265625, -1.434844970703125, -1.33935546875, -1.243865966796875, -1.14837646484375, -1.052886962890625, -0.9573974609375, -0.861907958984375, -0.76641845703125, -0.670928955078125, -0.575439453125, -0.479949951171875, -0.38446044921875, -0.288970947265625, -0.1934814453125, -0.097991943359375, -0.00250244140625, 0.092987060546875, 0.1884765625, 0.283966064453125, 0.37945556640625, 0.474945068359375, 0.5704345703125, 0.665924072265625, 0.76141357421875, 0.856903076171875, 0.952392578125, 1.047882080078125, 1.14337158203125, 1.238861083984375, 1.3343505859375, 1.429840087890625, 1.52532958984375, 1.620819091796875, 1.71630859375, 1.811798095703125, 1.90728759765625, 2.002777099609375, 2.0982666015625, 2.193756103515625, 2.28924560546875, 2.384735107421875, 2.480224609375, 2.575714111328125, 2.67120361328125, 2.766693115234375, 2.8621826171875, 2.957672119140625, 3.05316162109375, 3.148651123046875, 3.244140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 17.0, 16.0, 25.0, 43.0, 41.0, 50.0, 74.0, 85.0, 90.0, 99.0, 94.0, 75.0, 64.0, 61.0, 45.0, 25.0, 18.0, 16.0, 8.0, 9.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8076171875, -1.753326416015625, -1.69903564453125, -1.644744873046875, -1.5904541015625, -1.536163330078125, -1.48187255859375, -1.427581787109375, -1.373291015625, -1.319000244140625, -1.26470947265625, -1.210418701171875, -1.1561279296875, -1.101837158203125, -1.04754638671875, -0.993255615234375, -0.93896484375, -0.884674072265625, -0.83038330078125, -0.776092529296875, -0.7218017578125, -0.667510986328125, -0.61322021484375, -0.558929443359375, -0.504638671875, -0.450347900390625, -0.39605712890625, -0.341766357421875, -0.2874755859375, -0.233184814453125, -0.17889404296875, -0.124603271484375, -0.0703125, -0.016021728515625, 0.03826904296875, 0.092559814453125, 0.1468505859375, 0.201141357421875, 0.25543212890625, 0.309722900390625, 0.364013671875, 0.418304443359375, 0.47259521484375, 0.526885986328125, 0.5811767578125, 0.635467529296875, 0.68975830078125, 0.744049072265625, 0.79833984375, 0.852630615234375, 0.90692138671875, 0.961212158203125, 1.0155029296875, 1.069793701171875, 1.12408447265625, 1.178375244140625, 1.232666015625, 1.286956787109375, 1.34124755859375, 1.395538330078125, 1.4498291015625, 1.504119873046875, 1.55841064453125, 1.612701416015625, 1.6669921875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 14.0, 14.0, 21.0, 27.0, 34.0, 46.0, 47.0, 60.0, 64.0, 66.0, 64.0, 76.0, 76.0, 72.0, 48.0, 38.0, 39.0, 39.0, 21.0, 20.0, 18.0, 15.0, 12.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.441328048706055, -5.262688636779785, -5.084048748016357, -4.905409336090088, -4.72676944732666, -4.548130035400391, -4.369490623474121, -4.190850734710693, -4.012210845947266, -3.833571195602417, -3.6549315452575684, -3.476292133331299, -3.297652244567871, -3.1190128326416016, -2.940373182296753, -2.7617335319519043, -2.5830941200256348, -2.404454469680786, -2.2258148193359375, -2.047175407409668, -1.8685356378555298, -1.6898959875106812, -1.511256456375122, -1.3326168060302734, -1.1539771556854248, -0.9753375053405762, -0.7966979146003723, -0.6180583238601685, -0.4394186735153198, -0.2607790231704712, -0.08213949203491211, 0.09650015830993652, 0.27513980865478516, 0.4537794291973114, 0.6324190497398376, 0.8110586404800415, 0.9896982908248901, 1.1683379411697388, 1.3469774723052979, 1.5256171226501465, 1.7042567729949951, 1.8828964233398438, 2.0615360736846924, 2.240175724029541, 2.4188151359558105, 2.5974550247192383, 2.776094436645508, 2.9547340869903564, 3.133373737335205, 3.3120133876800537, 3.4906530380249023, 3.669292449951172, 3.8479323387145996, 4.026571750640869, 4.205211639404297, 4.383851051330566, 4.562490463256836, 4.7411298751831055, 4.919769763946533, 5.098409175872803, 5.2770490646362305, 5.4556884765625, 5.6343278884887695, 5.812967777252197, 5.991607666015625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 10.0, 8.0, 15.0, 12.0, 11.0, 20.0, 23.0, 22.0, 17.0, 26.0, 35.0, 29.0, 32.0, 32.0, 40.0, 42.0, 36.0, 40.0, 39.0, 37.0, 45.0, 35.0, 53.0, 26.0, 33.0, 35.0, 27.0, 31.0, 20.0, 21.0, 23.0, 20.0, 12.0, 9.0, 10.0, 14.0, 14.0, 10.0, 3.0, 0.0, 8.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904827833175659, -2.800170660018921, -2.6955134868621826, -2.5908563137054443, -2.486199378967285, -2.381542205810547, -2.2768850326538086, -2.1722278594970703, -2.067570686340332, -1.9629135131835938, -1.8582563400268555, -1.7535992860794067, -1.6489421129226685, -1.5442849397659302, -1.4396278858184814, -1.3349707126617432, -1.2303135395050049, -1.1256563663482666, -1.0209991931915283, -0.9163421392440796, -0.8116849660873413, -0.707027792930603, -0.6023706793785095, -0.497713565826416, -0.39305639266967773, -0.28839924931526184, -0.18374210596084595, -0.07908496260643005, 0.02557218074798584, 0.13022935390472412, 0.23488646745681763, 0.33954358100891113, 0.4442005157470703, 0.5488576889038086, 0.6535148024559021, 0.7581719160079956, 0.8628290891647339, 0.9674862623214722, 1.072143316268921, 1.1768004894256592, 1.2814576625823975, 1.3861148357391357, 1.490772008895874, 1.5954290628433228, 1.700086236000061, 1.8047434091567993, 1.909400463104248, 2.0140576362609863, 2.1187148094177246, 2.223371982574463, 2.328029155731201, 2.4326863288879395, 2.5373435020446777, 2.642000675201416, 2.746657609939575, 2.8513147830963135, 2.9559719562530518, 3.06062912940979, 3.1652863025665283, 3.2699434757232666, 3.374600410461426, 3.479257583618164, 3.5839147567749023, 3.6885719299316406, 3.793229103088379]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 9.0, 6.0, 11.0, 21.0, 31.0, 40.0, 62.0, 97.0, 137.0, 206.0, 341.0, 536.0, 857.0, 1391.0, 2189.0, 3936.0, 6655.0, 11866.0, 21978.0, 42679.0, 89275.0, 207019.0, 517130.0, 1103335.0, 1172823.0, 581934.0, 230019.0, 99202.0, 46537.0, 23532.0, 12924.0, 6989.0, 4121.0, 2376.0, 1473.0, 943.0, 556.0, 351.0, 249.0, 146.0, 94.0, 69.0, 46.0, 36.0, 25.0, 12.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.3203125, -5.1490478515625, -4.977783203125, -4.8065185546875, -4.63525390625, -4.4639892578125, -4.292724609375, -4.1214599609375, -3.9501953125, -3.7789306640625, -3.607666015625, -3.4364013671875, -3.26513671875, -3.0938720703125, -2.922607421875, -2.7513427734375, -2.580078125, -2.4088134765625, -2.237548828125, -2.0662841796875, -1.89501953125, -1.7237548828125, -1.552490234375, -1.3812255859375, -1.2099609375, -1.0386962890625, -0.867431640625, -0.6961669921875, -0.52490234375, -0.3536376953125, -0.182373046875, -0.0111083984375, 0.16015625, 0.3314208984375, 0.502685546875, 0.6739501953125, 0.84521484375, 1.0164794921875, 1.187744140625, 1.3590087890625, 1.5302734375, 1.7015380859375, 1.872802734375, 2.0440673828125, 2.21533203125, 2.3865966796875, 2.557861328125, 2.7291259765625, 2.900390625, 3.0716552734375, 3.242919921875, 3.4141845703125, 3.58544921875, 3.7567138671875, 3.927978515625, 4.0992431640625, 4.2705078125, 4.4417724609375, 4.613037109375, 4.7843017578125, 4.95556640625, 5.1268310546875, 5.298095703125, 5.4693603515625, 5.640625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 11.0, 9.0, 7.0, 5.0, 14.0, 10.0, 14.0, 15.0, 16.0, 23.0, 20.0, 22.0, 24.0, 21.0, 37.0, 40.0, 40.0, 40.0, 41.0, 38.0, 30.0, 47.0, 33.0, 39.0, 37.0, 28.0, 32.0, 31.0, 36.0, 36.0, 29.0, 22.0, 20.0, 10.0, 15.0, 21.0, 8.0, 15.0, 13.0, 14.0, 7.0, 7.0, 5.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-2.22265625, -2.15447998046875, -2.0863037109375, -2.01812744140625, -1.949951171875, -1.88177490234375, -1.8135986328125, -1.74542236328125, -1.67724609375, -1.60906982421875, -1.5408935546875, -1.47271728515625, -1.404541015625, -1.33636474609375, -1.2681884765625, -1.20001220703125, -1.1318359375, -1.06365966796875, -0.9954833984375, -0.92730712890625, -0.859130859375, -0.79095458984375, -0.7227783203125, -0.65460205078125, -0.58642578125, -0.51824951171875, -0.4500732421875, -0.38189697265625, -0.313720703125, -0.24554443359375, -0.1773681640625, -0.10919189453125, -0.041015625, 0.02716064453125, 0.0953369140625, 0.16351318359375, 0.231689453125, 0.29986572265625, 0.3680419921875, 0.43621826171875, 0.50439453125, 0.57257080078125, 0.6407470703125, 0.70892333984375, 0.777099609375, 0.84527587890625, 0.9134521484375, 0.98162841796875, 1.0498046875, 1.11798095703125, 1.1861572265625, 1.25433349609375, 1.322509765625, 1.39068603515625, 1.4588623046875, 1.52703857421875, 1.59521484375, 1.66339111328125, 1.7315673828125, 1.79974365234375, 1.867919921875, 1.93609619140625, 2.0042724609375, 2.07244873046875, 2.140625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 8.0, 18.0, 20.0, 32.0, 51.0, 79.0, 128.0, 211.0, 337.0, 564.0, 1051.0, 1738.0, 3279.0, 5726.0, 10712.0, 20277.0, 39524.0, 79682.0, 166347.0, 351410.0, 713747.0, 1077336.0, 858196.0, 446810.0, 211612.0, 100617.0, 50009.0, 25007.0, 13425.0, 7092.0, 3897.0, 2150.0, 1273.0, 757.0, 438.0, 259.0, 170.0, 112.0, 60.0, 45.0, 24.0, 14.0, 11.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.734375, -4.57476806640625, -4.4151611328125, -4.25555419921875, -4.095947265625, -3.93634033203125, -3.7767333984375, -3.61712646484375, -3.45751953125, -3.29791259765625, -3.1383056640625, -2.97869873046875, -2.819091796875, -2.65948486328125, -2.4998779296875, -2.34027099609375, -2.1806640625, -2.02105712890625, -1.8614501953125, -1.70184326171875, -1.542236328125, -1.38262939453125, -1.2230224609375, -1.06341552734375, -0.90380859375, -0.74420166015625, -0.5845947265625, -0.42498779296875, -0.265380859375, -0.10577392578125, 0.0538330078125, 0.21343994140625, 0.373046875, 0.53265380859375, 0.6922607421875, 0.85186767578125, 1.011474609375, 1.17108154296875, 1.3306884765625, 1.49029541015625, 1.64990234375, 1.80950927734375, 1.9691162109375, 2.12872314453125, 2.288330078125, 2.44793701171875, 2.6075439453125, 2.76715087890625, 2.9267578125, 3.08636474609375, 3.2459716796875, 3.40557861328125, 3.565185546875, 3.72479248046875, 3.8843994140625, 4.04400634765625, 4.20361328125, 4.36322021484375, 4.5228271484375, 4.68243408203125, 4.842041015625, 5.00164794921875, 5.1612548828125, 5.32086181640625, 5.48046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 1.0, 4.0, 9.0, 12.0, 14.0, 18.0, 24.0, 38.0, 33.0, 37.0, 61.0, 63.0, 70.0, 79.0, 109.0, 173.0, 156.0, 162.0, 196.0, 217.0, 241.0, 272.0, 247.0, 247.0, 236.0, 214.0, 155.0, 180.0, 138.0, 109.0, 117.0, 91.0, 75.0, 70.0, 49.0, 34.0, 25.0, 28.0, 23.0, 11.0, 9.0, 5.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2294921875, -1.189666748046875, -1.14984130859375, -1.110015869140625, -1.0701904296875, -1.030364990234375, -0.99053955078125, -0.950714111328125, -0.910888671875, -0.871063232421875, -0.83123779296875, -0.791412353515625, -0.7515869140625, -0.711761474609375, -0.67193603515625, -0.632110595703125, -0.59228515625, -0.552459716796875, -0.51263427734375, -0.472808837890625, -0.4329833984375, -0.393157958984375, -0.35333251953125, -0.313507080078125, -0.273681640625, -0.233856201171875, -0.19403076171875, -0.154205322265625, -0.1143798828125, -0.074554443359375, -0.03472900390625, 0.005096435546875, 0.044921875, 0.084747314453125, 0.12457275390625, 0.164398193359375, 0.2042236328125, 0.244049072265625, 0.28387451171875, 0.323699951171875, 0.363525390625, 0.403350830078125, 0.44317626953125, 0.483001708984375, 0.5228271484375, 0.562652587890625, 0.60247802734375, 0.642303466796875, 0.68212890625, 0.721954345703125, 0.76177978515625, 0.801605224609375, 0.8414306640625, 0.881256103515625, 0.92108154296875, 0.960906982421875, 1.000732421875, 1.040557861328125, 1.08038330078125, 1.120208740234375, 1.1600341796875, 1.199859619140625, 1.23968505859375, 1.279510498046875, 1.3193359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 11.0, 3.0, 7.0, 9.0, 13.0, 20.0, 10.0, 20.0, 25.0, 37.0, 51.0, 57.0, 63.0, 54.0, 68.0, 65.0, 71.0, 57.0, 64.0, 60.0, 51.0, 33.0, 37.0, 24.0, 23.0, 16.0, 13.0, 7.0, 14.0, 5.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.061370372772217, -4.901939868927002, -4.742508888244629, -4.583078384399414, -4.423647880554199, -4.264216899871826, -4.104786396026611, -3.9453556537628174, -3.7859249114990234, -3.6264941692352295, -3.4670634269714355, -3.3076329231262207, -3.1482021808624268, -2.988771438598633, -2.829340934753418, -2.669910192489624, -2.51047945022583, -2.351048707962036, -2.191617965698242, -2.0321874618530273, -1.8727567195892334, -1.7133259773254395, -1.553895354270935, -1.3944647312164307, -1.2350339889526367, -1.0756032466888428, -0.9161726236343384, -0.7567419409751892, -0.59731125831604, -0.43788057565689087, -0.2784498929977417, -0.1190192699432373, 0.040411949157714844, 0.199842631816864, 0.3592733144760132, 0.5187039971351624, 0.6781346797943115, 0.8375653624534607, 0.9969960451126099, 1.1564266681671143, 1.3158574104309082, 1.4752881526947021, 1.6347187757492065, 1.794149398803711, 1.9535801410675049, 2.113010883331299, 2.2724413871765137, 2.4318721294403076, 2.5913028717041016, 2.7507336139678955, 2.9101643562316895, 3.0695948600769043, 3.2290256023406982, 3.388456344604492, 3.547886848449707, 3.707317590713501, 3.866748332977295, 4.02617883682251, 4.185609817504883, 4.345040321350098, 4.5044708251953125, 4.6639018058776855, 4.8233323097229, 4.982763290405273, 5.142193794250488]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 3.0, 7.0, 10.0, 7.0, 9.0, 12.0, 10.0, 16.0, 16.0, 26.0, 21.0, 22.0, 37.0, 30.0, 38.0, 39.0, 40.0, 37.0, 42.0, 53.0, 47.0, 44.0, 35.0, 43.0, 34.0, 36.0, 27.0, 25.0, 29.0, 24.0, 29.0, 31.0, 18.0, 23.0, 10.0, 11.0, 12.0, 11.0, 5.0, 10.0, 6.0, 1.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.797964096069336, -2.7095541954040527, -2.6211440563201904, -2.5327341556549072, -2.444324254989624, -2.3559141159057617, -2.2675042152404785, -2.1790943145751953, -2.090684413909912, -2.002274513244629, -1.9138644933700562, -1.8254544734954834, -1.7370445728302002, -1.6486345529556274, -1.5602245330810547, -1.4718146324157715, -1.3834044933319092, -1.2949944734573364, -1.2065845727920532, -1.1181745529174805, -1.0297646522521973, -0.9413546323776245, -0.8529446125030518, -0.7645346522331238, -0.6761246919631958, -0.5877147316932678, -0.49930474162101746, -0.4108947515487671, -0.3224847912788391, -0.23407483100891113, -0.14566481113433838, -0.0572548508644104, 0.031154870986938477, 0.11956484615802765, 0.20797482132911682, 0.2963848114013672, 0.38479477167129517, 0.47320473194122314, 0.5616147518157959, 0.6500247120857239, 0.7384346723556519, 0.8268446326255798, 0.9152545928955078, 1.0036646127700806, 1.0920746326446533, 1.1804845333099365, 1.2688945531845093, 1.357304573059082, 1.4457144737243652, 1.534124493598938, 1.6225343942642212, 1.710944414138794, 1.7993543148040771, 1.88776433467865, 1.9761743545532227, 2.064584255218506, 2.152994155883789, 2.2414040565490723, 2.3298141956329346, 2.4182240962982178, 2.506633996963501, 2.5950441360473633, 2.6834540367126465, 2.7718639373779297, 2.860274076461792]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 6.0, 15.0, 10.0, 24.0, 33.0, 40.0, 66.0, 110.0, 115.0, 186.0, 304.0, 402.0, 661.0, 1115.0, 1875.0, 3256.0, 5748.0, 10559.0, 19136.0, 36249.0, 67235.0, 120252.0, 187913.0, 214364.0, 164789.0, 97413.0, 53224.0, 28442.0, 15235.0, 8216.0, 4639.0, 2619.0, 1650.0, 906.0, 567.0, 341.0, 240.0, 169.0, 126.0, 68.0, 71.0, 50.0, 26.0, 19.0, 12.0, 15.0, 7.0, 5.0, 2.0, 10.0, 5.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.52783203125, -0.5114974975585938, -0.4951629638671875, -0.47882843017578125, -0.462493896484375, -0.44615936279296875, -0.4298248291015625, -0.41349029541015625, -0.39715576171875, -0.38082122802734375, -0.3644866943359375, -0.34815216064453125, -0.331817626953125, -0.31548309326171875, -0.2991485595703125, -0.28281402587890625, -0.2664794921875, -0.25014495849609375, -0.2338104248046875, -0.21747589111328125, -0.201141357421875, -0.18480682373046875, -0.1684722900390625, -0.15213775634765625, -0.13580322265625, -0.11946868896484375, -0.1031341552734375, -0.08679962158203125, -0.070465087890625, -0.05413055419921875, -0.0377960205078125, -0.02146148681640625, -0.005126953125, 0.01120758056640625, 0.0275421142578125, 0.04387664794921875, 0.060211181640625, 0.07654571533203125, 0.0928802490234375, 0.10921478271484375, 0.12554931640625, 0.14188385009765625, 0.1582183837890625, 0.17455291748046875, 0.190887451171875, 0.20722198486328125, 0.2235565185546875, 0.23989105224609375, 0.2562255859375, 0.27256011962890625, 0.2888946533203125, 0.30522918701171875, 0.321563720703125, 0.33789825439453125, 0.3542327880859375, 0.37056732177734375, 0.38690185546875, 0.40323638916015625, 0.4195709228515625, 0.43590545654296875, 0.452239990234375, 0.46857452392578125, 0.4849090576171875, 0.5012435913085938, 0.517578125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 9.0, 9.0, 11.0, 16.0, 13.0, 15.0, 23.0, 23.0, 30.0, 21.0, 35.0, 40.0, 39.0, 41.0, 36.0, 45.0, 54.0, 54.0, 36.0, 42.0, 40.0, 50.0, 29.0, 43.0, 29.0, 39.0, 27.0, 23.0, 16.0, 15.0, 17.0, 16.0, 9.0, 12.0, 11.0, 4.0, 6.0, 5.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.9840087890625, -2.880126953125, -2.7762451171875, -2.67236328125, -2.5684814453125, -2.464599609375, -2.3607177734375, -2.2568359375, -2.1529541015625, -2.049072265625, -1.9451904296875, -1.84130859375, -1.7374267578125, -1.633544921875, -1.5296630859375, -1.42578125, -1.3218994140625, -1.218017578125, -1.1141357421875, -1.01025390625, -0.9063720703125, -0.802490234375, -0.6986083984375, -0.5947265625, -0.4908447265625, -0.386962890625, -0.2830810546875, -0.17919921875, -0.0753173828125, 0.028564453125, 0.1324462890625, 0.236328125, 0.3402099609375, 0.444091796875, 0.5479736328125, 0.65185546875, 0.7557373046875, 0.859619140625, 0.9635009765625, 1.0673828125, 1.1712646484375, 1.275146484375, 1.3790283203125, 1.48291015625, 1.5867919921875, 1.690673828125, 1.7945556640625, 1.8984375, 2.0023193359375, 2.106201171875, 2.2100830078125, 2.31396484375, 2.4178466796875, 2.521728515625, 2.6256103515625, 2.7294921875, 2.8333740234375, 2.937255859375, 3.0411376953125, 3.14501953125, 3.2489013671875, 3.352783203125, 3.4566650390625, 3.560546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 12.0, 16.0, 24.0, 16.0, 28.0, 40.0, 43.0, 54.0, 82.0, 113.0, 166.0, 216.0, 278.0, 469.0, 607.0, 1061.0, 1622.0, 2751.0, 5235.0, 10357.0, 24288.0, 158943.0, 773983.0, 37615.0, 14354.0, 6792.0, 3570.0, 1983.0, 1236.0, 792.0, 518.0, 362.0, 243.0, 185.0, 115.0, 79.0, 61.0, 58.0, 44.0, 31.0, 23.0, 19.0, 8.0, 9.0, 7.0, 7.0, 14.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.6416015625, -1.5921478271484375, -1.542694091796875, -1.4932403564453125, -1.44378662109375, -1.3943328857421875, -1.344879150390625, -1.2954254150390625, -1.2459716796875, -1.1965179443359375, -1.147064208984375, -1.0976104736328125, -1.04815673828125, -0.9987030029296875, -0.949249267578125, -0.8997955322265625, -0.850341796875, -0.8008880615234375, -0.751434326171875, -0.7019805908203125, -0.65252685546875, -0.6030731201171875, -0.553619384765625, -0.5041656494140625, -0.4547119140625, -0.4052581787109375, -0.355804443359375, -0.3063507080078125, -0.25689697265625, -0.2074432373046875, -0.157989501953125, -0.1085357666015625, -0.05908203125, -0.0096282958984375, 0.039825439453125, 0.0892791748046875, 0.13873291015625, 0.1881866455078125, 0.237640380859375, 0.2870941162109375, 0.3365478515625, 0.3860015869140625, 0.435455322265625, 0.4849090576171875, 0.53436279296875, 0.5838165283203125, 0.633270263671875, 0.6827239990234375, 0.732177734375, 0.7816314697265625, 0.831085205078125, 0.8805389404296875, 0.92999267578125, 0.9794464111328125, 1.028900146484375, 1.0783538818359375, 1.1278076171875, 1.1772613525390625, 1.226715087890625, 1.2761688232421875, 1.32562255859375, 1.3750762939453125, 1.424530029296875, 1.4739837646484375, 1.5234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 4.0, 8.0, 7.0, 13.0, 9.0, 14.0, 16.0, 18.0, 15.0, 22.0, 23.0, 28.0, 25.0, 34.0, 27.0, 46.0, 30.0, 40.0, 38.0, 39.0, 38.0, 48.0, 40.0, 37.0, 38.0, 32.0, 36.0, 32.0, 30.0, 26.0, 13.0, 20.0, 18.0, 18.0, 19.0, 14.0, 16.0, 9.0, 10.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.541015625, -2.46380615234375, -2.3865966796875, -2.30938720703125, -2.232177734375, -2.15496826171875, -2.0777587890625, -2.00054931640625, -1.92333984375, -1.84613037109375, -1.7689208984375, -1.69171142578125, -1.614501953125, -1.53729248046875, -1.4600830078125, -1.38287353515625, -1.3056640625, -1.22845458984375, -1.1512451171875, -1.07403564453125, -0.996826171875, -0.91961669921875, -0.8424072265625, -0.76519775390625, -0.68798828125, -0.61077880859375, -0.5335693359375, -0.45635986328125, -0.379150390625, -0.30194091796875, -0.2247314453125, -0.14752197265625, -0.0703125, 0.00689697265625, 0.0841064453125, 0.16131591796875, 0.238525390625, 0.31573486328125, 0.3929443359375, 0.47015380859375, 0.54736328125, 0.62457275390625, 0.7017822265625, 0.77899169921875, 0.856201171875, 0.93341064453125, 1.0106201171875, 1.08782958984375, 1.1650390625, 1.24224853515625, 1.3194580078125, 1.39666748046875, 1.473876953125, 1.55108642578125, 1.6282958984375, 1.70550537109375, 1.78271484375, 1.85992431640625, 1.9371337890625, 2.01434326171875, 2.091552734375, 2.16876220703125, 2.2459716796875, 2.32318115234375, 2.400390625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 6.0, 10.0, 15.0, 29.0, 36.0, 71.0, 71.0, 116.0, 200.0, 273.0, 450.0, 724.0, 1085.0, 1743.0, 2834.0, 4658.0, 8174.0, 15437.0, 37109.0, 874691.0, 57488.0, 19200.0, 9753.0, 5526.0, 3318.0, 1974.0, 1226.0, 804.0, 519.0, 318.0, 235.0, 150.0, 83.0, 66.0, 54.0, 29.0, 22.0, 19.0, 15.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51123046875, -0.49204254150390625, -0.4728546142578125, -0.45366668701171875, -0.434478759765625, -0.41529083251953125, -0.3961029052734375, -0.37691497802734375, -0.35772705078125, -0.33853912353515625, -0.3193511962890625, -0.30016326904296875, -0.280975341796875, -0.26178741455078125, -0.2425994873046875, -0.22341156005859375, -0.2042236328125, -0.18503570556640625, -0.1658477783203125, -0.14665985107421875, -0.127471923828125, -0.10828399658203125, -0.0890960693359375, -0.06990814208984375, -0.05072021484375, -0.03153228759765625, -0.0123443603515625, 0.00684356689453125, 0.026031494140625, 0.04521942138671875, 0.0644073486328125, 0.08359527587890625, 0.102783203125, 0.12197113037109375, 0.1411590576171875, 0.16034698486328125, 0.179534912109375, 0.19872283935546875, 0.2179107666015625, 0.23709869384765625, 0.25628662109375, 0.27547454833984375, 0.2946624755859375, 0.31385040283203125, 0.333038330078125, 0.35222625732421875, 0.3714141845703125, 0.39060211181640625, 0.4097900390625, 0.42897796630859375, 0.4481658935546875, 0.46735382080078125, 0.486541748046875, 0.5057296752929688, 0.5249176025390625, 0.5441055297851562, 0.56329345703125, 0.5824813842773438, 0.6016693115234375, 0.6208572387695312, 0.640045166015625, 0.6592330932617188, 0.6784210205078125, 0.6976089477539062, 0.716796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 13.0, 18.0, 20.0, 17.0, 15.0, 25.0, 30.0, 30.0, 49.0, 31.0, 38.0, 36.0, 39.0, 35.0, 59.0, 30.0, 45.0, 33.0, 38.0, 38.0, 34.0, 39.0, 29.0, 33.0, 20.0, 34.0, 22.0, 15.0, 16.0, 11.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.2782554626464844e-05, -3.183819353580475e-05, -3.089383244514465e-05, -2.9949471354484558e-05, -2.9005110263824463e-05, -2.8060749173164368e-05, -2.7116388082504272e-05, -2.6172026991844177e-05, -2.5227665901184082e-05, -2.4283304810523987e-05, -2.333894371986389e-05, -2.2394582629203796e-05, -2.14502215385437e-05, -2.0505860447883606e-05, -1.956149935722351e-05, -1.8617138266563416e-05, -1.767277717590332e-05, -1.6728416085243225e-05, -1.578405499458313e-05, -1.4839693903923035e-05, -1.389533281326294e-05, -1.2950971722602844e-05, -1.2006610631942749e-05, -1.1062249541282654e-05, -1.0117888450622559e-05, -9.173527359962463e-06, -8.229166269302368e-06, -7.284805178642273e-06, -6.340444087982178e-06, -5.3960829973220825e-06, -4.451721906661987e-06, -3.507360816001892e-06, -2.562999725341797e-06, -1.6186386346817017e-06, -6.742775440216064e-07, 2.7008354663848877e-07, 1.214444637298584e-06, 2.158805727958679e-06, 3.1031668186187744e-06, 4.04752790927887e-06, 4.991888999938965e-06, 5.93625009059906e-06, 6.880611181259155e-06, 7.82497227191925e-06, 8.769333362579346e-06, 9.713694453239441e-06, 1.0658055543899536e-05, 1.1602416634559631e-05, 1.2546777725219727e-05, 1.3491138815879822e-05, 1.4435499906539917e-05, 1.5379860997200012e-05, 1.6324222087860107e-05, 1.7268583178520203e-05, 1.8212944269180298e-05, 1.9157305359840393e-05, 2.0101666450500488e-05, 2.1046027541160583e-05, 2.199038863182068e-05, 2.2934749722480774e-05, 2.387911081314087e-05, 2.4823471903800964e-05, 2.576783299446106e-05, 2.6712194085121155e-05, 2.765655517578125e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 7.0, 10.0, 19.0, 19.0, 24.0, 28.0, 48.0, 75.0, 106.0, 141.0, 210.0, 332.0, 486.0, 677.0, 1165.0, 1786.0, 2986.0, 5145.0, 9292.0, 17908.0, 36776.0, 80510.0, 183817.0, 312423.0, 211974.0, 94592.0, 42331.0, 20490.0, 10426.0, 5775.0, 3292.0, 2000.0, 1243.0, 827.0, 511.0, 347.0, 235.0, 158.0, 102.0, 77.0, 48.0, 39.0, 24.0, 21.0, 10.0, 12.0, 7.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2139892578125, -0.20699501037597656, -0.20000076293945312, -0.1930065155029297, -0.18601226806640625, -0.1790180206298828, -0.17202377319335938, -0.16502952575683594, -0.1580352783203125, -0.15104103088378906, -0.14404678344726562, -0.1370525360107422, -0.13005828857421875, -0.12306404113769531, -0.11606979370117188, -0.10907554626464844, -0.102081298828125, -0.09508705139160156, -0.08809280395507812, -0.08109855651855469, -0.07410430908203125, -0.06711006164550781, -0.060115814208984375, -0.05312156677246094, -0.0461273193359375, -0.03913307189941406, -0.032138824462890625, -0.025144577026367188, -0.01815032958984375, -0.011156082153320312, -0.004161834716796875, 0.0028324127197265625, 0.00982666015625, 0.016820907592773438, 0.023815155029296875, 0.030809402465820312, 0.03780364990234375, 0.04479789733886719, 0.051792144775390625, 0.05878639221191406, 0.0657806396484375, 0.07277488708496094, 0.07976913452148438, 0.08676338195800781, 0.09375762939453125, 0.10075187683105469, 0.10774612426757812, 0.11474037170410156, 0.121734619140625, 0.12872886657714844, 0.13572311401367188, 0.1427173614501953, 0.14971160888671875, 0.1567058563232422, 0.16370010375976562, 0.17069435119628906, 0.1776885986328125, 0.18468284606933594, 0.19167709350585938, 0.1986713409423828, 0.20566558837890625, 0.2126598358154297, 0.21965408325195312, 0.22664833068847656, 0.233642578125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 10.0, 12.0, 12.0, 13.0, 22.0, 21.0, 30.0, 49.0, 43.0, 61.0, 85.0, 81.0, 93.0, 85.0, 70.0, 62.0, 47.0, 36.0, 15.0, 17.0, 20.0, 22.0, 12.0, 11.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1292724609375, -0.12485885620117188, -0.12044525146484375, -0.11603164672851562, -0.1116180419921875, -0.10720443725585938, -0.10279083251953125, -0.09837722778320312, -0.093963623046875, -0.08955001831054688, -0.08513641357421875, -0.08072280883789062, -0.0763092041015625, -0.07189559936523438, -0.06748199462890625, -0.06306838989257812, -0.05865478515625, -0.054241180419921875, -0.04982757568359375, -0.045413970947265625, -0.0410003662109375, -0.036586761474609375, -0.03217315673828125, -0.027759552001953125, -0.023345947265625, -0.018932342529296875, -0.01451873779296875, -0.010105133056640625, -0.0056915283203125, -0.001277923583984375, 0.00313568115234375, 0.007549285888671875, 0.011962890625, 0.016376495361328125, 0.02079010009765625, 0.025203704833984375, 0.0296173095703125, 0.034030914306640625, 0.03844451904296875, 0.042858123779296875, 0.047271728515625, 0.051685333251953125, 0.05609893798828125, 0.060512542724609375, 0.0649261474609375, 0.06933975219726562, 0.07375335693359375, 0.07816696166992188, 0.08258056640625, 0.08699417114257812, 0.09140777587890625, 0.09582138061523438, 0.1002349853515625, 0.10464859008789062, 0.10906219482421875, 0.11347579956054688, 0.117889404296875, 0.12230300903320312, 0.12671661376953125, 0.13113021850585938, 0.1355438232421875, 0.13995742797851562, 0.14437103271484375, 0.14878463745117188, 0.1531982421875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 11.0, 5.0, 7.0, 7.0, 11.0, 14.0, 19.0, 11.0, 22.0, 31.0, 49.0, 42.0, 59.0, 67.0, 62.0, 58.0, 65.0, 70.0, 48.0, 68.0, 67.0, 36.0, 42.0, 27.0, 25.0, 17.0, 16.0, 14.0, 5.0, 13.0, 6.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.942590713500977, -4.7854461669921875, -4.628301620483398, -4.471157073974609, -4.31401252746582, -4.156867980957031, -3.9997236728668213, -3.8425791263580322, -3.685434579849243, -3.528290033340454, -3.371145486831665, -3.214000940322876, -3.056856632232666, -2.899712085723877, -2.742567539215088, -2.585422992706299, -2.4282784461975098, -2.2711338996887207, -2.1139893531799316, -1.9568449258804321, -1.799700379371643, -1.642555832862854, -1.4854114055633545, -1.3282668590545654, -1.1711223125457764, -1.0139777660369873, -0.856833279132843, -0.6996887922286987, -0.5425442457199097, -0.3853996992111206, -0.22825521230697632, -0.07111072540283203, 0.08603382110595703, 0.2431783378124237, 0.4003228545188904, 0.5574673414230347, 0.7146118879318237, 0.8717564344406128, 1.0289008617401123, 1.1860454082489014, 1.3431899547576904, 1.5003345012664795, 1.6574790477752686, 1.814623475074768, 1.9717680215835571, 2.1289124488830566, 2.2860569953918457, 2.4432015419006348, 2.600346088409424, 2.757490634918213, 2.914635181427002, 3.071779727935791, 3.22892427444458, 3.386068820953369, 3.543213129043579, 3.700357675552368, 3.8575022220611572, 4.014646530151367, 4.171791076660156, 4.328935623168945, 4.486080169677734, 4.643224716186523, 4.8003692626953125, 4.957513809204102, 5.114658355712891]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 5.0, 10.0, 11.0, 12.0, 15.0, 16.0, 15.0, 26.0, 20.0, 36.0, 29.0, 35.0, 40.0, 39.0, 38.0, 36.0, 54.0, 47.0, 48.0, 40.0, 40.0, 39.0, 29.0, 35.0, 20.0, 35.0, 29.0, 19.0, 29.0, 27.0, 18.0, 15.0, 14.0, 10.0, 13.0, 7.0, 6.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.8237361907958984, -2.7358651161193848, -2.647994041442871, -2.5601229667663574, -2.4722518920898438, -2.38438081741333, -2.2965097427368164, -2.2086386680603027, -2.120767593383789, -2.0328965187072754, -1.9450254440307617, -1.857154369354248, -1.7692832946777344, -1.6814122200012207, -1.5935412645339966, -1.505670189857483, -1.4177992343902588, -1.3299281597137451, -1.2420570850372314, -1.1541860103607178, -1.066314935684204, -0.9784439206123352, -0.8905729055404663, -0.8027018308639526, -0.714830756187439, -0.6269596815109253, -0.5390886068344116, -0.4512175917625427, -0.36334651708602905, -0.2754754424095154, -0.18760442733764648, -0.09973335266113281, -0.01186227798461914, 0.07600878179073334, 0.16387984156608582, 0.2517508864402771, 0.33962196111679077, 0.42749303579330444, 0.5153640508651733, 0.603235125541687, 0.6911062002182007, 0.7789772748947144, 0.866848349571228, 0.9547193646430969, 1.0425903797149658, 1.1304614543914795, 1.2183325290679932, 1.3062036037445068, 1.3940746784210205, 1.4819457530975342, 1.5698168277740479, 1.6576879024505615, 1.7455589771270752, 1.8334300518035889, 1.921301007270813, 2.009171962738037, 2.097043037414551, 2.1849141120910645, 2.272785186767578, 2.360656261444092, 2.4485273361206055, 2.536398410797119, 2.624269485473633, 2.7121405601501465, 2.80001163482666]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 12.0, 9.0, 18.0, 24.0, 38.0, 63.0, 97.0, 143.0, 210.0, 364.0, 531.0, 918.0, 1490.0, 2654.0, 4234.0, 6735.0, 11581.0, 18956.0, 31577.0, 50646.0, 79152.0, 113377.0, 144064.0, 155466.0, 137245.0, 103328.0, 70792.0, 44876.0, 27707.0, 16633.0, 10027.0, 5943.0, 3745.0, 2294.0, 1372.0, 815.0, 498.0, 334.0, 206.0, 124.0, 83.0, 66.0, 27.0, 34.0, 11.0, 8.0, 5.0, 2.0, 9.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-3.341796875, -3.238555908203125, -3.13531494140625, -3.032073974609375, -2.9288330078125, -2.825592041015625, -2.72235107421875, -2.619110107421875, -2.515869140625, -2.412628173828125, -2.30938720703125, -2.206146240234375, -2.1029052734375, -1.999664306640625, -1.89642333984375, -1.793182373046875, -1.68994140625, -1.586700439453125, -1.48345947265625, -1.380218505859375, -1.2769775390625, -1.173736572265625, -1.07049560546875, -0.967254638671875, -0.864013671875, -0.760772705078125, -0.65753173828125, -0.554290771484375, -0.4510498046875, -0.347808837890625, -0.24456787109375, -0.141326904296875, -0.0380859375, 0.065155029296875, 0.16839599609375, 0.271636962890625, 0.3748779296875, 0.478118896484375, 0.58135986328125, 0.684600830078125, 0.787841796875, 0.891082763671875, 0.99432373046875, 1.097564697265625, 1.2008056640625, 1.304046630859375, 1.40728759765625, 1.510528564453125, 1.61376953125, 1.717010498046875, 1.82025146484375, 1.923492431640625, 2.0267333984375, 2.129974365234375, 2.23321533203125, 2.336456298828125, 2.439697265625, 2.542938232421875, 2.64617919921875, 2.749420166015625, 2.8526611328125, 2.955902099609375, 3.05914306640625, 3.162384033203125, 3.265625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 7.0, 13.0, 13.0, 13.0, 15.0, 21.0, 25.0, 23.0, 23.0, 40.0, 28.0, 31.0, 35.0, 33.0, 32.0, 43.0, 47.0, 51.0, 41.0, 29.0, 37.0, 24.0, 31.0, 35.0, 44.0, 29.0, 29.0, 26.0, 23.0, 19.0, 23.0, 15.0, 12.0, 14.0, 7.0, 12.0, 7.0, 8.0, 4.0, 3.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.543731689453125, -2.45269775390625, -2.361663818359375, -2.2706298828125, -2.179595947265625, -2.08856201171875, -1.997528076171875, -1.906494140625, -1.815460205078125, -1.72442626953125, -1.633392333984375, -1.5423583984375, -1.451324462890625, -1.36029052734375, -1.269256591796875, -1.17822265625, -1.087188720703125, -0.99615478515625, -0.905120849609375, -0.8140869140625, -0.723052978515625, -0.63201904296875, -0.540985107421875, -0.449951171875, -0.358917236328125, -0.26788330078125, -0.176849365234375, -0.0858154296875, 0.005218505859375, 0.09625244140625, 0.187286376953125, 0.2783203125, 0.369354248046875, 0.46038818359375, 0.551422119140625, 0.6424560546875, 0.733489990234375, 0.82452392578125, 0.915557861328125, 1.006591796875, 1.097625732421875, 1.18865966796875, 1.279693603515625, 1.3707275390625, 1.461761474609375, 1.55279541015625, 1.643829345703125, 1.73486328125, 1.825897216796875, 1.91693115234375, 2.007965087890625, 2.0989990234375, 2.190032958984375, 2.28106689453125, 2.372100830078125, 2.463134765625, 2.554168701171875, 2.64520263671875, 2.736236572265625, 2.8272705078125, 2.918304443359375, 3.00933837890625, 3.100372314453125, 3.19140625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 16.0, 19.0, 24.0, 40.0, 67.0, 96.0, 128.0, 195.0, 328.0, 466.0, 806.0, 1352.0, 2200.0, 3675.0, 6014.0, 10167.0, 17248.0, 28438.0, 46243.0, 73195.0, 108372.0, 142850.0, 158204.0, 143943.0, 109824.0, 74986.0, 47144.0, 29193.0, 17271.0, 10243.0, 6267.0, 3635.0, 2197.0, 1341.0, 858.0, 545.0, 355.0, 197.0, 140.0, 95.0, 58.0, 39.0, 23.0, 18.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-3.42578125, -3.323577880859375, -3.22137451171875, -3.119171142578125, -3.0169677734375, -2.914764404296875, -2.81256103515625, -2.710357666015625, -2.608154296875, -2.505950927734375, -2.40374755859375, -2.301544189453125, -2.1993408203125, -2.097137451171875, -1.99493408203125, -1.892730712890625, -1.79052734375, -1.688323974609375, -1.58612060546875, -1.483917236328125, -1.3817138671875, -1.279510498046875, -1.17730712890625, -1.075103759765625, -0.972900390625, -0.870697021484375, -0.76849365234375, -0.666290283203125, -0.5640869140625, -0.461883544921875, -0.35968017578125, -0.257476806640625, -0.1552734375, -0.053070068359375, 0.04913330078125, 0.151336669921875, 0.2535400390625, 0.355743408203125, 0.45794677734375, 0.560150146484375, 0.662353515625, 0.764556884765625, 0.86676025390625, 0.968963623046875, 1.0711669921875, 1.173370361328125, 1.27557373046875, 1.377777099609375, 1.47998046875, 1.582183837890625, 1.68438720703125, 1.786590576171875, 1.8887939453125, 1.990997314453125, 2.09320068359375, 2.195404052734375, 2.297607421875, 2.399810791015625, 2.50201416015625, 2.604217529296875, 2.7064208984375, 2.808624267578125, 2.91082763671875, 3.013031005859375, 3.115234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 14.0, 8.0, 4.0, 9.0, 16.0, 7.0, 13.0, 10.0, 23.0, 17.0, 29.0, 31.0, 39.0, 36.0, 29.0, 37.0, 43.0, 35.0, 40.0, 40.0, 40.0, 45.0, 51.0, 39.0, 32.0, 40.0, 33.0, 36.0, 32.0, 22.0, 29.0, 15.0, 27.0, 15.0, 17.0, 13.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.98492431640625, -1.9210205078125, -1.85711669921875, -1.793212890625, -1.72930908203125, -1.6654052734375, -1.60150146484375, -1.53759765625, -1.47369384765625, -1.4097900390625, -1.34588623046875, -1.281982421875, -1.21807861328125, -1.1541748046875, -1.09027099609375, -1.0263671875, -0.96246337890625, -0.8985595703125, -0.83465576171875, -0.770751953125, -0.70684814453125, -0.6429443359375, -0.57904052734375, -0.51513671875, -0.45123291015625, -0.3873291015625, -0.32342529296875, -0.259521484375, -0.19561767578125, -0.1317138671875, -0.06781005859375, -0.00390625, 0.05999755859375, 0.1239013671875, 0.18780517578125, 0.251708984375, 0.31561279296875, 0.3795166015625, 0.44342041015625, 0.50732421875, 0.57122802734375, 0.6351318359375, 0.69903564453125, 0.762939453125, 0.82684326171875, 0.8907470703125, 0.95465087890625, 1.0185546875, 1.08245849609375, 1.1463623046875, 1.21026611328125, 1.274169921875, 1.33807373046875, 1.4019775390625, 1.46588134765625, 1.52978515625, 1.59368896484375, 1.6575927734375, 1.72149658203125, 1.785400390625, 1.84930419921875, 1.9132080078125, 1.97711181640625, 2.041015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 10.0, 19.0, 22.0, 38.0, 55.0, 109.0, 140.0, 223.0, 351.0, 556.0, 938.0, 1460.0, 2576.0, 4235.0, 7382.0, 12941.0, 22366.0, 39416.0, 68510.0, 111793.0, 161641.0, 185020.0, 159659.0, 110126.0, 67156.0, 39376.0, 22187.0, 12566.0, 7168.0, 4202.0, 2453.0, 1448.0, 899.0, 537.0, 346.0, 236.0, 129.0, 100.0, 52.0, 30.0, 20.0, 18.0, 9.0, 12.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.099609375, -2.03497314453125, -1.9703369140625, -1.90570068359375, -1.841064453125, -1.77642822265625, -1.7117919921875, -1.64715576171875, -1.58251953125, -1.51788330078125, -1.4532470703125, -1.38861083984375, -1.323974609375, -1.25933837890625, -1.1947021484375, -1.13006591796875, -1.0654296875, -1.00079345703125, -0.9361572265625, -0.87152099609375, -0.806884765625, -0.74224853515625, -0.6776123046875, -0.61297607421875, -0.54833984375, -0.48370361328125, -0.4190673828125, -0.35443115234375, -0.289794921875, -0.22515869140625, -0.1605224609375, -0.09588623046875, -0.03125, 0.03338623046875, 0.0980224609375, 0.16265869140625, 0.227294921875, 0.29193115234375, 0.3565673828125, 0.42120361328125, 0.48583984375, 0.55047607421875, 0.6151123046875, 0.67974853515625, 0.744384765625, 0.80902099609375, 0.8736572265625, 0.93829345703125, 1.0029296875, 1.06756591796875, 1.1322021484375, 1.19683837890625, 1.261474609375, 1.32611083984375, 1.3907470703125, 1.45538330078125, 1.52001953125, 1.58465576171875, 1.6492919921875, 1.71392822265625, 1.778564453125, 1.84320068359375, 1.9078369140625, 1.97247314453125, 2.037109375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 14.0, 15.0, 17.0, 16.0, 15.0, 24.0, 38.0, 23.0, 32.0, 42.0, 50.0, 48.0, 54.0, 68.0, 74.0, 49.0, 61.0, 44.0, 43.0, 40.0, 42.0, 24.0, 19.0, 27.0, 20.0, 20.0, 13.0, 10.0, 6.0, 6.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00019216537475585938, -0.0001864079385995865, -0.0001806505024433136, -0.0001748930662870407, -0.00016913563013076782, -0.00016337819397449493, -0.00015762075781822205, -0.00015186332166194916, -0.00014610588550567627, -0.00014034844934940338, -0.0001345910131931305, -0.0001288335770368576, -0.00012307614088058472, -0.00011731870472431183, -0.00011156126856803894, -0.00010580383241176605, -0.00010004639625549316, -9.428896009922028e-05, -8.853152394294739e-05, -8.27740877866745e-05, -7.701665163040161e-05, -7.125921547412872e-05, -6.550177931785583e-05, -5.974434316158295e-05, -5.398690700531006e-05, -4.822947084903717e-05, -4.247203469276428e-05, -3.6714598536491394e-05, -3.0957162380218506e-05, -2.5199726223945618e-05, -1.944229006767273e-05, -1.3684853911399841e-05, -7.927417755126953e-06, -2.169981598854065e-06, 3.5874545574188232e-06, 9.344890713691711e-06, 1.51023268699646e-05, 2.0859763026237488e-05, 2.6617199182510376e-05, 3.2374635338783264e-05, 3.813207149505615e-05, 4.388950765132904e-05, 4.964694380760193e-05, 5.540437996387482e-05, 6.11618161201477e-05, 6.69192522764206e-05, 7.267668843269348e-05, 7.843412458896637e-05, 8.419156074523926e-05, 8.994899690151215e-05, 9.570643305778503e-05, 0.00010146386921405792, 0.00010722130537033081, 0.0001129787415266037, 0.00011873617768287659, 0.00012449361383914948, 0.00013025104999542236, 0.00013600848615169525, 0.00014176592230796814, 0.00014752335846424103, 0.00015328079462051392, 0.0001590382307767868, 0.0001647956669330597, 0.00017055310308933258, 0.00017631053924560547]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 12.0, 11.0, 23.0, 37.0, 64.0, 94.0, 145.0, 251.0, 403.0, 651.0, 999.0, 1673.0, 2590.0, 4236.0, 6953.0, 11467.0, 18383.0, 29972.0, 48292.0, 75297.0, 110361.0, 143914.0, 157109.0, 140144.0, 105672.0, 71318.0, 45015.0, 28284.0, 17416.0, 10746.0, 6507.0, 4049.0, 2429.0, 1523.0, 977.0, 553.0, 371.0, 222.0, 141.0, 90.0, 51.0, 47.0, 25.0, 10.0, 14.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.7412109375, -1.6891326904296875, -1.637054443359375, -1.5849761962890625, -1.53289794921875, -1.4808197021484375, -1.428741455078125, -1.3766632080078125, -1.3245849609375, -1.2725067138671875, -1.220428466796875, -1.1683502197265625, -1.11627197265625, -1.0641937255859375, -1.012115478515625, -0.9600372314453125, -0.907958984375, -0.8558807373046875, -0.803802490234375, -0.7517242431640625, -0.69964599609375, -0.6475677490234375, -0.595489501953125, -0.5434112548828125, -0.4913330078125, -0.4392547607421875, -0.387176513671875, -0.3350982666015625, -0.28302001953125, -0.2309417724609375, -0.178863525390625, -0.1267852783203125, -0.07470703125, -0.0226287841796875, 0.029449462890625, 0.0815277099609375, 0.13360595703125, 0.1856842041015625, 0.237762451171875, 0.2898406982421875, 0.3419189453125, 0.3939971923828125, 0.446075439453125, 0.4981536865234375, 0.55023193359375, 0.6023101806640625, 0.654388427734375, 0.7064666748046875, 0.758544921875, 0.8106231689453125, 0.862701416015625, 0.9147796630859375, 0.96685791015625, 1.0189361572265625, 1.071014404296875, 1.1230926513671875, 1.1751708984375, 1.2272491455078125, 1.279327392578125, 1.3314056396484375, 1.38348388671875, 1.4355621337890625, 1.487640380859375, 1.5397186279296875, 1.591796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 4.0, 9.0, 13.0, 15.0, 12.0, 18.0, 16.0, 23.0, 32.0, 30.0, 39.0, 54.0, 59.0, 59.0, 61.0, 57.0, 72.0, 56.0, 64.0, 54.0, 37.0, 23.0, 34.0, 30.0, 29.0, 22.0, 14.0, 12.0, 12.0, 11.0, 6.0, 4.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66064453125, -0.6390609741210938, -0.6174774169921875, -0.5958938598632812, -0.574310302734375, -0.5527267456054688, -0.5311431884765625, -0.5095596313476562, -0.48797607421875, -0.46639251708984375, -0.4448089599609375, -0.42322540283203125, -0.401641845703125, -0.38005828857421875, -0.3584747314453125, -0.33689117431640625, -0.3153076171875, -0.29372406005859375, -0.2721405029296875, -0.25055694580078125, -0.228973388671875, -0.20738983154296875, -0.1858062744140625, -0.16422271728515625, -0.14263916015625, -0.12105560302734375, -0.0994720458984375, -0.07788848876953125, -0.056304931640625, -0.03472137451171875, -0.0131378173828125, 0.00844573974609375, 0.030029296875, 0.05161285400390625, 0.0731964111328125, 0.09477996826171875, 0.116363525390625, 0.13794708251953125, 0.1595306396484375, 0.18111419677734375, 0.20269775390625, 0.22428131103515625, 0.2458648681640625, 0.26744842529296875, 0.289031982421875, 0.31061553955078125, 0.3321990966796875, 0.35378265380859375, 0.3753662109375, 0.39694976806640625, 0.4185333251953125, 0.44011688232421875, 0.461700439453125, 0.48328399658203125, 0.5048675537109375, 0.5264511108398438, 0.54803466796875, 0.5696182250976562, 0.5912017822265625, 0.6127853393554688, 0.634368896484375, 0.6559524536132812, 0.6775360107421875, 0.6991195678710938, 0.720703125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 9.0, 11.0, 12.0, 11.0, 21.0, 29.0, 48.0, 45.0, 48.0, 62.0, 59.0, 66.0, 60.0, 62.0, 59.0, 56.0, 61.0, 46.0, 44.0, 27.0, 34.0, 26.0, 18.0, 9.0, 7.0, 11.0, 10.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9030683040618896, -3.753147840499878, -3.6032276153564453, -3.4533071517944336, -3.303386926651001, -3.1534664630889893, -3.0035462379455566, -2.853625774383545, -2.703705310821533, -2.5537848472595215, -2.403864622116089, -2.253944158554077, -2.1040239334106445, -1.9541034698486328, -1.8041831254959106, -1.6542627811431885, -1.5043425559997559, -1.3544222116470337, -1.2045018672943115, -1.0545814037322998, -0.9046611189842224, -0.7547407746315002, -0.6048203706741333, -0.45490002632141113, -0.30497968196868896, -0.1550593227148056, -0.005138963460922241, 0.14478141069412231, 0.2947017550468445, 0.44462209939956665, 0.5945425033569336, 0.7444628477096558, 0.894383430480957, 1.0443037748336792, 1.1942241191864014, 1.344144582748413, 1.4940648078918457, 1.6439852714538574, 1.7939056158065796, 1.9438259601593018, 2.0937461853027344, 2.243666648864746, 2.3935868740081787, 2.5435073375701904, 2.693427562713623, 2.8433480262756348, 2.9932684898376465, 3.143188714981079, 3.293109178543091, 3.4430296421051025, 3.592949867248535, 3.742870330810547, 3.8927905559539795, 4.042710781097412, 4.192631244659424, 4.3425517082214355, 4.492472171783447, 4.642392635345459, 4.792313098907471, 4.942233085632324, 5.092153549194336, 5.242074012756348, 5.391994476318359, 5.541914939880371, 5.691834926605225]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 6.0, 1.0, 8.0, 1.0, 3.0, 6.0, 12.0, 13.0, 17.0, 12.0, 8.0, 14.0, 24.0, 21.0, 26.0, 35.0, 24.0, 33.0, 38.0, 38.0, 49.0, 44.0, 36.0, 43.0, 38.0, 34.0, 32.0, 31.0, 23.0, 28.0, 34.0, 26.0, 26.0, 32.0, 20.0, 25.0, 27.0, 16.0, 8.0, 11.0, 21.0, 9.0, 6.0, 4.0, 8.0, 4.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0], "bins": [-2.761392116546631, -2.680264949798584, -2.599137544631958, -2.518010377883911, -2.4368832111358643, -2.3557558059692383, -2.2746286392211914, -2.1935014724731445, -2.1123740673065186, -2.0312469005584717, -1.9501196146011353, -1.8689923286437988, -1.7878650426864624, -1.706737756729126, -1.625610589981079, -1.5444833040237427, -1.4633561372756958, -1.3822288513183594, -1.3011016845703125, -1.219974398612976, -1.1388471126556396, -1.0577199459075928, -0.9765926599502563, -0.8954653739929199, -0.8143381476402283, -0.7332109212875366, -0.6520836353302002, -0.5709564089775085, -0.4898291528224945, -0.40870189666748047, -0.3275746703147888, -0.2464473843574524, -0.16532015800476074, -0.0841929093003273, -0.00306566059589386, 0.07806158065795898, 0.15918883681297302, 0.24031609296798706, 0.3214433193206787, 0.40257060527801514, 0.4836978316307068, 0.5648250579833984, 0.6459523439407349, 0.7270795702934265, 0.8082067966461182, 0.8893340826034546, 0.9704613089561462, 1.051588535308838, 1.1327158212661743, 1.2138431072235107, 1.2949702739715576, 1.376097559928894, 1.4572248458862305, 1.5383520126342773, 1.6194792985916138, 1.7006065845489502, 1.781733751296997, 1.8628610372543335, 1.9439882040023804, 2.025115489959717, 2.1062426567077637, 2.1873700618743896, 2.2684972286224365, 2.3496246337890625, 2.4307518005371094]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 9.0, 11.0, 23.0, 25.0, 38.0, 52.0, 68.0, 117.0, 212.0, 318.0, 446.0, 691.0, 1043.0, 1769.0, 2851.0, 4684.0, 7814.0, 13949.0, 25472.0, 49713.0, 101316.0, 222267.0, 517864.0, 1031953.0, 1113228.0, 602227.0, 257634.0, 115340.0, 56228.0, 28931.0, 15911.0, 8980.0, 5106.0, 3008.0, 1882.0, 1128.0, 747.0, 439.0, 254.0, 203.0, 132.0, 71.0, 45.0, 43.0, 18.0, 13.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-5.203125, -5.0589599609375, -4.914794921875, -4.7706298828125, -4.62646484375, -4.4822998046875, -4.338134765625, -4.1939697265625, -4.0498046875, -3.9056396484375, -3.761474609375, -3.6173095703125, -3.47314453125, -3.3289794921875, -3.184814453125, -3.0406494140625, -2.896484375, -2.7523193359375, -2.608154296875, -2.4639892578125, -2.31982421875, -2.1756591796875, -2.031494140625, -1.8873291015625, -1.7431640625, -1.5989990234375, -1.454833984375, -1.3106689453125, -1.16650390625, -1.0223388671875, -0.878173828125, -0.7340087890625, -0.58984375, -0.4456787109375, -0.301513671875, -0.1573486328125, -0.01318359375, 0.1309814453125, 0.275146484375, 0.4193115234375, 0.5634765625, 0.7076416015625, 0.851806640625, 0.9959716796875, 1.14013671875, 1.2843017578125, 1.428466796875, 1.5726318359375, 1.716796875, 1.8609619140625, 2.005126953125, 2.1492919921875, 2.29345703125, 2.4376220703125, 2.581787109375, 2.7259521484375, 2.8701171875, 3.0142822265625, 3.158447265625, 3.3026123046875, 3.44677734375, 3.5909423828125, 3.735107421875, 3.8792724609375, 4.0234375]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 4.0, 4.0, 5.0, 10.0, 17.0, 14.0, 15.0, 14.0, 17.0, 21.0, 28.0, 19.0, 30.0, 43.0, 29.0, 37.0, 39.0, 40.0, 38.0, 48.0, 47.0, 34.0, 39.0, 32.0, 30.0, 36.0, 41.0, 33.0, 23.0, 21.0, 22.0, 23.0, 25.0, 20.0, 13.0, 10.0, 11.0, 7.0, 14.0, 3.0, 5.0, 4.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8919677734375, -1.831787109375, -1.7716064453125, -1.71142578125, -1.6512451171875, -1.591064453125, -1.5308837890625, -1.470703125, -1.4105224609375, -1.350341796875, -1.2901611328125, -1.22998046875, -1.1697998046875, -1.109619140625, -1.0494384765625, -0.9892578125, -0.9290771484375, -0.868896484375, -0.8087158203125, -0.74853515625, -0.6883544921875, -0.628173828125, -0.5679931640625, -0.5078125, -0.4476318359375, -0.387451171875, -0.3272705078125, -0.26708984375, -0.2069091796875, -0.146728515625, -0.0865478515625, -0.0263671875, 0.0338134765625, 0.093994140625, 0.1541748046875, 0.21435546875, 0.2745361328125, 0.334716796875, 0.3948974609375, 0.455078125, 0.5152587890625, 0.575439453125, 0.6356201171875, 0.69580078125, 0.7559814453125, 0.816162109375, 0.8763427734375, 0.9365234375, 0.9967041015625, 1.056884765625, 1.1170654296875, 1.17724609375, 1.2374267578125, 1.297607421875, 1.3577880859375, 1.41796875, 1.4781494140625, 1.538330078125, 1.5985107421875, 1.65869140625, 1.7188720703125, 1.779052734375, 1.8392333984375, 1.8994140625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 11.0, 7.0, 31.0, 29.0, 50.0, 63.0, 117.0, 179.0, 263.0, 385.0, 651.0, 930.0, 1634.0, 2557.0, 4142.0, 6969.0, 12067.0, 20994.0, 38495.0, 73202.0, 143392.0, 285092.0, 562891.0, 936695.0, 936982.0, 567641.0, 289982.0, 144460.0, 73875.0, 38822.0, 21567.0, 12151.0, 6983.0, 4029.0, 2544.0, 1585.0, 1007.0, 597.0, 406.0, 277.0, 191.0, 100.0, 81.0, 49.0, 34.0, 28.0, 16.0, 6.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.05859375, -3.92333984375, -3.7880859375, -3.65283203125, -3.517578125, -3.38232421875, -3.2470703125, -3.11181640625, -2.9765625, -2.84130859375, -2.7060546875, -2.57080078125, -2.435546875, -2.30029296875, -2.1650390625, -2.02978515625, -1.89453125, -1.75927734375, -1.6240234375, -1.48876953125, -1.353515625, -1.21826171875, -1.0830078125, -0.94775390625, -0.8125, -0.67724609375, -0.5419921875, -0.40673828125, -0.271484375, -0.13623046875, -0.0009765625, 0.13427734375, 0.26953125, 0.40478515625, 0.5400390625, 0.67529296875, 0.810546875, 0.94580078125, 1.0810546875, 1.21630859375, 1.3515625, 1.48681640625, 1.6220703125, 1.75732421875, 1.892578125, 2.02783203125, 2.1630859375, 2.29833984375, 2.43359375, 2.56884765625, 2.7041015625, 2.83935546875, 2.974609375, 3.10986328125, 3.2451171875, 3.38037109375, 3.515625, 3.65087890625, 3.7861328125, 3.92138671875, 4.056640625, 4.19189453125, 4.3271484375, 4.46240234375, 4.59765625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 6.0, 3.0, 10.0, 4.0, 10.0, 17.0, 22.0, 20.0, 27.0, 34.0, 55.0, 61.0, 82.0, 86.0, 113.0, 114.0, 148.0, 191.0, 226.0, 230.0, 246.0, 247.0, 246.0, 264.0, 224.0, 224.0, 200.0, 181.0, 147.0, 119.0, 104.0, 85.0, 67.0, 71.0, 44.0, 32.0, 27.0, 30.0, 14.0, 11.0, 8.0, 10.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.209442138671875, -1.17181396484375, -1.134185791015625, -1.0965576171875, -1.058929443359375, -1.02130126953125, -0.983673095703125, -0.946044921875, -0.908416748046875, -0.87078857421875, -0.833160400390625, -0.7955322265625, -0.757904052734375, -0.72027587890625, -0.682647705078125, -0.64501953125, -0.607391357421875, -0.56976318359375, -0.532135009765625, -0.4945068359375, -0.456878662109375, -0.41925048828125, -0.381622314453125, -0.343994140625, -0.306365966796875, -0.26873779296875, -0.231109619140625, -0.1934814453125, -0.155853271484375, -0.11822509765625, -0.080596923828125, -0.04296875, -0.005340576171875, 0.03228759765625, 0.069915771484375, 0.1075439453125, 0.145172119140625, 0.18280029296875, 0.220428466796875, 0.258056640625, 0.295684814453125, 0.33331298828125, 0.370941162109375, 0.4085693359375, 0.446197509765625, 0.48382568359375, 0.521453857421875, 0.55908203125, 0.596710205078125, 0.63433837890625, 0.671966552734375, 0.7095947265625, 0.747222900390625, 0.78485107421875, 0.822479248046875, 0.860107421875, 0.897735595703125, 0.93536376953125, 0.972991943359375, 1.0106201171875, 1.048248291015625, 1.08587646484375, 1.123504638671875, 1.1611328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 6.0, 7.0, 10.0, 15.0, 16.0, 14.0, 20.0, 28.0, 32.0, 33.0, 51.0, 43.0, 52.0, 56.0, 46.0, 53.0, 56.0, 61.0, 51.0, 45.0, 34.0, 36.0, 35.0, 33.0, 25.0, 24.0, 23.0, 15.0, 6.0, 20.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2587530612945557, -3.1374149322509766, -3.0160770416259766, -2.8947389125823975, -2.7734007835388184, -2.6520628929138184, -2.5307247638702393, -2.40938663482666, -2.28804874420166, -2.166710615158081, -2.045372724533081, -1.924034595489502, -1.8026965856552124, -1.6813585758209229, -1.5600204467773438, -1.4386824369430542, -1.3173444271087646, -1.196006417274475, -1.0746684074401855, -0.9533302783966064, -0.8319922685623169, -0.7106542587280273, -0.589316189289093, -0.4679781198501587, -0.34664011001586914, -0.2253020703792572, -0.10396403074264526, 0.017374008893966675, 0.1387120485305786, 0.26005005836486816, 0.3813881278038025, 0.5027261972427368, 0.6240639686584473, 0.7454019784927368, 0.8667400479316711, 0.9880781173706055, 1.109416127204895, 1.2307541370391846, 1.3520922660827637, 1.4734302759170532, 1.5947682857513428, 1.7161062955856323, 1.8374443054199219, 1.958782434463501, 2.08012056350708, 2.20145845413208, 2.322796583175659, 2.4441347122192383, 2.5654726028442383, 2.6868107318878174, 2.8081486225128174, 2.9294867515563965, 3.0508246421813965, 3.1721627712249756, 3.2935009002685547, 3.4148387908935547, 3.536176919937134, 3.657515048980713, 3.778852939605713, 3.900191068649292, 4.021529197692871, 4.142867088317871, 4.264204978942871, 4.385543346405029, 4.506881237030029]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 7.0, 12.0, 9.0, 6.0, 11.0, 9.0, 14.0, 15.0, 20.0, 23.0, 15.0, 17.0, 29.0, 34.0, 35.0, 29.0, 26.0, 38.0, 30.0, 46.0, 46.0, 50.0, 43.0, 28.0, 27.0, 29.0, 38.0, 36.0, 31.0, 37.0, 20.0, 22.0, 11.0, 20.0, 24.0, 17.0, 22.0, 13.0, 8.0, 13.0, 7.0, 7.0, 4.0, 9.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-2.0733299255371094, -2.0040252208709717, -1.934720516204834, -1.8654159307479858, -1.7961112260818481, -1.7268065214157104, -1.6575019359588623, -1.5881972312927246, -1.518892526626587, -1.4495878219604492, -1.3802831172943115, -1.3109785318374634, -1.2416738271713257, -1.172369122505188, -1.1030645370483398, -1.0337598323822021, -0.9644551277160645, -0.8951504230499268, -0.8258457779884338, -0.7565411329269409, -0.6872364282608032, -0.6179317235946655, -0.5486270785331726, -0.4793224036693573, -0.410017728805542, -0.3407130539417267, -0.2714083790779114, -0.20210370421409607, -0.13279902935028076, -0.06349435448646545, 0.0058103203773498535, 0.07511499524116516, 0.14441990852355957, 0.21372458338737488, 0.2830292582511902, 0.3523339331150055, 0.4216386079788208, 0.4909432828426361, 0.5602479577064514, 0.6295526027679443, 0.698857307434082, 0.7681620121002197, 0.8374666571617126, 0.9067713022232056, 0.9760760068893433, 1.045380711555481, 1.114685297012329, 1.1839900016784668, 1.2532947063446045, 1.3225994110107422, 1.3919041156768799, 1.461208701133728, 1.5305134057998657, 1.5998181104660034, 1.6691226959228516, 1.7384274005889893, 1.807732105255127, 1.8770368099212646, 1.9463415145874023, 2.01564621925354, 2.0849509239196777, 2.1542553901672363, 2.223560094833374, 2.2928647994995117, 2.3621695041656494]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 13.0, 23.0, 32.0, 56.0, 83.0, 115.0, 169.0, 296.0, 415.0, 628.0, 950.0, 1496.0, 2328.0, 3663.0, 5729.0, 9105.0, 14356.0, 22547.0, 35283.0, 54423.0, 82369.0, 117504.0, 148476.0, 153693.0, 128318.0, 93210.0, 62004.0, 40552.0, 25638.0, 16361.0, 10314.0, 6504.0, 4231.0, 2696.0, 1805.0, 1110.0, 681.0, 446.0, 324.0, 204.0, 121.0, 111.0, 48.0, 32.0, 23.0, 10.0, 15.0, 10.0, 7.0, 7.0, 3.0, 6.0, 2.0], "bins": [-0.315673828125, -0.3064308166503906, -0.29718780517578125, -0.2879447937011719, -0.2787017822265625, -0.2694587707519531, -0.26021575927734375, -0.2509727478027344, -0.241729736328125, -0.23248672485351562, -0.22324371337890625, -0.21400070190429688, -0.2047576904296875, -0.19551467895507812, -0.18627166748046875, -0.17702865600585938, -0.16778564453125, -0.15854263305664062, -0.14929962158203125, -0.14005661010742188, -0.1308135986328125, -0.12157058715820312, -0.11232757568359375, -0.10308456420898438, -0.093841552734375, -0.08459854125976562, -0.07535552978515625, -0.06611251831054688, -0.0568695068359375, -0.047626495361328125, -0.03838348388671875, -0.029140472412109375, -0.0198974609375, -0.010654449462890625, -0.00141143798828125, 0.007831573486328125, 0.0170745849609375, 0.026317596435546875, 0.03556060791015625, 0.044803619384765625, 0.054046630859375, 0.06328964233398438, 0.07253265380859375, 0.08177566528320312, 0.0910186767578125, 0.10026168823242188, 0.10950469970703125, 0.11874771118164062, 0.12799072265625, 0.13723373413085938, 0.14647674560546875, 0.15571975708007812, 0.1649627685546875, 0.17420578002929688, 0.18344879150390625, 0.19269180297851562, 0.201934814453125, 0.21117782592773438, 0.22042083740234375, 0.22966384887695312, 0.2389068603515625, 0.24814987182617188, 0.25739288330078125, 0.2666358947753906, 0.27587890625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 12.0, 10.0, 16.0, 15.0, 23.0, 22.0, 18.0, 20.0, 36.0, 20.0, 26.0, 40.0, 25.0, 41.0, 45.0, 40.0, 44.0, 53.0, 40.0, 38.0, 47.0, 33.0, 30.0, 31.0, 34.0, 25.0, 19.0, 27.0, 19.0, 23.0, 11.0, 19.0, 19.0, 20.0, 14.0, 4.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28125, -2.198883056640625, -2.11651611328125, -2.034149169921875, -1.9517822265625, -1.869415283203125, -1.78704833984375, -1.704681396484375, -1.622314453125, -1.539947509765625, -1.45758056640625, -1.375213623046875, -1.2928466796875, -1.210479736328125, -1.12811279296875, -1.045745849609375, -0.96337890625, -0.881011962890625, -0.79864501953125, -0.716278076171875, -0.6339111328125, -0.551544189453125, -0.46917724609375, -0.386810302734375, -0.304443359375, -0.222076416015625, -0.13970947265625, -0.057342529296875, 0.0250244140625, 0.107391357421875, 0.18975830078125, 0.272125244140625, 0.3544921875, 0.436859130859375, 0.51922607421875, 0.601593017578125, 0.6839599609375, 0.766326904296875, 0.84869384765625, 0.931060791015625, 1.013427734375, 1.095794677734375, 1.17816162109375, 1.260528564453125, 1.3428955078125, 1.425262451171875, 1.50762939453125, 1.589996337890625, 1.67236328125, 1.754730224609375, 1.83709716796875, 1.919464111328125, 2.0018310546875, 2.084197998046875, 2.16656494140625, 2.248931884765625, 2.331298828125, 2.413665771484375, 2.49603271484375, 2.578399658203125, 2.6607666015625, 2.743133544921875, 2.82550048828125, 2.907867431640625, 2.990234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 6.0, 7.0, 11.0, 16.0, 19.0, 25.0, 26.0, 59.0, 57.0, 85.0, 108.0, 148.0, 195.0, 308.0, 451.0, 649.0, 1094.0, 1778.0, 3170.0, 5974.0, 11518.0, 24087.0, 118039.0, 796702.0, 46413.0, 17614.0, 8661.0, 4488.0, 2536.0, 1451.0, 931.0, 610.0, 382.0, 260.0, 184.0, 123.0, 104.0, 59.0, 42.0, 34.0, 25.0, 20.0, 24.0, 11.0, 16.0, 10.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.95849609375, -0.92578125, -0.89306640625, -0.8603515625, -0.82763671875, -0.794921875, -0.76220703125, -0.7294921875, -0.69677734375, -0.6640625, -0.63134765625, -0.5986328125, -0.56591796875, -0.533203125, -0.50048828125, -0.4677734375, -0.43505859375, -0.40234375, -0.36962890625, -0.3369140625, -0.30419921875, -0.271484375, -0.23876953125, -0.2060546875, -0.17333984375, -0.140625, -0.10791015625, -0.0751953125, -0.04248046875, -0.009765625, 0.02294921875, 0.0556640625, 0.08837890625, 0.12109375, 0.15380859375, 0.1865234375, 0.21923828125, 0.251953125, 0.28466796875, 0.3173828125, 0.35009765625, 0.3828125, 0.41552734375, 0.4482421875, 0.48095703125, 0.513671875, 0.54638671875, 0.5791015625, 0.61181640625, 0.64453125, 0.67724609375, 0.7099609375, 0.74267578125, 0.775390625, 0.80810546875, 0.8408203125, 0.87353515625, 0.90625, 0.93896484375, 0.9716796875, 1.00439453125, 1.037109375, 1.06982421875, 1.1025390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 4.0, 8.0, 5.0, 14.0, 14.0, 13.0, 22.0, 21.0, 15.0, 24.0, 20.0, 30.0, 34.0, 30.0, 30.0, 42.0, 36.0, 34.0, 29.0, 36.0, 43.0, 30.0, 35.0, 34.0, 29.0, 36.0, 35.0, 31.0, 31.0, 34.0, 25.0, 19.0, 15.0, 20.0, 21.0, 13.0, 14.0, 9.0, 9.0, 10.0, 8.0, 10.0, 8.0, 5.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.6951446533203125, -1.640289306640625, -1.5854339599609375, -1.53057861328125, -1.4757232666015625, -1.420867919921875, -1.3660125732421875, -1.3111572265625, -1.2563018798828125, -1.201446533203125, -1.1465911865234375, -1.09173583984375, -1.0368804931640625, -0.982025146484375, -0.9271697998046875, -0.872314453125, -0.8174591064453125, -0.762603759765625, -0.7077484130859375, -0.65289306640625, -0.5980377197265625, -0.543182373046875, -0.4883270263671875, -0.4334716796875, -0.3786163330078125, -0.323760986328125, -0.2689056396484375, -0.21405029296875, -0.1591949462890625, -0.104339599609375, -0.0494842529296875, 0.00537109375, 0.0602264404296875, 0.115081787109375, 0.1699371337890625, 0.22479248046875, 0.2796478271484375, 0.334503173828125, 0.3893585205078125, 0.4442138671875, 0.4990692138671875, 0.553924560546875, 0.6087799072265625, 0.66363525390625, 0.7184906005859375, 0.773345947265625, 0.8282012939453125, 0.883056640625, 0.9379119873046875, 0.992767333984375, 1.0476226806640625, 1.10247802734375, 1.1573333740234375, 1.212188720703125, 1.2670440673828125, 1.3218994140625, 1.3767547607421875, 1.431610107421875, 1.4864654541015625, 1.54132080078125, 1.5961761474609375, 1.651031494140625, 1.7058868408203125, 1.7607421875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 2.0, 5.0, 13.0, 8.0, 17.0, 27.0, 41.0, 45.0, 52.0, 75.0, 95.0, 166.0, 267.0, 347.0, 566.0, 726.0, 1188.0, 1758.0, 2726.0, 4350.0, 7189.0, 12202.0, 22586.0, 81549.0, 834490.0, 35479.0, 16747.0, 9663.0, 5644.0, 3639.0, 2321.0, 1483.0, 988.0, 660.0, 424.0, 305.0, 211.0, 152.0, 95.0, 65.0, 49.0, 35.0, 32.0, 21.0, 13.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.259033203125, -0.24953460693359375, -0.2400360107421875, -0.23053741455078125, -0.221038818359375, -0.21154022216796875, -0.2020416259765625, -0.19254302978515625, -0.18304443359375, -0.17354583740234375, -0.1640472412109375, -0.15454864501953125, -0.145050048828125, -0.13555145263671875, -0.1260528564453125, -0.11655426025390625, -0.1070556640625, -0.09755706787109375, -0.0880584716796875, -0.07855987548828125, -0.069061279296875, -0.05956268310546875, -0.0500640869140625, -0.04056549072265625, -0.03106689453125, -0.02156829833984375, -0.0120697021484375, -0.00257110595703125, 0.006927490234375, 0.01642608642578125, 0.0259246826171875, 0.03542327880859375, 0.044921875, 0.05442047119140625, 0.0639190673828125, 0.07341766357421875, 0.082916259765625, 0.09241485595703125, 0.1019134521484375, 0.11141204833984375, 0.12091064453125, 0.13040924072265625, 0.1399078369140625, 0.14940643310546875, 0.158905029296875, 0.16840362548828125, 0.1779022216796875, 0.18740081787109375, 0.1968994140625, 0.20639801025390625, 0.2158966064453125, 0.22539520263671875, 0.234893798828125, 0.24439239501953125, 0.2538909912109375, 0.26338958740234375, 0.27288818359375, 0.28238677978515625, 0.2918853759765625, 0.30138397216796875, 0.310882568359375, 0.32038116455078125, 0.3298797607421875, 0.33937835693359375, 0.348876953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 6.0, 11.0, 17.0, 21.0, 19.0, 25.0, 18.0, 26.0, 19.0, 39.0, 32.0, 43.0, 40.0, 43.0, 35.0, 53.0, 37.0, 56.0, 42.0, 55.0, 40.0, 43.0, 45.0, 34.0, 26.0, 26.0, 24.0, 18.0, 17.0, 6.0, 13.0, 13.0, 14.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.562999725341797e-05, -2.470053732395172e-05, -2.3771077394485474e-05, -2.2841617465019226e-05, -2.191215753555298e-05, -2.098269760608673e-05, -2.0053237676620483e-05, -1.9123777747154236e-05, -1.8194317817687988e-05, -1.726485788822174e-05, -1.6335397958755493e-05, -1.5405938029289246e-05, -1.4476478099822998e-05, -1.354701817035675e-05, -1.2617558240890503e-05, -1.1688098311424255e-05, -1.0758638381958008e-05, -9.82917845249176e-06, -8.899718523025513e-06, -7.970258593559265e-06, -7.040798664093018e-06, -6.11133873462677e-06, -5.1818788051605225e-06, -4.252418875694275e-06, -3.3229589462280273e-06, -2.3934990167617798e-06, -1.4640390872955322e-06, -5.345791578292847e-07, 3.948807716369629e-07, 1.3243407011032104e-06, 2.253800630569458e-06, 3.1832605600357056e-06, 4.112720489501953e-06, 5.042180418968201e-06, 5.971640348434448e-06, 6.901100277900696e-06, 7.830560207366943e-06, 8.760020136833191e-06, 9.689480066299438e-06, 1.0618939995765686e-05, 1.1548399925231934e-05, 1.2477859854698181e-05, 1.3407319784164429e-05, 1.4336779713630676e-05, 1.5266239643096924e-05, 1.619569957256317e-05, 1.712515950202942e-05, 1.8054619431495667e-05, 1.8984079360961914e-05, 1.991353929042816e-05, 2.084299921989441e-05, 2.1772459149360657e-05, 2.2701919078826904e-05, 2.3631379008293152e-05, 2.45608389377594e-05, 2.5490298867225647e-05, 2.6419758796691895e-05, 2.7349218726158142e-05, 2.827867865562439e-05, 2.9208138585090637e-05, 3.0137598514556885e-05, 3.106705844402313e-05, 3.199651837348938e-05, 3.292597830295563e-05, 3.3855438232421875e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 23.0, 29.0, 40.0, 61.0, 68.0, 111.0, 172.0, 255.0, 422.0, 757.0, 1277.0, 2200.0, 3683.0, 6939.0, 13388.0, 27587.0, 58850.0, 130249.0, 254678.0, 271229.0, 146350.0, 66656.0, 30960.0, 15126.0, 7651.0, 4123.0, 2271.0, 1280.0, 823.0, 473.0, 291.0, 167.0, 126.0, 78.0, 50.0, 25.0, 15.0, 16.0, 5.0, 7.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.1693115234375, -0.16434288024902344, -0.15937423706054688, -0.1544055938720703, -0.14943695068359375, -0.1444683074951172, -0.13949966430664062, -0.13453102111816406, -0.1295623779296875, -0.12459373474121094, -0.11962509155273438, -0.11465644836425781, -0.10968780517578125, -0.10471916198730469, -0.09975051879882812, -0.09478187561035156, -0.089813232421875, -0.08484458923339844, -0.07987594604492188, -0.07490730285644531, -0.06993865966796875, -0.06497001647949219, -0.060001373291015625, -0.05503273010253906, -0.0500640869140625, -0.04509544372558594, -0.040126800537109375, -0.03515815734863281, -0.03018951416015625, -0.025220870971679688, -0.020252227783203125, -0.015283584594726562, -0.01031494140625, -0.0053462982177734375, -0.000377655029296875, 0.0045909881591796875, 0.00955963134765625, 0.014528274536132812, 0.019496917724609375, 0.024465560913085938, 0.0294342041015625, 0.03440284729003906, 0.039371490478515625, 0.04434013366699219, 0.04930877685546875, 0.05427742004394531, 0.059246063232421875, 0.06421470642089844, 0.069183349609375, 0.07415199279785156, 0.07912063598632812, 0.08408927917480469, 0.08905792236328125, 0.09402656555175781, 0.09899520874023438, 0.10396385192871094, 0.1089324951171875, 0.11390113830566406, 0.11886978149414062, 0.12383842468261719, 0.12880706787109375, 0.1337757110595703, 0.13874435424804688, 0.14371299743652344, 0.148681640625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 7.0, 16.0, 14.0, 10.0, 15.0, 16.0, 24.0, 29.0, 43.0, 62.0, 54.0, 76.0, 69.0, 85.0, 76.0, 56.0, 58.0, 54.0, 45.0, 22.0, 33.0, 18.0, 25.0, 20.0, 17.0, 10.0, 11.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06414794921875, -0.06186485290527344, -0.059581756591796875, -0.05729866027832031, -0.05501556396484375, -0.05273246765136719, -0.050449371337890625, -0.04816627502441406, -0.0458831787109375, -0.04360008239746094, -0.041316986083984375, -0.03903388977050781, -0.03675079345703125, -0.03446769714355469, -0.032184600830078125, -0.029901504516601562, -0.027618408203125, -0.025335311889648438, -0.023052215576171875, -0.020769119262695312, -0.01848602294921875, -0.016202926635742188, -0.013919830322265625, -0.011636734008789062, -0.0093536376953125, -0.0070705413818359375, -0.004787445068359375, -0.0025043487548828125, -0.00022125244140625, 0.0020618438720703125, 0.004344940185546875, 0.0066280364990234375, 0.0089111328125, 0.011194229125976562, 0.013477325439453125, 0.015760421752929688, 0.01804351806640625, 0.020326614379882812, 0.022609710693359375, 0.024892807006835938, 0.0271759033203125, 0.029458999633789062, 0.031742095947265625, 0.03402519226074219, 0.03630828857421875, 0.03859138488769531, 0.040874481201171875, 0.04315757751464844, 0.045440673828125, 0.04772377014160156, 0.050006866455078125, 0.05228996276855469, 0.05457305908203125, 0.05685615539550781, 0.059139251708984375, 0.06142234802246094, 0.0637054443359375, 0.06598854064941406, 0.06827163696289062, 0.07055473327636719, 0.07283782958984375, 0.07512092590332031, 0.07740402221679688, 0.07968711853027344, 0.08197021484375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 9.0, 6.0, 10.0, 10.0, 11.0, 18.0, 15.0, 25.0, 20.0, 39.0, 35.0, 50.0, 44.0, 51.0, 56.0, 46.0, 60.0, 53.0, 61.0, 44.0, 48.0, 34.0, 34.0, 32.0, 39.0, 18.0, 26.0, 22.0, 14.0, 9.0, 18.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2084171772003174, -3.0880517959594727, -2.967686653137207, -2.8473212718963623, -2.7269558906555176, -2.606590747833252, -2.4862253665924072, -2.3658599853515625, -2.245494842529297, -2.125129461288452, -2.0047643184661865, -1.8843989372253418, -1.764033555984497, -1.643668293952942, -1.5233030319213867, -1.402937650680542, -1.2825722694396973, -1.162207007408142, -1.0418416261672974, -0.9214763641357422, -0.8011110424995422, -0.6807457208633423, -0.5603804588317871, -0.44001513719558716, -0.3196498155593872, -0.19928450882434845, -0.07891920208930969, 0.04144608974456787, 0.16181141138076782, 0.2821767330169678, 0.40254199504852295, 0.5229073166847229, 0.643272876739502, 0.7636381983757019, 0.8840035200119019, 1.004368782043457, 1.1247341632843018, 1.245099425315857, 1.365464687347412, 1.4858300685882568, 1.606195330619812, 1.7265605926513672, 1.846925973892212, 1.967291235923767, 2.0876564979553223, 2.208021879196167, 2.3283872604370117, 2.4487524032592773, 2.569117784500122, 2.689483165740967, 2.8098483085632324, 2.930213689804077, 3.050579071044922, 3.1709442138671875, 3.2913095951080322, 3.411674976348877, 3.5320401191711426, 3.6524055004119873, 3.772770643234253, 3.8931360244750977, 4.013501167297363, 4.133866786956787, 4.254231929779053, 4.374597072601318, 4.494962692260742]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 8.0, 9.0, 12.0, 6.0, 8.0, 10.0, 16.0, 17.0, 14.0, 26.0, 14.0, 19.0, 27.0, 40.0, 33.0, 30.0, 30.0, 29.0, 37.0, 40.0, 49.0, 50.0, 42.0, 26.0, 30.0, 31.0, 39.0, 33.0, 31.0, 36.0, 24.0, 17.0, 14.0, 18.0, 23.0, 22.0, 18.0, 10.0, 12.0, 11.0, 7.0, 6.0, 5.0, 10.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-2.064056634902954, -1.9949069023132324, -1.9257571697235107, -1.856607437133789, -1.7874577045440674, -1.7183079719543457, -1.649158239364624, -1.5800085067749023, -1.5108587741851807, -1.441709041595459, -1.3725593090057373, -1.3034095764160156, -1.234259843826294, -1.1651101112365723, -1.0959603786468506, -1.026810646057129, -0.9576607942581177, -0.888511061668396, -0.8193613290786743, -0.7502115964889526, -0.681061863899231, -0.6119121313095093, -0.5427623391151428, -0.47361260652542114, -0.40446287393569946, -0.3353131413459778, -0.2661634087562561, -0.19701364636421204, -0.12786391377449036, -0.05871418118476868, 0.01043558120727539, 0.07958531379699707, 0.14873504638671875, 0.21788477897644043, 0.2870345115661621, 0.3561842739582062, 0.42533400654792786, 0.49448373913764954, 0.5636335015296936, 0.6327832341194153, 0.701932966709137, 0.7710826992988586, 0.8402324318885803, 0.9093822240829468, 0.9785319566726685, 1.0476816892623901, 1.1168314218521118, 1.1859811544418335, 1.2551308870315552, 1.3242806196212769, 1.3934303522109985, 1.4625800848007202, 1.531729817390442, 1.6008795499801636, 1.6700294017791748, 1.7391791343688965, 1.8083288669586182, 1.8774785995483398, 1.9466283321380615, 2.015778064727783, 2.084927797317505, 2.1540775299072266, 2.2232272624969482, 2.29237699508667, 2.3615267276763916]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 14.0, 19.0, 21.0, 34.0, 57.0, 84.0, 104.0, 166.0, 259.0, 423.0, 609.0, 913.0, 1560.0, 2424.0, 4022.0, 6612.0, 11138.0, 18550.0, 31169.0, 49787.0, 76607.0, 108486.0, 137858.0, 150213.0, 137697.0, 108016.0, 76042.0, 48777.0, 30343.0, 18343.0, 11057.0, 6567.0, 3908.0, 2419.0, 1487.0, 921.0, 591.0, 397.0, 284.0, 189.0, 126.0, 65.0, 73.0, 33.0, 27.0, 16.0, 16.0, 11.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.451171875, -2.373321533203125, -2.29547119140625, -2.217620849609375, -2.1397705078125, -2.061920166015625, -1.98406982421875, -1.906219482421875, -1.828369140625, -1.750518798828125, -1.67266845703125, -1.594818115234375, -1.5169677734375, -1.439117431640625, -1.36126708984375, -1.283416748046875, -1.20556640625, -1.127716064453125, -1.04986572265625, -0.972015380859375, -0.8941650390625, -0.816314697265625, -0.73846435546875, -0.660614013671875, -0.582763671875, -0.504913330078125, -0.42706298828125, -0.349212646484375, -0.2713623046875, -0.193511962890625, -0.11566162109375, -0.037811279296875, 0.0400390625, 0.117889404296875, 0.19573974609375, 0.273590087890625, 0.3514404296875, 0.429290771484375, 0.50714111328125, 0.584991455078125, 0.662841796875, 0.740692138671875, 0.81854248046875, 0.896392822265625, 0.9742431640625, 1.052093505859375, 1.12994384765625, 1.207794189453125, 1.28564453125, 1.363494873046875, 1.44134521484375, 1.519195556640625, 1.5970458984375, 1.674896240234375, 1.75274658203125, 1.830596923828125, 1.908447265625, 1.986297607421875, 2.06414794921875, 2.141998291015625, 2.2198486328125, 2.297698974609375, 2.37554931640625, 2.453399658203125, 2.53125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 4.0, 10.0, 11.0, 10.0, 8.0, 17.0, 24.0, 20.0, 24.0, 22.0, 18.0, 33.0, 19.0, 35.0, 39.0, 26.0, 49.0, 46.0, 50.0, 41.0, 39.0, 29.0, 39.0, 43.0, 32.0, 30.0, 29.0, 28.0, 23.0, 28.0, 27.0, 18.0, 14.0, 19.0, 14.0, 13.0, 11.0, 9.0, 11.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-2.333984375, -2.254425048828125, -2.17486572265625, -2.095306396484375, -2.0157470703125, -1.936187744140625, -1.85662841796875, -1.777069091796875, -1.697509765625, -1.617950439453125, -1.53839111328125, -1.458831787109375, -1.3792724609375, -1.299713134765625, -1.22015380859375, -1.140594482421875, -1.06103515625, -0.981475830078125, -0.90191650390625, -0.822357177734375, -0.7427978515625, -0.663238525390625, -0.58367919921875, -0.504119873046875, -0.424560546875, -0.345001220703125, -0.26544189453125, -0.185882568359375, -0.1063232421875, -0.026763916015625, 0.05279541015625, 0.132354736328125, 0.2119140625, 0.291473388671875, 0.37103271484375, 0.450592041015625, 0.5301513671875, 0.609710693359375, 0.68927001953125, 0.768829345703125, 0.848388671875, 0.927947998046875, 1.00750732421875, 1.087066650390625, 1.1666259765625, 1.246185302734375, 1.32574462890625, 1.405303955078125, 1.48486328125, 1.564422607421875, 1.64398193359375, 1.723541259765625, 1.8031005859375, 1.882659912109375, 1.96221923828125, 2.041778564453125, 2.121337890625, 2.200897216796875, 2.28045654296875, 2.360015869140625, 2.4395751953125, 2.519134521484375, 2.59869384765625, 2.678253173828125, 2.7578125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 15.0, 28.0, 41.0, 60.0, 97.0, 127.0, 228.0, 310.0, 407.0, 718.0, 1129.0, 1664.0, 2514.0, 3922.0, 5911.0, 8993.0, 14307.0, 21533.0, 32764.0, 47827.0, 69122.0, 93037.0, 115252.0, 129046.0, 125140.0, 107743.0, 83663.0, 60639.0, 41578.0, 27840.0, 18275.0, 11956.0, 7723.0, 5136.0, 3386.0, 2207.0, 1447.0, 927.0, 562.0, 420.0, 266.0, 175.0, 125.0, 104.0, 63.0, 36.0, 31.0, 13.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0], "bins": [-2.25, -2.181427001953125, -2.11285400390625, -2.044281005859375, -1.9757080078125, -1.907135009765625, -1.83856201171875, -1.769989013671875, -1.701416015625, -1.632843017578125, -1.56427001953125, -1.495697021484375, -1.4271240234375, -1.358551025390625, -1.28997802734375, -1.221405029296875, -1.15283203125, -1.084259033203125, -1.01568603515625, -0.947113037109375, -0.8785400390625, -0.809967041015625, -0.74139404296875, -0.672821044921875, -0.604248046875, -0.535675048828125, -0.46710205078125, -0.398529052734375, -0.3299560546875, -0.261383056640625, -0.19281005859375, -0.124237060546875, -0.0556640625, 0.012908935546875, 0.08148193359375, 0.150054931640625, 0.2186279296875, 0.287200927734375, 0.35577392578125, 0.424346923828125, 0.492919921875, 0.561492919921875, 0.63006591796875, 0.698638916015625, 0.7672119140625, 0.835784912109375, 0.90435791015625, 0.972930908203125, 1.04150390625, 1.110076904296875, 1.17864990234375, 1.247222900390625, 1.3157958984375, 1.384368896484375, 1.45294189453125, 1.521514892578125, 1.590087890625, 1.658660888671875, 1.72723388671875, 1.795806884765625, 1.8643798828125, 1.932952880859375, 2.00152587890625, 2.070098876953125, 2.138671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 3.0, 3.0, 4.0, 6.0, 11.0, 11.0, 13.0, 18.0, 16.0, 20.0, 26.0, 29.0, 18.0, 37.0, 40.0, 50.0, 48.0, 31.0, 43.0, 44.0, 37.0, 47.0, 48.0, 41.0, 42.0, 48.0, 35.0, 33.0, 36.0, 18.0, 25.0, 22.0, 22.0, 16.0, 11.0, 8.0, 9.0, 4.0, 8.0, 12.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.770233154296875, -1.71234130859375, -1.654449462890625, -1.5965576171875, -1.538665771484375, -1.48077392578125, -1.422882080078125, -1.364990234375, -1.307098388671875, -1.24920654296875, -1.191314697265625, -1.1334228515625, -1.075531005859375, -1.01763916015625, -0.959747314453125, -0.90185546875, -0.843963623046875, -0.78607177734375, -0.728179931640625, -0.6702880859375, -0.612396240234375, -0.55450439453125, -0.496612548828125, -0.438720703125, -0.380828857421875, -0.32293701171875, -0.265045166015625, -0.2071533203125, -0.149261474609375, -0.09136962890625, -0.033477783203125, 0.0244140625, 0.082305908203125, 0.14019775390625, 0.198089599609375, 0.2559814453125, 0.313873291015625, 0.37176513671875, 0.429656982421875, 0.487548828125, 0.545440673828125, 0.60333251953125, 0.661224365234375, 0.7191162109375, 0.777008056640625, 0.83489990234375, 0.892791748046875, 0.95068359375, 1.008575439453125, 1.06646728515625, 1.124359130859375, 1.1822509765625, 1.240142822265625, 1.29803466796875, 1.355926513671875, 1.413818359375, 1.471710205078125, 1.52960205078125, 1.587493896484375, 1.6453857421875, 1.703277587890625, 1.76116943359375, 1.819061279296875, 1.876953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 13.0, 14.0, 23.0, 29.0, 43.0, 64.0, 93.0, 154.0, 256.0, 403.0, 656.0, 1166.0, 1897.0, 3336.0, 5876.0, 10222.0, 18268.0, 32339.0, 56490.0, 93837.0, 143808.0, 182255.0, 174814.0, 129306.0, 81618.0, 48177.0, 27264.0, 15309.0, 8828.0, 4834.0, 2949.0, 1652.0, 989.0, 588.0, 362.0, 218.0, 145.0, 81.0, 58.0, 42.0, 19.0, 19.0, 14.0, 3.0, 12.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.5177154541015625, -1.465118408203125, -1.4125213623046875, -1.35992431640625, -1.3073272705078125, -1.254730224609375, -1.2021331787109375, -1.1495361328125, -1.0969390869140625, -1.044342041015625, -0.9917449951171875, -0.93914794921875, -0.8865509033203125, -0.833953857421875, -0.7813568115234375, -0.728759765625, -0.6761627197265625, -0.623565673828125, -0.5709686279296875, -0.51837158203125, -0.4657745361328125, -0.413177490234375, -0.3605804443359375, -0.3079833984375, -0.2553863525390625, -0.202789306640625, -0.1501922607421875, -0.09759521484375, -0.0449981689453125, 0.007598876953125, 0.0601959228515625, 0.11279296875, 0.1653900146484375, 0.217987060546875, 0.2705841064453125, 0.32318115234375, 0.3757781982421875, 0.428375244140625, 0.4809722900390625, 0.5335693359375, 0.5861663818359375, 0.638763427734375, 0.6913604736328125, 0.74395751953125, 0.7965545654296875, 0.849151611328125, 0.9017486572265625, 0.954345703125, 1.0069427490234375, 1.059539794921875, 1.1121368408203125, 1.16473388671875, 1.2173309326171875, 1.269927978515625, 1.3225250244140625, 1.3751220703125, 1.4277191162109375, 1.480316162109375, 1.5329132080078125, 1.58551025390625, 1.6381072998046875, 1.690704345703125, 1.7433013916015625, 1.7958984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 3.0, 6.0, 11.0, 14.0, 15.0, 13.0, 22.0, 31.0, 26.0, 36.0, 40.0, 39.0, 48.0, 39.0, 55.0, 41.0, 59.0, 45.0, 49.0, 54.0, 48.0, 41.0, 35.0, 36.0, 26.0, 25.0, 24.0, 16.0, 17.0, 18.0, 12.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001214146614074707, -0.00011733081191778183, -0.00011324696242809296, -0.00010916311293840408, -0.00010507926344871521, -0.00010099541395902634, -9.691156446933746e-05, -9.282771497964859e-05, -8.874386548995972e-05, -8.466001600027084e-05, -8.057616651058197e-05, -7.64923170208931e-05, -7.240846753120422e-05, -6.832461804151535e-05, -6.424076855182648e-05, -6.0156919062137604e-05, -5.607306957244873e-05, -5.198922008275986e-05, -4.7905370593070984e-05, -4.382152110338211e-05, -3.973767161369324e-05, -3.5653822124004364e-05, -3.156997263431549e-05, -2.7486123144626617e-05, -2.3402273654937744e-05, -1.931842416524887e-05, -1.5234574675559998e-05, -1.1150725185871124e-05, -7.066875696182251e-06, -2.9830262064933777e-06, 1.1008232831954956e-06, 5.184672772884369e-06, 9.268522262573242e-06, 1.3352371752262115e-05, 1.743622124195099e-05, 2.1520070731639862e-05, 2.5603920221328735e-05, 2.968776971101761e-05, 3.377161920070648e-05, 3.7855468690395355e-05, 4.193931818008423e-05, 4.60231676697731e-05, 5.0107017159461975e-05, 5.419086664915085e-05, 5.827471613883972e-05, 6.23585656285286e-05, 6.644241511821747e-05, 7.052626460790634e-05, 7.461011409759521e-05, 7.869396358728409e-05, 8.277781307697296e-05, 8.686166256666183e-05, 9.094551205635071e-05, 9.502936154603958e-05, 9.911321103572845e-05, 0.00010319706052541733, 0.0001072809100151062, 0.00011136475950479507, 0.00011544860899448395, 0.00011953245848417282, 0.0001236163079738617, 0.00012770015746355057, 0.00013178400695323944, 0.00013586785644292831, 0.0001399517059326172]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 14.0, 22.0, 42.0, 46.0, 97.0, 139.0, 205.0, 343.0, 547.0, 880.0, 1436.0, 2382.0, 4010.0, 6724.0, 10976.0, 18127.0, 30230.0, 49581.0, 76893.0, 113280.0, 148222.0, 160438.0, 140719.0, 103589.0, 69046.0, 43475.0, 26562.0, 16209.0, 9600.0, 5827.0, 3471.0, 2056.0, 1290.0, 749.0, 459.0, 303.0, 203.0, 134.0, 83.0, 40.0, 44.0, 15.0, 12.0, 13.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.3618621826171875, -1.318450927734375, -1.2750396728515625, -1.23162841796875, -1.1882171630859375, -1.144805908203125, -1.1013946533203125, -1.0579833984375, -1.0145721435546875, -0.971160888671875, -0.9277496337890625, -0.88433837890625, -0.8409271240234375, -0.797515869140625, -0.7541046142578125, -0.710693359375, -0.6672821044921875, -0.623870849609375, -0.5804595947265625, -0.53704833984375, -0.4936370849609375, -0.450225830078125, -0.4068145751953125, -0.3634033203125, -0.3199920654296875, -0.276580810546875, -0.2331695556640625, -0.18975830078125, -0.1463470458984375, -0.102935791015625, -0.0595245361328125, -0.01611328125, 0.0272979736328125, 0.070709228515625, 0.1141204833984375, 0.15753173828125, 0.2009429931640625, 0.244354248046875, 0.2877655029296875, 0.3311767578125, 0.3745880126953125, 0.417999267578125, 0.4614105224609375, 0.50482177734375, 0.5482330322265625, 0.591644287109375, 0.6350555419921875, 0.678466796875, 0.7218780517578125, 0.765289306640625, 0.8087005615234375, 0.85211181640625, 0.8955230712890625, 0.938934326171875, 0.9823455810546875, 1.0257568359375, 1.0691680908203125, 1.112579345703125, 1.1559906005859375, 1.19940185546875, 1.2428131103515625, 1.286224365234375, 1.3296356201171875, 1.373046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 9.0, 9.0, 5.0, 16.0, 13.0, 17.0, 22.0, 28.0, 23.0, 41.0, 40.0, 33.0, 41.0, 52.0, 41.0, 43.0, 56.0, 47.0, 54.0, 53.0, 47.0, 47.0, 37.0, 34.0, 35.0, 34.0, 22.0, 17.0, 18.0, 9.0, 16.0, 10.0, 9.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.359283447265625, -0.34600830078125, -0.332733154296875, -0.3194580078125, -0.306182861328125, -0.29290771484375, -0.279632568359375, -0.266357421875, -0.253082275390625, -0.23980712890625, -0.226531982421875, -0.2132568359375, -0.199981689453125, -0.18670654296875, -0.173431396484375, -0.16015625, -0.146881103515625, -0.13360595703125, -0.120330810546875, -0.1070556640625, -0.093780517578125, -0.08050537109375, -0.067230224609375, -0.053955078125, -0.040679931640625, -0.02740478515625, -0.014129638671875, -0.0008544921875, 0.012420654296875, 0.02569580078125, 0.038970947265625, 0.05224609375, 0.065521240234375, 0.07879638671875, 0.092071533203125, 0.1053466796875, 0.118621826171875, 0.13189697265625, 0.145172119140625, 0.158447265625, 0.171722412109375, 0.18499755859375, 0.198272705078125, 0.2115478515625, 0.224822998046875, 0.23809814453125, 0.251373291015625, 0.2646484375, 0.277923583984375, 0.29119873046875, 0.304473876953125, 0.3177490234375, 0.331024169921875, 0.34429931640625, 0.357574462890625, 0.370849609375, 0.384124755859375, 0.39739990234375, 0.410675048828125, 0.4239501953125, 0.437225341796875, 0.45050048828125, 0.463775634765625, 0.47705078125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 4.0, 14.0, 11.0, 9.0, 15.0, 18.0, 13.0, 17.0, 31.0, 27.0, 41.0, 43.0, 42.0, 55.0, 63.0, 61.0, 68.0, 61.0, 58.0, 45.0, 61.0, 31.0, 35.0, 25.0, 29.0, 32.0, 27.0, 16.0, 10.0, 7.0, 4.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.737412691116333, -3.605987548828125, -3.474562406539917, -3.343137264251709, -3.211712121963501, -3.080286979675293, -2.948861837387085, -2.817436695098877, -2.686011552810669, -2.554586410522461, -2.423161268234253, -2.291736125946045, -2.160310983657837, -2.028885841369629, -1.897460699081421, -1.766035556793213, -1.6346104145050049, -1.5031852722167969, -1.3717601299285889, -1.2403349876403809, -1.1089098453521729, -0.9774847030639648, -0.8460595607757568, -0.7146344184875488, -0.5832092761993408, -0.4517841339111328, -0.3203589916229248, -0.1889338493347168, -0.05750870704650879, 0.07391643524169922, 0.20534157752990723, 0.33676671981811523, 0.46819162368774414, 0.5996167659759521, 0.7310419082641602, 0.8624670505523682, 0.9938921928405762, 1.1253173351287842, 1.2567424774169922, 1.3881676197052002, 1.5195927619934082, 1.6510179042816162, 1.7824430465698242, 1.9138681888580322, 2.0452933311462402, 2.1767184734344482, 2.3081436157226562, 2.4395687580108643, 2.5709939002990723, 2.7024190425872803, 2.8338441848754883, 2.9652693271636963, 3.0966944694519043, 3.2281196117401123, 3.3595447540283203, 3.4909698963165283, 3.6223950386047363, 3.7538201808929443, 3.8852453231811523, 4.016670227050781, 4.148095607757568, 4.2795209884643555, 4.410945892333984, 4.542370796203613, 4.6737961769104]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 9.0, 9.0, 7.0, 9.0, 9.0, 14.0, 12.0, 24.0, 22.0, 30.0, 31.0, 25.0, 35.0, 35.0, 35.0, 40.0, 36.0, 33.0, 30.0, 39.0, 32.0, 44.0, 47.0, 49.0, 44.0, 37.0, 25.0, 27.0, 27.0, 19.0, 27.0, 15.0, 13.0, 17.0, 20.0, 11.0, 14.0, 6.0, 7.0, 4.0, 9.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0968737602233887, -2.024630546569824, -1.9523870944976807, -1.8801438808441162, -1.8079005479812622, -1.7356572151184082, -1.6634140014648438, -1.5911706686019897, -1.5189273357391357, -1.4466840028762817, -1.3744406700134277, -1.3021974563598633, -1.2299541234970093, -1.1577107906341553, -1.0854675769805908, -1.0132242441177368, -0.9409809112548828, -0.8687375783920288, -0.7964943051338196, -0.7242510318756104, -0.6520076990127563, -0.5797643661499023, -0.5075210928916931, -0.4352778196334839, -0.3630344867706299, -0.29079118371009827, -0.21854788064956665, -0.14630457758903503, -0.07406127452850342, -0.0018179714679718018, 0.07042533159255981, 0.14266860485076904, 0.21491169929504395, 0.28715500235557556, 0.3593983054161072, 0.4316416084766388, 0.5038849115371704, 0.5761282444000244, 0.6483715176582336, 0.7206147909164429, 0.7928581237792969, 0.8651014566421509, 0.9373447299003601, 1.0095880031585693, 1.0818313360214233, 1.1540746688842773, 1.2263178825378418, 1.2985612154006958, 1.3708045482635498, 1.4430478811264038, 1.5152912139892578, 1.5875344276428223, 1.6597777605056763, 1.7320210933685303, 1.8042643070220947, 1.8765076398849487, 1.9487509727478027, 2.020994186401367, 2.0932376384735107, 2.165480852127075, 2.2377243041992188, 2.309967517852783, 2.3822107315063477, 2.454453945159912, 2.5266973972320557]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 15.0, 15.0, 31.0, 53.0, 50.0, 84.0, 107.0, 164.0, 243.0, 360.0, 595.0, 951.0, 1362.0, 2329.0, 3856.0, 6858.0, 12539.0, 23711.0, 47416.0, 100038.0, 229439.0, 552685.0, 1117856.0, 1118593.0, 544901.0, 225033.0, 100026.0, 47521.0, 24514.0, 13433.0, 7620.0, 4376.0, 2776.0, 1663.0, 1092.0, 682.0, 473.0, 284.0, 187.0, 130.0, 73.0, 49.0, 28.0, 19.0, 13.0, 10.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40234375, -4.26031494140625, -4.1182861328125, -3.97625732421875, -3.834228515625, -3.69219970703125, -3.5501708984375, -3.40814208984375, -3.26611328125, -3.12408447265625, -2.9820556640625, -2.84002685546875, -2.697998046875, -2.55596923828125, -2.4139404296875, -2.27191162109375, -2.1298828125, -1.98785400390625, -1.8458251953125, -1.70379638671875, -1.561767578125, -1.41973876953125, -1.2777099609375, -1.13568115234375, -0.99365234375, -0.85162353515625, -0.7095947265625, -0.56756591796875, -0.425537109375, -0.28350830078125, -0.1414794921875, 0.00054931640625, 0.142578125, 0.28460693359375, 0.4266357421875, 0.56866455078125, 0.710693359375, 0.85272216796875, 0.9947509765625, 1.13677978515625, 1.27880859375, 1.42083740234375, 1.5628662109375, 1.70489501953125, 1.846923828125, 1.98895263671875, 2.1309814453125, 2.27301025390625, 2.4150390625, 2.55706787109375, 2.6990966796875, 2.84112548828125, 2.983154296875, 3.12518310546875, 3.2672119140625, 3.40924072265625, 3.55126953125, 3.69329833984375, 3.8353271484375, 3.97735595703125, 4.119384765625, 4.26141357421875, 4.4034423828125, 4.54547119140625, 4.6875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 11.0, 5.0, 7.0, 17.0, 16.0, 10.0, 26.0, 18.0, 17.0, 37.0, 34.0, 29.0, 45.0, 42.0, 34.0, 38.0, 45.0, 40.0, 46.0, 40.0, 46.0, 54.0, 44.0, 22.0, 29.0, 28.0, 27.0, 24.0, 24.0, 25.0, 27.0, 13.0, 16.0, 14.0, 11.0, 10.0, 4.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7919921875, -1.734954833984375, -1.67791748046875, -1.620880126953125, -1.5638427734375, -1.506805419921875, -1.44976806640625, -1.392730712890625, -1.335693359375, -1.278656005859375, -1.22161865234375, -1.164581298828125, -1.1075439453125, -1.050506591796875, -0.99346923828125, -0.936431884765625, -0.87939453125, -0.822357177734375, -0.76531982421875, -0.708282470703125, -0.6512451171875, -0.594207763671875, -0.53717041015625, -0.480133056640625, -0.423095703125, -0.366058349609375, -0.30902099609375, -0.251983642578125, -0.1949462890625, -0.137908935546875, -0.08087158203125, -0.023834228515625, 0.033203125, 0.090240478515625, 0.14727783203125, 0.204315185546875, 0.2613525390625, 0.318389892578125, 0.37542724609375, 0.432464599609375, 0.489501953125, 0.546539306640625, 0.60357666015625, 0.660614013671875, 0.7176513671875, 0.774688720703125, 0.83172607421875, 0.888763427734375, 0.94580078125, 1.002838134765625, 1.05987548828125, 1.116912841796875, 1.1739501953125, 1.230987548828125, 1.28802490234375, 1.345062255859375, 1.402099609375, 1.459136962890625, 1.51617431640625, 1.573211669921875, 1.6302490234375, 1.687286376953125, 1.74432373046875, 1.801361083984375, 1.8583984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 15.0, 20.0, 32.0, 57.0, 74.0, 131.0, 211.0, 321.0, 518.0, 853.0, 1404.0, 2213.0, 3707.0, 6283.0, 10778.0, 19348.0, 36010.0, 67104.0, 131689.0, 264487.0, 532742.0, 931319.0, 981830.0, 592995.0, 297473.0, 147644.0, 74988.0, 39427.0, 21663.0, 11878.0, 6744.0, 3924.0, 2364.0, 1483.0, 884.0, 566.0, 363.0, 256.0, 134.0, 88.0, 70.0, 49.0, 51.0, 21.0, 15.0, 16.0, 5.0, 7.0, 11.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.9658203125, -3.833984375, -3.7021484375, -3.5703125, -3.4384765625, -3.306640625, -3.1748046875, -3.04296875, -2.9111328125, -2.779296875, -2.6474609375, -2.515625, -2.3837890625, -2.251953125, -2.1201171875, -1.98828125, -1.8564453125, -1.724609375, -1.5927734375, -1.4609375, -1.3291015625, -1.197265625, -1.0654296875, -0.93359375, -0.8017578125, -0.669921875, -0.5380859375, -0.40625, -0.2744140625, -0.142578125, -0.0107421875, 0.12109375, 0.2529296875, 0.384765625, 0.5166015625, 0.6484375, 0.7802734375, 0.912109375, 1.0439453125, 1.17578125, 1.3076171875, 1.439453125, 1.5712890625, 1.703125, 1.8349609375, 1.966796875, 2.0986328125, 2.23046875, 2.3623046875, 2.494140625, 2.6259765625, 2.7578125, 2.8896484375, 3.021484375, 3.1533203125, 3.28515625, 3.4169921875, 3.548828125, 3.6806640625, 3.8125, 3.9443359375, 4.076171875, 4.2080078125, 4.33984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 8.0, 13.0, 6.0, 8.0, 21.0, 19.0, 11.0, 22.0, 35.0, 40.0, 39.0, 56.0, 63.0, 78.0, 86.0, 103.0, 143.0, 139.0, 176.0, 192.0, 193.0, 199.0, 215.0, 227.0, 224.0, 231.0, 199.0, 169.0, 151.0, 146.0, 146.0, 113.0, 108.0, 98.0, 80.0, 48.0, 45.0, 44.0, 40.0, 27.0, 26.0, 16.0, 17.0, 8.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.0107421875, -0.9813995361328125, -0.952056884765625, -0.9227142333984375, -0.89337158203125, -0.8640289306640625, -0.834686279296875, -0.8053436279296875, -0.7760009765625, -0.7466583251953125, -0.717315673828125, -0.6879730224609375, -0.65863037109375, -0.6292877197265625, -0.599945068359375, -0.5706024169921875, -0.541259765625, -0.5119171142578125, -0.482574462890625, -0.4532318115234375, -0.42388916015625, -0.3945465087890625, -0.365203857421875, -0.3358612060546875, -0.3065185546875, -0.2771759033203125, -0.247833251953125, -0.2184906005859375, -0.18914794921875, -0.1598052978515625, -0.130462646484375, -0.1011199951171875, -0.07177734375, -0.0424346923828125, -0.013092041015625, 0.0162506103515625, 0.04559326171875, 0.0749359130859375, 0.104278564453125, 0.1336212158203125, 0.1629638671875, 0.1923065185546875, 0.221649169921875, 0.2509918212890625, 0.28033447265625, 0.3096771240234375, 0.339019775390625, 0.3683624267578125, 0.397705078125, 0.4270477294921875, 0.456390380859375, 0.4857330322265625, 0.51507568359375, 0.5444183349609375, 0.573760986328125, 0.6031036376953125, 0.6324462890625, 0.6617889404296875, 0.691131591796875, 0.7204742431640625, 0.74981689453125, 0.7791595458984375, 0.808502197265625, 0.8378448486328125, 0.8671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 2.0, 10.0, 8.0, 12.0, 11.0, 16.0, 22.0, 34.0, 42.0, 42.0, 38.0, 56.0, 70.0, 49.0, 75.0, 72.0, 64.0, 66.0, 53.0, 52.0, 38.0, 35.0, 21.0, 25.0, 21.0, 18.0, 9.0, 8.0, 3.0, 11.0, 2.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.347010850906372, -3.201976776123047, -3.0569427013397217, -2.9119086265563965, -2.766874313354492, -2.621840476989746, -2.476806163787842, -2.3317720890045166, -2.1867380142211914, -2.041703939437866, -1.896669864654541, -1.7516356706619263, -1.606601595878601, -1.4615675210952759, -1.3165333271026611, -1.171499252319336, -1.0264651775360107, -0.8814311027526855, -0.7363969683647156, -0.5913628339767456, -0.4463287591934204, -0.3012946844100952, -0.15626055002212524, -0.011226415634155273, 0.13380765914916992, 0.2788417637348175, 0.4238758683204651, 0.5689100027084351, 0.7139440774917603, 0.8589781522750854, 1.0040123462677002, 1.1490464210510254, 1.2940807342529297, 1.4391148090362549, 1.58414888381958, 1.7291830778121948, 1.87421715259552, 2.0192513465881348, 2.16428542137146, 2.309319496154785, 2.4543535709381104, 2.5993876457214355, 2.7444217205047607, 2.889455795288086, 3.0344901084899902, 3.1795239448547363, 3.3245582580566406, 3.469592332839966, 3.614626407623291, 3.759660482406616, 3.9046945571899414, 4.049728870391846, 4.194762706756592, 4.339797019958496, 4.484830856323242, 4.6298651695251465, 4.774899482727051, 4.919933795928955, 5.064967632293701, 5.2100019454956055, 5.355035781860352, 5.500070095062256, 5.645103931427002, 5.790138244628906, 5.935172080993652]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 14.0, 19.0, 16.0, 16.0, 29.0, 30.0, 28.0, 37.0, 23.0, 40.0, 38.0, 41.0, 53.0, 33.0, 38.0, 45.0, 51.0, 46.0, 43.0, 46.0, 35.0, 33.0, 28.0, 29.0, 25.0, 29.0, 25.0, 17.0, 11.0, 16.0, 9.0, 6.0, 6.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9165393114089966, -1.8452924489974976, -1.7740455865859985, -1.7027987241744995, -1.6315518617630005, -1.5603049993515015, -1.4890581369400024, -1.4178112745285034, -1.3465644121170044, -1.2753175497055054, -1.2040706872940063, -1.1328238248825073, -1.0615769624710083, -0.9903301000595093, -0.9190832376480103, -0.8478363752365112, -0.7765895128250122, -0.7053426504135132, -0.6340957880020142, -0.5628489255905151, -0.4916020631790161, -0.4203552007675171, -0.34910833835601807, -0.27786147594451904, -0.20661461353302002, -0.135367751121521, -0.06412088871002197, 0.007125973701477051, 0.07837283611297607, 0.1496196985244751, 0.22086656093597412, 0.29211342334747314, 0.3633601665496826, 0.43460702896118164, 0.5058538913726807, 0.5771007537841797, 0.6483476161956787, 0.7195944786071777, 0.7908413410186768, 0.8620882034301758, 0.9333350658416748, 1.0045819282531738, 1.0758287906646729, 1.1470756530761719, 1.218322515487671, 1.28956937789917, 1.360816240310669, 1.432063102722168, 1.503309965133667, 1.574556827545166, 1.645803689956665, 1.717050552368164, 1.788297414779663, 1.859544277191162, 1.9307911396026611, 2.00203800201416, 2.073284864425659, 2.144531726837158, 2.2157785892486572, 2.2870254516601562, 2.3582723140716553, 2.4295191764831543, 2.5007660388946533, 2.5720129013061523, 2.6432597637176514]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 14.0, 16.0, 20.0, 28.0, 39.0, 59.0, 66.0, 79.0, 129.0, 180.0, 214.0, 296.0, 422.0, 618.0, 885.0, 1406.0, 2312.0, 3879.0, 6637.0, 11992.0, 23685.0, 47682.0, 98091.0, 186254.0, 254527.0, 195861.0, 104975.0, 51522.0, 25398.0, 13129.0, 6948.0, 4026.0, 2386.0, 1501.0, 923.0, 644.0, 457.0, 336.0, 221.0, 185.0, 120.0, 114.0, 56.0, 60.0, 40.0, 29.0, 31.0, 21.0, 9.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.5419921875, -0.5258369445800781, -0.5096817016601562, -0.4935264587402344, -0.4773712158203125, -0.4612159729003906, -0.44506072998046875, -0.4289054870605469, -0.412750244140625, -0.3965950012207031, -0.38043975830078125, -0.3642845153808594, -0.3481292724609375, -0.3319740295410156, -0.31581878662109375, -0.2996635437011719, -0.28350830078125, -0.2673530578613281, -0.25119781494140625, -0.23504257202148438, -0.2188873291015625, -0.20273208618164062, -0.18657684326171875, -0.17042160034179688, -0.154266357421875, -0.13811111450195312, -0.12195587158203125, -0.10580062866210938, -0.0896453857421875, -0.07349014282226562, -0.05733489990234375, -0.041179656982421875, -0.0250244140625, -0.008869171142578125, 0.00728607177734375, 0.023441314697265625, 0.0395965576171875, 0.055751800537109375, 0.07190704345703125, 0.08806228637695312, 0.104217529296875, 0.12037277221679688, 0.13652801513671875, 0.15268325805664062, 0.1688385009765625, 0.18499374389648438, 0.20114898681640625, 0.21730422973632812, 0.23345947265625, 0.24961471557617188, 0.26576995849609375, 0.2819252014160156, 0.2980804443359375, 0.3142356872558594, 0.33039093017578125, 0.3465461730957031, 0.362701416015625, 0.3788566589355469, 0.39501190185546875, 0.4111671447753906, 0.4273223876953125, 0.4434776306152344, 0.45963287353515625, 0.4757881164550781, 0.491943359375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 13.0, 15.0, 18.0, 10.0, 21.0, 23.0, 27.0, 40.0, 34.0, 35.0, 35.0, 44.0, 42.0, 46.0, 45.0, 52.0, 43.0, 46.0, 42.0, 37.0, 37.0, 29.0, 38.0, 38.0, 25.0, 21.0, 23.0, 21.0, 17.0, 15.0, 10.0, 7.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.348663330078125, -2.26568603515625, -2.182708740234375, -2.0997314453125, -2.016754150390625, -1.93377685546875, -1.850799560546875, -1.767822265625, -1.684844970703125, -1.60186767578125, -1.518890380859375, -1.4359130859375, -1.352935791015625, -1.26995849609375, -1.186981201171875, -1.10400390625, -1.021026611328125, -0.93804931640625, -0.855072021484375, -0.7720947265625, -0.689117431640625, -0.60614013671875, -0.523162841796875, -0.440185546875, -0.357208251953125, -0.27423095703125, -0.191253662109375, -0.1082763671875, -0.025299072265625, 0.05767822265625, 0.140655517578125, 0.2236328125, 0.306610107421875, 0.38958740234375, 0.472564697265625, 0.5555419921875, 0.638519287109375, 0.72149658203125, 0.804473876953125, 0.887451171875, 0.970428466796875, 1.05340576171875, 1.136383056640625, 1.2193603515625, 1.302337646484375, 1.38531494140625, 1.468292236328125, 1.55126953125, 1.634246826171875, 1.71722412109375, 1.800201416015625, 1.8831787109375, 1.966156005859375, 2.04913330078125, 2.132110595703125, 2.215087890625, 2.298065185546875, 2.38104248046875, 2.464019775390625, 2.5469970703125, 2.629974365234375, 2.71295166015625, 2.795928955078125, 2.87890625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 12.0, 16.0, 24.0, 22.0, 29.0, 62.0, 65.0, 116.0, 172.0, 218.0, 388.0, 608.0, 1143.0, 2225.0, 4933.0, 13626.0, 52366.0, 905642.0, 44735.0, 12511.0, 4720.0, 2129.0, 1059.0, 606.0, 347.0, 247.0, 141.0, 113.0, 64.0, 50.0, 43.0, 23.0, 22.0, 7.0, 15.0, 8.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0], "bins": [-1.7724609375, -1.719482421875, -1.66650390625, -1.613525390625, -1.560546875, -1.507568359375, -1.45458984375, -1.401611328125, -1.3486328125, -1.295654296875, -1.24267578125, -1.189697265625, -1.13671875, -1.083740234375, -1.03076171875, -0.977783203125, -0.9248046875, -0.871826171875, -0.81884765625, -0.765869140625, -0.712890625, -0.659912109375, -0.60693359375, -0.553955078125, -0.5009765625, -0.447998046875, -0.39501953125, -0.342041015625, -0.2890625, -0.236083984375, -0.18310546875, -0.130126953125, -0.0771484375, -0.024169921875, 0.02880859375, 0.081787109375, 0.134765625, 0.187744140625, 0.24072265625, 0.293701171875, 0.3466796875, 0.399658203125, 0.45263671875, 0.505615234375, 0.55859375, 0.611572265625, 0.66455078125, 0.717529296875, 0.7705078125, 0.823486328125, 0.87646484375, 0.929443359375, 0.982421875, 1.035400390625, 1.08837890625, 1.141357421875, 1.1943359375, 1.247314453125, 1.30029296875, 1.353271484375, 1.40625, 1.459228515625, 1.51220703125, 1.565185546875, 1.6181640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 8.0, 2.0, 6.0, 15.0, 10.0, 12.0, 14.0, 18.0, 27.0, 18.0, 31.0, 18.0, 35.0, 26.0, 42.0, 30.0, 36.0, 43.0, 49.0, 49.0, 36.0, 38.0, 41.0, 33.0, 47.0, 27.0, 43.0, 32.0, 22.0, 19.0, 29.0, 24.0, 20.0, 19.0, 14.0, 15.0, 8.0, 9.0, 15.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.599609375, -1.5498504638671875, -1.500091552734375, -1.4503326416015625, -1.40057373046875, -1.3508148193359375, -1.301055908203125, -1.2512969970703125, -1.2015380859375, -1.1517791748046875, -1.102020263671875, -1.0522613525390625, -1.00250244140625, -0.9527435302734375, -0.902984619140625, -0.8532257080078125, -0.803466796875, -0.7537078857421875, -0.703948974609375, -0.6541900634765625, -0.60443115234375, -0.5546722412109375, -0.504913330078125, -0.4551544189453125, -0.4053955078125, -0.3556365966796875, -0.305877685546875, -0.2561187744140625, -0.20635986328125, -0.1566009521484375, -0.106842041015625, -0.0570831298828125, -0.00732421875, 0.0424346923828125, 0.092193603515625, 0.1419525146484375, 0.19171142578125, 0.2414703369140625, 0.291229248046875, 0.3409881591796875, 0.3907470703125, 0.4405059814453125, 0.490264892578125, 0.5400238037109375, 0.58978271484375, 0.6395416259765625, 0.689300537109375, 0.7390594482421875, 0.788818359375, 0.8385772705078125, 0.888336181640625, 0.9380950927734375, 0.98785400390625, 1.0376129150390625, 1.087371826171875, 1.1371307373046875, 1.1868896484375, 1.2366485595703125, 1.286407470703125, 1.3361663818359375, 1.38592529296875, 1.4356842041015625, 1.485443115234375, 1.5352020263671875, 1.5849609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 13.0, 10.0, 17.0, 18.0, 25.0, 31.0, 41.0, 46.0, 58.0, 80.0, 108.0, 152.0, 179.0, 247.0, 354.0, 475.0, 742.0, 1176.0, 2197.0, 4414.0, 9417.0, 24542.0, 689032.0, 274530.0, 22142.0, 8808.0, 4041.0, 2069.0, 1163.0, 716.0, 464.0, 307.0, 211.0, 150.0, 99.0, 107.0, 95.0, 52.0, 35.0, 43.0, 22.0, 27.0, 16.0, 21.0, 14.0, 8.0, 12.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.4404296875, -0.4266471862792969, -0.41286468505859375, -0.3990821838378906, -0.3852996826171875, -0.3715171813964844, -0.35773468017578125, -0.3439521789550781, -0.330169677734375, -0.3163871765136719, -0.30260467529296875, -0.2888221740722656, -0.2750396728515625, -0.2612571716308594, -0.24747467041015625, -0.23369216918945312, -0.21990966796875, -0.20612716674804688, -0.19234466552734375, -0.17856216430664062, -0.1647796630859375, -0.15099716186523438, -0.13721466064453125, -0.12343215942382812, -0.109649658203125, -0.09586715698242188, -0.08208465576171875, -0.06830215454101562, -0.0545196533203125, -0.040737152099609375, -0.02695465087890625, -0.013172149658203125, 0.0006103515625, 0.014392852783203125, 0.02817535400390625, 0.041957855224609375, 0.0557403564453125, 0.06952285766601562, 0.08330535888671875, 0.09708786010742188, 0.110870361328125, 0.12465286254882812, 0.13843536376953125, 0.15221786499023438, 0.1660003662109375, 0.17978286743164062, 0.19356536865234375, 0.20734786987304688, 0.22113037109375, 0.23491287231445312, 0.24869537353515625, 0.2624778747558594, 0.2762603759765625, 0.2900428771972656, 0.30382537841796875, 0.3176078796386719, 0.331390380859375, 0.3451728820800781, 0.35895538330078125, 0.3727378845214844, 0.3865203857421875, 0.4003028869628906, 0.41408538818359375, 0.4278678894042969, 0.441650390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 6.0, 15.0, 14.0, 18.0, 28.0, 22.0, 46.0, 38.0, 45.0, 54.0, 52.0, 73.0, 72.0, 53.0, 76.0, 70.0, 61.0, 39.0, 43.0, 43.0, 27.0, 21.0, 12.0, 14.0, 12.0, 8.0, 9.0, 6.0, 0.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0590763092041016e-05, -3.9091333746910095e-05, -3.7591904401779175e-05, -3.6092475056648254e-05, -3.4593045711517334e-05, -3.3093616366386414e-05, -3.159418702125549e-05, -3.0094757676124573e-05, -2.8595328330993652e-05, -2.7095898985862732e-05, -2.559646964073181e-05, -2.409704029560089e-05, -2.259761095046997e-05, -2.109818160533905e-05, -1.959875226020813e-05, -1.809932291507721e-05, -1.659989356994629e-05, -1.5100464224815369e-05, -1.3601034879684448e-05, -1.2101605534553528e-05, -1.0602176189422607e-05, -9.102746844291687e-06, -7.603317499160767e-06, -6.103888154029846e-06, -4.604458808898926e-06, -3.1050294637680054e-06, -1.605600118637085e-06, -1.0617077350616455e-07, 1.3932585716247559e-06, 2.8926879167556763e-06, 4.392117261886597e-06, 5.891546607017517e-06, 7.3909759521484375e-06, 8.890405297279358e-06, 1.0389834642410278e-05, 1.1889263987541199e-05, 1.3388693332672119e-05, 1.488812267780304e-05, 1.638755202293396e-05, 1.788698136806488e-05, 1.93864107131958e-05, 2.088584005832672e-05, 2.238526940345764e-05, 2.3884698748588562e-05, 2.5384128093719482e-05, 2.6883557438850403e-05, 2.8382986783981323e-05, 2.9882416129112244e-05, 3.1381845474243164e-05, 3.2881274819374084e-05, 3.4380704164505005e-05, 3.5880133509635925e-05, 3.7379562854766846e-05, 3.8878992199897766e-05, 4.0378421545028687e-05, 4.187785089015961e-05, 4.337728023529053e-05, 4.487670958042145e-05, 4.637613892555237e-05, 4.787556827068329e-05, 4.937499761581421e-05, 5.087442696094513e-05, 5.237385630607605e-05, 5.387328565120697e-05, 5.537271499633789e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 7.0, 10.0, 24.0, 29.0, 42.0, 61.0, 116.0, 178.0, 306.0, 530.0, 976.0, 1740.0, 3001.0, 5905.0, 11581.0, 24480.0, 56927.0, 144132.0, 315218.0, 277357.0, 117032.0, 47187.0, 20606.0, 9945.0, 4983.0, 2687.0, 1460.0, 807.0, 494.0, 263.0, 145.0, 98.0, 64.0, 43.0, 23.0, 19.0, 15.0, 12.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1649169921875, -0.15990257263183594, -0.15488815307617188, -0.1498737335205078, -0.14485931396484375, -0.1398448944091797, -0.13483047485351562, -0.12981605529785156, -0.1248016357421875, -0.11978721618652344, -0.11477279663085938, -0.10975837707519531, -0.10474395751953125, -0.09972953796386719, -0.09471511840820312, -0.08970069885253906, -0.084686279296875, -0.07967185974121094, -0.07465744018554688, -0.06964302062988281, -0.06462860107421875, -0.05961418151855469, -0.054599761962890625, -0.04958534240722656, -0.0445709228515625, -0.03955650329589844, -0.034542083740234375, -0.029527664184570312, -0.02451324462890625, -0.019498825073242188, -0.014484405517578125, -0.009469985961914062, -0.00445556640625, 0.0005588531494140625, 0.005573272705078125, 0.010587692260742188, 0.01560211181640625, 0.020616531372070312, 0.025630950927734375, 0.030645370483398438, 0.0356597900390625, 0.04067420959472656, 0.045688629150390625, 0.05070304870605469, 0.05571746826171875, 0.06073188781738281, 0.06574630737304688, 0.07076072692871094, 0.075775146484375, 0.08078956604003906, 0.08580398559570312, 0.09081840515136719, 0.09583282470703125, 0.10084724426269531, 0.10586166381835938, 0.11087608337402344, 0.1158905029296875, 0.12090492248535156, 0.12591934204101562, 0.1309337615966797, 0.13594818115234375, 0.1409626007080078, 0.14597702026367188, 0.15099143981933594, 0.156005859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 16.0, 7.0, 11.0, 19.0, 26.0, 22.0, 37.0, 38.0, 52.0, 50.0, 75.0, 74.0, 80.0, 82.0, 57.0, 72.0, 52.0, 44.0, 34.0, 29.0, 25.0, 13.0, 11.0, 10.0, 13.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037933349609375, -0.036604881286621094, -0.03527641296386719, -0.03394794464111328, -0.032619476318359375, -0.03129100799560547, -0.029962539672851562, -0.028634071350097656, -0.02730560302734375, -0.025977134704589844, -0.024648666381835938, -0.02332019805908203, -0.021991729736328125, -0.02066326141357422, -0.019334793090820312, -0.018006324768066406, -0.0166778564453125, -0.015349388122558594, -0.014020919799804688, -0.012692451477050781, -0.011363983154296875, -0.010035514831542969, -0.008707046508789062, -0.007378578186035156, -0.00605010986328125, -0.004721641540527344, -0.0033931732177734375, -0.0020647048950195312, -0.000736236572265625, 0.0005922317504882812, 0.0019207000732421875, 0.0032491683959960938, 0.00457763671875, 0.005906105041503906, 0.0072345733642578125, 0.008563041687011719, 0.009891510009765625, 0.011219978332519531, 0.012548446655273438, 0.013876914978027344, 0.01520538330078125, 0.016533851623535156, 0.017862319946289062, 0.01919078826904297, 0.020519256591796875, 0.02184772491455078, 0.023176193237304688, 0.024504661560058594, 0.0258331298828125, 0.027161598205566406, 0.028490066528320312, 0.02981853485107422, 0.031147003173828125, 0.03247547149658203, 0.03380393981933594, 0.035132408142089844, 0.03646087646484375, 0.037789344787597656, 0.03911781311035156, 0.04044628143310547, 0.041774749755859375, 0.04310321807861328, 0.04443168640136719, 0.045760154724121094, 0.047088623046875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 7.0, 9.0, 8.0, 12.0, 14.0, 20.0, 26.0, 34.0, 44.0, 42.0, 44.0, 54.0, 72.0, 49.0, 91.0, 57.0, 68.0, 59.0, 55.0, 44.0, 36.0, 28.0, 24.0, 26.0, 15.0, 15.0, 10.0, 5.0, 11.0, 3.0, 2.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2583179473876953, -3.1144847869873047, -2.970651626586914, -2.8268184661865234, -2.682985544204712, -2.5391523838043213, -2.3953192234039307, -2.251486301422119, -2.1076531410217285, -1.963819980621338, -1.8199869394302368, -1.6761537790298462, -1.5323207378387451, -1.3884875774383545, -1.2446544170379639, -1.1008213758468628, -0.9569880962371826, -0.8131549954414368, -0.6693218946456909, -0.5254887342453003, -0.38165563344955444, -0.2378225326538086, -0.09398937225341797, 0.049843668937683105, 0.19367682933807373, 0.3375099301338196, 0.4813430607318878, 0.625176191329956, 0.7690092921257019, 0.9128423929214478, 1.0566755533218384, 1.2005085945129395, 1.34434175491333, 1.4881749153137207, 1.6320079565048218, 1.7758411169052124, 1.9196741580963135, 2.063507318496704, 2.2073404788970947, 2.3511734008789062, 2.495006561279297, 2.6388397216796875, 2.782672882080078, 2.9265060424804688, 3.0703389644622803, 3.214172124862671, 3.3580052852630615, 3.501838207244873, 3.6456716060638428, 3.7895047664642334, 3.933337926864624, 4.0771708488464355, 4.221004009246826, 4.364837169647217, 4.508670330047607, 4.652503490447998, 4.796336650848389, 4.940169811248779, 5.08400297164917, 5.2278361320495605, 5.371669292449951, 5.515501976013184, 5.659335136413574, 5.803168296813965, 5.9470014572143555]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 0.0, 5.0, 3.0, 3.0, 6.0, 9.0, 12.0, 17.0, 19.0, 14.0, 30.0, 33.0, 26.0, 37.0, 20.0, 45.0, 44.0, 36.0, 48.0, 37.0, 34.0, 53.0, 43.0, 44.0, 50.0, 45.0, 31.0, 33.0, 31.0, 29.0, 25.0, 26.0, 25.0, 17.0, 12.0, 15.0, 9.0, 6.0, 7.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8723468780517578, -1.8014521598815918, -1.7305575609207153, -1.6596628427505493, -1.5887682437896729, -1.5178735256195068, -1.4469788074493408, -1.3760842084884644, -1.305189609527588, -1.2342948913574219, -1.1634002923965454, -1.0925055742263794, -1.021610975265503, -0.9507162570953369, -0.8798215985298157, -0.8089269399642944, -0.7380322217941284, -0.6671375632286072, -0.5962429046630859, -0.5253481864929199, -0.45445355772972107, -0.38355889916419983, -0.3126642107963562, -0.24176955223083496, -0.17087489366531372, -0.09998022764921188, -0.029085561633110046, 0.04180911183357239, 0.11270377039909363, 0.18359842896461487, 0.2544931173324585, 0.32538777589797974, 0.396282434463501, 0.4671770930290222, 0.5380717515945435, 0.6089664697647095, 0.6798610687255859, 0.750755786895752, 0.8216504454612732, 0.8925451040267944, 0.9634397625923157, 1.034334421157837, 1.105229139328003, 1.1761237382888794, 1.2470184564590454, 1.3179130554199219, 1.388807773590088, 1.459702491760254, 1.5305970907211304, 1.6014918088912964, 1.6723864078521729, 1.7432811260223389, 1.8141757249832153, 1.8850704431533813, 1.9559650421142578, 2.026859760284424, 2.09775447845459, 2.168649196624756, 2.239543914794922, 2.310438394546509, 2.381333112716675, 2.452227830886841, 2.523122549057007, 2.5940170288085938, 2.6649117469787598]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 9.0, 11.0, 18.0, 29.0, 46.0, 80.0, 135.0, 152.0, 243.0, 368.0, 544.0, 781.0, 1198.0, 1843.0, 2801.0, 4347.0, 6658.0, 10642.0, 16859.0, 26331.0, 40831.0, 62197.0, 89107.0, 119286.0, 139780.0, 139628.0, 119168.0, 89375.0, 62131.0, 40817.0, 26163.0, 16846.0, 10651.0, 6846.0, 4386.0, 2808.0, 1831.0, 1201.0, 762.0, 545.0, 384.0, 236.0, 146.0, 107.0, 73.0, 53.0, 28.0, 25.0, 20.0, 10.0, 9.0, 0.0, 8.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.267578125, -2.19671630859375, -2.1258544921875, -2.05499267578125, -1.984130859375, -1.91326904296875, -1.8424072265625, -1.77154541015625, -1.70068359375, -1.62982177734375, -1.5589599609375, -1.48809814453125, -1.417236328125, -1.34637451171875, -1.2755126953125, -1.20465087890625, -1.1337890625, -1.06292724609375, -0.9920654296875, -0.92120361328125, -0.850341796875, -0.77947998046875, -0.7086181640625, -0.63775634765625, -0.56689453125, -0.49603271484375, -0.4251708984375, -0.35430908203125, -0.283447265625, -0.21258544921875, -0.1417236328125, -0.07086181640625, 0.0, 0.07086181640625, 0.1417236328125, 0.21258544921875, 0.283447265625, 0.35430908203125, 0.4251708984375, 0.49603271484375, 0.56689453125, 0.63775634765625, 0.7086181640625, 0.77947998046875, 0.850341796875, 0.92120361328125, 0.9920654296875, 1.06292724609375, 1.1337890625, 1.20465087890625, 1.2755126953125, 1.34637451171875, 1.417236328125, 1.48809814453125, 1.5589599609375, 1.62982177734375, 1.70068359375, 1.77154541015625, 1.8424072265625, 1.91326904296875, 1.984130859375, 2.05499267578125, 2.1258544921875, 2.19671630859375, 2.267578125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 14.0, 18.0, 14.0, 25.0, 32.0, 28.0, 37.0, 39.0, 41.0, 28.0, 43.0, 38.0, 44.0, 41.0, 36.0, 43.0, 50.0, 42.0, 41.0, 43.0, 35.0, 28.0, 38.0, 22.0, 13.0, 32.0, 20.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.638671875, -2.5579833984375, -2.477294921875, -2.3966064453125, -2.31591796875, -2.2352294921875, -2.154541015625, -2.0738525390625, -1.9931640625, -1.9124755859375, -1.831787109375, -1.7510986328125, -1.67041015625, -1.5897216796875, -1.509033203125, -1.4283447265625, -1.34765625, -1.2669677734375, -1.186279296875, -1.1055908203125, -1.02490234375, -0.9442138671875, -0.863525390625, -0.7828369140625, -0.7021484375, -0.6214599609375, -0.540771484375, -0.4600830078125, -0.37939453125, -0.2987060546875, -0.218017578125, -0.1373291015625, -0.056640625, 0.0240478515625, 0.104736328125, 0.1854248046875, 0.26611328125, 0.3468017578125, 0.427490234375, 0.5081787109375, 0.5888671875, 0.6695556640625, 0.750244140625, 0.8309326171875, 0.91162109375, 0.9923095703125, 1.072998046875, 1.1536865234375, 1.234375, 1.3150634765625, 1.395751953125, 1.4764404296875, 1.55712890625, 1.6378173828125, 1.718505859375, 1.7991943359375, 1.8798828125, 1.9605712890625, 2.041259765625, 2.1219482421875, 2.20263671875, 2.2833251953125, 2.364013671875, 2.4447021484375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 9.0, 7.0, 7.0, 10.0, 21.0, 31.0, 44.0, 49.0, 70.0, 112.0, 204.0, 315.0, 462.0, 722.0, 1159.0, 1797.0, 2922.0, 4496.0, 7597.0, 12275.0, 20201.0, 33183.0, 52551.0, 78899.0, 110832.0, 138860.0, 149269.0, 133426.0, 103732.0, 71641.0, 46834.0, 29523.0, 18213.0, 11049.0, 6710.0, 4189.0, 2593.0, 1588.0, 1065.0, 662.0, 422.0, 270.0, 181.0, 124.0, 72.0, 51.0, 46.0, 29.0, 13.0, 12.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.138671875, -2.065887451171875, -1.99310302734375, -1.920318603515625, -1.8475341796875, -1.774749755859375, -1.70196533203125, -1.629180908203125, -1.556396484375, -1.483612060546875, -1.41082763671875, -1.338043212890625, -1.2652587890625, -1.192474365234375, -1.11968994140625, -1.046905517578125, -0.97412109375, -0.901336669921875, -0.82855224609375, -0.755767822265625, -0.6829833984375, -0.610198974609375, -0.53741455078125, -0.464630126953125, -0.391845703125, -0.319061279296875, -0.24627685546875, -0.173492431640625, -0.1007080078125, -0.027923583984375, 0.04486083984375, 0.117645263671875, 0.1904296875, 0.263214111328125, 0.33599853515625, 0.408782958984375, 0.4815673828125, 0.554351806640625, 0.62713623046875, 0.699920654296875, 0.772705078125, 0.845489501953125, 0.91827392578125, 0.991058349609375, 1.0638427734375, 1.136627197265625, 1.20941162109375, 1.282196044921875, 1.35498046875, 1.427764892578125, 1.50054931640625, 1.573333740234375, 1.6461181640625, 1.718902587890625, 1.79168701171875, 1.864471435546875, 1.937255859375, 2.010040283203125, 2.08282470703125, 2.155609130859375, 2.2283935546875, 2.301177978515625, 2.37396240234375, 2.446746826171875, 2.51953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 6.0, 2.0, 7.0, 9.0, 21.0, 11.0, 17.0, 23.0, 15.0, 20.0, 25.0, 28.0, 27.0, 22.0, 42.0, 33.0, 42.0, 35.0, 39.0, 49.0, 33.0, 47.0, 39.0, 37.0, 39.0, 35.0, 28.0, 33.0, 35.0, 26.0, 27.0, 22.0, 13.0, 21.0, 14.0, 12.0, 9.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.5205078125, -1.47528076171875, -1.4300537109375, -1.38482666015625, -1.339599609375, -1.29437255859375, -1.2491455078125, -1.20391845703125, -1.15869140625, -1.11346435546875, -1.0682373046875, -1.02301025390625, -0.977783203125, -0.93255615234375, -0.8873291015625, -0.84210205078125, -0.796875, -0.75164794921875, -0.7064208984375, -0.66119384765625, -0.615966796875, -0.57073974609375, -0.5255126953125, -0.48028564453125, -0.43505859375, -0.38983154296875, -0.3446044921875, -0.29937744140625, -0.254150390625, -0.20892333984375, -0.1636962890625, -0.11846923828125, -0.0732421875, -0.02801513671875, 0.0172119140625, 0.06243896484375, 0.107666015625, 0.15289306640625, 0.1981201171875, 0.24334716796875, 0.28857421875, 0.33380126953125, 0.3790283203125, 0.42425537109375, 0.469482421875, 0.51470947265625, 0.5599365234375, 0.60516357421875, 0.650390625, 0.69561767578125, 0.7408447265625, 0.78607177734375, 0.831298828125, 0.87652587890625, 0.9217529296875, 0.96697998046875, 1.01220703125, 1.05743408203125, 1.1026611328125, 1.14788818359375, 1.193115234375, 1.23834228515625, 1.2835693359375, 1.32879638671875, 1.3740234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 16.0, 15.0, 33.0, 48.0, 85.0, 135.0, 190.0, 282.0, 479.0, 818.0, 1425.0, 2497.0, 4452.0, 8546.0, 17122.0, 34491.0, 70453.0, 136416.0, 218914.0, 232280.0, 154749.0, 82283.0, 40966.0, 19931.0, 9976.0, 5108.0, 2848.0, 1583.0, 935.0, 556.0, 336.0, 226.0, 119.0, 79.0, 45.0, 31.0, 35.0, 18.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.962890625, -1.897705078125, -1.83251953125, -1.767333984375, -1.7021484375, -1.636962890625, -1.57177734375, -1.506591796875, -1.44140625, -1.376220703125, -1.31103515625, -1.245849609375, -1.1806640625, -1.115478515625, -1.05029296875, -0.985107421875, -0.919921875, -0.854736328125, -0.78955078125, -0.724365234375, -0.6591796875, -0.593994140625, -0.52880859375, -0.463623046875, -0.3984375, -0.333251953125, -0.26806640625, -0.202880859375, -0.1376953125, -0.072509765625, -0.00732421875, 0.057861328125, 0.123046875, 0.188232421875, 0.25341796875, 0.318603515625, 0.3837890625, 0.448974609375, 0.51416015625, 0.579345703125, 0.64453125, 0.709716796875, 0.77490234375, 0.840087890625, 0.9052734375, 0.970458984375, 1.03564453125, 1.100830078125, 1.166015625, 1.231201171875, 1.29638671875, 1.361572265625, 1.4267578125, 1.491943359375, 1.55712890625, 1.622314453125, 1.6875, 1.752685546875, 1.81787109375, 1.883056640625, 1.9482421875, 2.013427734375, 2.07861328125, 2.143798828125, 2.208984375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 5.0, 12.0, 14.0, 20.0, 24.0, 33.0, 42.0, 46.0, 50.0, 69.0, 49.0, 76.0, 63.0, 61.0, 55.0, 62.0, 64.0, 44.0, 35.0, 34.0, 31.0, 16.0, 20.0, 10.0, 12.0, 10.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00016999244689941406, -0.00016469135880470276, -0.00015939027070999146, -0.00015408918261528015, -0.00014878809452056885, -0.00014348700642585754, -0.00013818591833114624, -0.00013288483023643494, -0.00012758374214172363, -0.00012228265404701233, -0.00011698156595230103, -0.00011168047785758972, -0.00010637938976287842, -0.00010107830166816711, -9.577721357345581e-05, -9.047612547874451e-05, -8.51750373840332e-05, -7.98739492893219e-05, -7.45728611946106e-05, -6.927177309989929e-05, -6.397068500518799e-05, -5.8669596910476685e-05, -5.336850881576538e-05, -4.806742072105408e-05, -4.2766332626342773e-05, -3.746524453163147e-05, -3.2164156436920166e-05, -2.6863068342208862e-05, -2.156198024749756e-05, -1.6260892152786255e-05, -1.0959804058074951e-05, -5.6587159633636475e-06, -3.5762786865234375e-07, 4.94346022605896e-06, 1.0244548320770264e-05, 1.5545636415481567e-05, 2.084672451019287e-05, 2.6147812604904175e-05, 3.144890069961548e-05, 3.674998879432678e-05, 4.2051076889038086e-05, 4.735216498374939e-05, 5.265325307846069e-05, 5.7954341173172e-05, 6.32554292678833e-05, 6.85565173625946e-05, 7.385760545730591e-05, 7.915869355201721e-05, 8.445978164672852e-05, 8.976086974143982e-05, 9.506195783615112e-05, 0.00010036304593086243, 0.00010566413402557373, 0.00011096522212028503, 0.00011626631021499634, 0.00012156739830970764, 0.00012686848640441895, 0.00013216957449913025, 0.00013747066259384155, 0.00014277175068855286, 0.00014807283878326416, 0.00015337392687797546, 0.00015867501497268677, 0.00016397610306739807, 0.00016927719116210938]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 10.0, 5.0, 8.0, 12.0, 24.0, 34.0, 40.0, 57.0, 81.0, 109.0, 217.0, 322.0, 523.0, 872.0, 1444.0, 2874.0, 5700.0, 12329.0, 27098.0, 61463.0, 130434.0, 228291.0, 254400.0, 167923.0, 83573.0, 37722.0, 16872.0, 7695.0, 3728.0, 1947.0, 1085.0, 576.0, 363.0, 204.0, 172.0, 115.0, 70.0, 44.0, 39.0, 30.0, 16.0, 11.0, 10.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.310546875, -2.24298095703125, -2.1754150390625, -2.10784912109375, -2.040283203125, -1.97271728515625, -1.9051513671875, -1.83758544921875, -1.77001953125, -1.70245361328125, -1.6348876953125, -1.56732177734375, -1.499755859375, -1.43218994140625, -1.3646240234375, -1.29705810546875, -1.2294921875, -1.16192626953125, -1.0943603515625, -1.02679443359375, -0.959228515625, -0.89166259765625, -0.8240966796875, -0.75653076171875, -0.68896484375, -0.62139892578125, -0.5538330078125, -0.48626708984375, -0.418701171875, -0.35113525390625, -0.2835693359375, -0.21600341796875, -0.1484375, -0.08087158203125, -0.0133056640625, 0.05426025390625, 0.121826171875, 0.18939208984375, 0.2569580078125, 0.32452392578125, 0.39208984375, 0.45965576171875, 0.5272216796875, 0.59478759765625, 0.662353515625, 0.72991943359375, 0.7974853515625, 0.86505126953125, 0.9326171875, 1.00018310546875, 1.0677490234375, 1.13531494140625, 1.202880859375, 1.27044677734375, 1.3380126953125, 1.40557861328125, 1.47314453125, 1.54071044921875, 1.6082763671875, 1.67584228515625, 1.743408203125, 1.81097412109375, 1.8785400390625, 1.94610595703125, 2.013671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 12.0, 6.0, 14.0, 5.0, 15.0, 19.0, 18.0, 34.0, 47.0, 50.0, 67.0, 80.0, 78.0, 85.0, 68.0, 63.0, 78.0, 54.0, 37.0, 39.0, 27.0, 20.0, 24.0, 15.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.48282623291015625, -0.4651641845703125, -0.44750213623046875, -0.429840087890625, -0.41217803955078125, -0.3945159912109375, -0.37685394287109375, -0.35919189453125, -0.34152984619140625, -0.3238677978515625, -0.30620574951171875, -0.288543701171875, -0.27088165283203125, -0.2532196044921875, -0.23555755615234375, -0.2178955078125, -0.20023345947265625, -0.1825714111328125, -0.16490936279296875, -0.147247314453125, -0.12958526611328125, -0.1119232177734375, -0.09426116943359375, -0.07659912109375, -0.05893707275390625, -0.0412750244140625, -0.02361297607421875, -0.005950927734375, 0.01171112060546875, 0.0293731689453125, 0.04703521728515625, 0.064697265625, 0.08235931396484375, 0.1000213623046875, 0.11768341064453125, 0.135345458984375, 0.15300750732421875, 0.1706695556640625, 0.18833160400390625, 0.20599365234375, 0.22365570068359375, 0.2413177490234375, 0.25897979736328125, 0.276641845703125, 0.29430389404296875, 0.3119659423828125, 0.32962799072265625, 0.3472900390625, 0.36495208740234375, 0.3826141357421875, 0.40027618408203125, 0.417938232421875, 0.43560028076171875, 0.4532623291015625, 0.47092437744140625, 0.48858642578125, 0.5062484741210938, 0.5239105224609375, 0.5415725708007812, 0.559234619140625, 0.5768966674804688, 0.5945587158203125, 0.6122207641601562, 0.6298828125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 6.0, 6.0, 8.0, 10.0, 25.0, 26.0, 27.0, 30.0, 42.0, 51.0, 36.0, 60.0, 62.0, 66.0, 83.0, 76.0, 68.0, 50.0, 48.0, 51.0, 31.0, 24.0, 29.0, 14.0, 20.0, 11.0, 6.0, 7.0, 6.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1759355068206787, -3.0269339084625244, -2.877932071685791, -2.7289304733276367, -2.5799286365509033, -2.430927038192749, -2.2819252014160156, -2.1329236030578613, -1.9839218854904175, -1.8349201679229736, -1.6859184503555298, -1.536916732788086, -1.3879151344299316, -1.2389132976531982, -1.089911699295044, -0.9409099817276001, -0.7919082641601562, -0.6429065465927124, -0.49390485882759094, -0.3449031710624695, -0.19590145349502563, -0.04689973592758179, 0.10210192203521729, 0.25110363960266113, 0.400105357170105, 0.5491070747375488, 0.6981087923049927, 0.8471104502677917, 0.9961121678352356, 1.1451139450073242, 1.2941155433654785, 1.4431172609329224, 1.592118740081787, 1.741120457649231, 1.8901221752166748, 2.039123773574829, 2.1881256103515625, 2.337127208709717, 2.486128807067871, 2.6351306438446045, 2.784132480621338, 2.933134078979492, 3.0821359157562256, 3.23113751411438, 3.3801393508911133, 3.5291409492492676, 3.678142547607422, 3.8271443843841553, 3.9761459827423096, 4.125147819519043, 4.274149417877197, 4.423151016235352, 4.572152614593506, 4.721154689788818, 4.870156288146973, 5.019157886505127, 5.168159484863281, 5.3171610832214355, 5.46616268157959, 5.615164756774902, 5.764166355133057, 5.913167953491211, 6.062169551849365, 6.2111711502075195, 6.360173225402832]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 7.0, 11.0, 9.0, 7.0, 13.0, 24.0, 21.0, 32.0, 35.0, 19.0, 31.0, 42.0, 33.0, 36.0, 40.0, 40.0, 34.0, 37.0, 48.0, 43.0, 33.0, 37.0, 28.0, 42.0, 34.0, 36.0, 22.0, 24.0, 25.0, 20.0, 19.0, 13.0, 23.0, 19.0, 14.0, 6.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1072566509246826, -2.0383243560791016, -1.96939218044281, -1.900459885597229, -1.8315277099609375, -1.7625954151153564, -1.6936631202697754, -1.6247308254241943, -1.5557986497879028, -1.4868663549423218, -1.4179341793060303, -1.3490018844604492, -1.2800695896148682, -1.2111374139785767, -1.1422051191329956, -1.073272943496704, -1.004340648651123, -0.9354084134101868, -0.8664761781692505, -0.7975438833236694, -0.7286116480827332, -0.6596794128417969, -0.5907471179962158, -0.5218148827552795, -0.45288264751434326, -0.383950412273407, -0.3150181472301483, -0.24608589708805084, -0.17715364694595337, -0.10822141170501709, -0.03928914666175842, 0.029643118381500244, 0.09857535362243652, 0.167507603764534, 0.23643985390663147, 0.30537211894989014, 0.3743043541908264, 0.4432365894317627, 0.5121688842773438, 0.58110111951828, 0.6500333547592163, 0.7189655900001526, 0.7878978252410889, 0.8568301200866699, 0.9257623553276062, 0.9946945905685425, 1.0636268854141235, 1.132559061050415, 1.201491355895996, 1.2704236507415771, 1.3393558263778687, 1.4082881212234497, 1.4772202968597412, 1.5461525917053223, 1.6150848865509033, 1.6840171813964844, 1.7529493570327759, 1.821881651878357, 1.8908138275146484, 1.9597461223602295, 2.0286784172058105, 2.0976104736328125, 2.1665427684783936, 2.2354750633239746, 2.3044073581695557]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 8.0, 3.0, 6.0, 5.0, 16.0, 18.0, 31.0, 25.0, 43.0, 68.0, 77.0, 119.0, 168.0, 223.0, 339.0, 495.0, 772.0, 1151.0, 1826.0, 2863.0, 4612.0, 7647.0, 12852.0, 22804.0, 41960.0, 81546.0, 167286.0, 372217.0, 809354.0, 1163699.0, 799715.0, 362097.0, 162759.0, 78841.0, 41532.0, 22924.0, 13196.0, 7871.0, 4791.0, 3019.0, 1889.0, 1172.0, 722.0, 508.0, 330.0, 221.0, 166.0, 108.0, 74.0, 45.0, 31.0, 12.0, 10.0, 12.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-4.2265625, -4.100341796875, -3.97412109375, -3.847900390625, -3.7216796875, -3.595458984375, -3.46923828125, -3.343017578125, -3.216796875, -3.090576171875, -2.96435546875, -2.838134765625, -2.7119140625, -2.585693359375, -2.45947265625, -2.333251953125, -2.20703125, -2.080810546875, -1.95458984375, -1.828369140625, -1.7021484375, -1.575927734375, -1.44970703125, -1.323486328125, -1.197265625, -1.071044921875, -0.94482421875, -0.818603515625, -0.6923828125, -0.566162109375, -0.43994140625, -0.313720703125, -0.1875, -0.061279296875, 0.06494140625, 0.191162109375, 0.3173828125, 0.443603515625, 0.56982421875, 0.696044921875, 0.822265625, 0.948486328125, 1.07470703125, 1.200927734375, 1.3271484375, 1.453369140625, 1.57958984375, 1.705810546875, 1.83203125, 1.958251953125, 2.08447265625, 2.210693359375, 2.3369140625, 2.463134765625, 2.58935546875, 2.715576171875, 2.841796875, 2.968017578125, 3.09423828125, 3.220458984375, 3.3466796875, 3.472900390625, 3.59912109375, 3.725341796875, 3.8515625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 11.0, 11.0, 10.0, 16.0, 20.0, 30.0, 20.0, 42.0, 29.0, 31.0, 31.0, 26.0, 45.0, 30.0, 47.0, 39.0, 33.0, 31.0, 29.0, 39.0, 32.0, 35.0, 45.0, 33.0, 26.0, 28.0, 27.0, 25.0, 22.0, 15.0, 12.0, 13.0, 11.0, 14.0, 10.0, 12.0, 4.0, 11.0, 7.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.6083984375, -1.5599517822265625, -1.511505126953125, -1.4630584716796875, -1.41461181640625, -1.3661651611328125, -1.317718505859375, -1.2692718505859375, -1.2208251953125, -1.1723785400390625, -1.123931884765625, -1.0754852294921875, -1.02703857421875, -0.9785919189453125, -0.930145263671875, -0.8816986083984375, -0.833251953125, -0.7848052978515625, -0.736358642578125, -0.6879119873046875, -0.63946533203125, -0.5910186767578125, -0.542572021484375, -0.4941253662109375, -0.4456787109375, -0.3972320556640625, -0.348785400390625, -0.3003387451171875, -0.25189208984375, -0.2034454345703125, -0.154998779296875, -0.1065521240234375, -0.05810546875, -0.0096588134765625, 0.038787841796875, 0.0872344970703125, 0.13568115234375, 0.1841278076171875, 0.232574462890625, 0.2810211181640625, 0.3294677734375, 0.3779144287109375, 0.426361083984375, 0.4748077392578125, 0.52325439453125, 0.5717010498046875, 0.620147705078125, 0.6685943603515625, 0.717041015625, 0.7654876708984375, 0.813934326171875, 0.8623809814453125, 0.91082763671875, 0.9592742919921875, 1.007720947265625, 1.0561676025390625, 1.1046142578125, 1.1530609130859375, 1.201507568359375, 1.2499542236328125, 1.29840087890625, 1.3468475341796875, 1.395294189453125, 1.4437408447265625, 1.4921875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 15.0, 29.0, 50.0, 64.0, 99.0, 185.0, 266.0, 455.0, 781.0, 1220.0, 2101.0, 3397.0, 5882.0, 10704.0, 19212.0, 36738.0, 70946.0, 148270.0, 320188.0, 685952.0, 1124935.0, 904769.0, 449266.0, 205279.0, 97639.0, 48815.0, 25193.0, 13506.0, 7581.0, 4274.0, 2447.0, 1529.0, 911.0, 554.0, 340.0, 249.0, 138.0, 113.0, 55.0, 29.0, 27.0, 23.0, 11.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.20233154296875, -4.0609130859375, -3.91949462890625, -3.778076171875, -3.63665771484375, -3.4952392578125, -3.35382080078125, -3.21240234375, -3.07098388671875, -2.9295654296875, -2.78814697265625, -2.646728515625, -2.50531005859375, -2.3638916015625, -2.22247314453125, -2.0810546875, -1.93963623046875, -1.7982177734375, -1.65679931640625, -1.515380859375, -1.37396240234375, -1.2325439453125, -1.09112548828125, -0.94970703125, -0.80828857421875, -0.6668701171875, -0.52545166015625, -0.384033203125, -0.24261474609375, -0.1011962890625, 0.04022216796875, 0.181640625, 0.32305908203125, 0.4644775390625, 0.60589599609375, 0.747314453125, 0.88873291015625, 1.0301513671875, 1.17156982421875, 1.31298828125, 1.45440673828125, 1.5958251953125, 1.73724365234375, 1.878662109375, 2.02008056640625, 2.1614990234375, 2.30291748046875, 2.4443359375, 2.58575439453125, 2.7271728515625, 2.86859130859375, 3.010009765625, 3.15142822265625, 3.2928466796875, 3.43426513671875, 3.57568359375, 3.71710205078125, 3.8585205078125, 3.99993896484375, 4.141357421875, 4.28277587890625, 4.4241943359375, 4.56561279296875, 4.70703125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 11.0, 15.0, 13.0, 22.0, 17.0, 29.0, 34.0, 51.0, 63.0, 68.0, 77.0, 114.0, 146.0, 152.0, 201.0, 230.0, 259.0, 244.0, 282.0, 281.0, 279.0, 244.0, 233.0, 212.0, 158.0, 150.0, 103.0, 69.0, 67.0, 56.0, 47.0, 34.0, 26.0, 21.0, 19.0, 13.0, 15.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.239715576171875, -1.20306396484375, -1.166412353515625, -1.1297607421875, -1.093109130859375, -1.05645751953125, -1.019805908203125, -0.983154296875, -0.946502685546875, -0.90985107421875, -0.873199462890625, -0.8365478515625, -0.799896240234375, -0.76324462890625, -0.726593017578125, -0.68994140625, -0.653289794921875, -0.61663818359375, -0.579986572265625, -0.5433349609375, -0.506683349609375, -0.47003173828125, -0.433380126953125, -0.396728515625, -0.360076904296875, -0.32342529296875, -0.286773681640625, -0.2501220703125, -0.213470458984375, -0.17681884765625, -0.140167236328125, -0.103515625, -0.066864013671875, -0.03021240234375, 0.006439208984375, 0.0430908203125, 0.079742431640625, 0.11639404296875, 0.153045654296875, 0.189697265625, 0.226348876953125, 0.26300048828125, 0.299652099609375, 0.3363037109375, 0.372955322265625, 0.40960693359375, 0.446258544921875, 0.48291015625, 0.519561767578125, 0.55621337890625, 0.592864990234375, 0.6295166015625, 0.666168212890625, 0.70281982421875, 0.739471435546875, 0.776123046875, 0.812774658203125, 0.84942626953125, 0.886077880859375, 0.9227294921875, 0.959381103515625, 0.99603271484375, 1.032684326171875, 1.0693359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 14.0, 16.0, 15.0, 27.0, 29.0, 30.0, 50.0, 47.0, 56.0, 55.0, 86.0, 78.0, 63.0, 66.0, 60.0, 64.0, 44.0, 40.0, 27.0, 21.0, 17.0, 16.0, 11.0, 12.0, 8.0, 11.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52296781539917, -4.3727850914001465, -4.222602844238281, -4.072420120239258, -3.9222373962402344, -3.772054672241211, -3.6218721866607666, -3.4716897010803223, -3.321506977081299, -3.1713242530822754, -3.021141767501831, -2.8709592819213867, -2.7207765579223633, -2.57059383392334, -2.4204113483428955, -2.270228862762451, -2.1200461387634277, -1.9698635339736938, -1.81968092918396, -1.669498324394226, -1.5193157196044922, -1.3691331148147583, -1.2189505100250244, -1.0687679052352905, -0.9185853004455566, -0.7684026956558228, -0.6182200908660889, -0.468037486076355, -0.3178548812866211, -0.1676722764968872, -0.01748967170715332, 0.13269293308258057, 0.28287506103515625, 0.43305766582489014, 0.583240270614624, 0.7334228754043579, 0.8836054801940918, 1.0337880849838257, 1.1839706897735596, 1.3341532945632935, 1.4843358993530273, 1.6345185041427612, 1.7847011089324951, 1.934883713722229, 2.085066318511963, 2.2352490425109863, 2.3854315280914307, 2.535614013671875, 2.6857967376708984, 2.835979461669922, 2.986161947250366, 3.1363444328308105, 3.286527156829834, 3.4367098808288574, 3.5868923664093018, 3.737074851989746, 3.8872575759887695, 4.037440299987793, 4.187623023986816, 4.337805271148682, 4.487987995147705, 4.6381707191467285, 4.788352966308594, 4.938535690307617, 5.088718414306641]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 11.0, 7.0, 16.0, 17.0, 17.0, 15.0, 23.0, 20.0, 26.0, 23.0, 32.0, 27.0, 36.0, 36.0, 25.0, 49.0, 36.0, 44.0, 40.0, 34.0, 27.0, 35.0, 41.0, 34.0, 36.0, 38.0, 24.0, 32.0, 20.0, 16.0, 22.0, 23.0, 20.0, 16.0, 8.0, 15.0, 9.0, 6.0, 6.0, 4.0, 10.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7342405319213867, -1.6759778261184692, -1.6177152395248413, -1.5594525337219238, -1.5011898279190063, -1.4429271221160889, -1.384664535522461, -1.3264018297195435, -1.268139123916626, -1.2098764181137085, -1.1516138315200806, -1.093351125717163, -1.0350884199142456, -0.9768257737159729, -0.9185631275177002, -0.8603004217147827, -0.8020378351211548, -0.7437751889228821, -0.6855124831199646, -0.6272498369216919, -0.5689871311187744, -0.5107244849205017, -0.452461838722229, -0.3941991627216339, -0.3359364867210388, -0.2776738107204437, -0.21941114962100983, -0.16114848852157593, -0.10288581252098083, -0.04462313652038574, 0.013639509677886963, 0.07190218567848206, 0.13016486167907715, 0.18842753767967224, 0.24669019877910614, 0.30495285987854004, 0.36321553587913513, 0.4214782118797302, 0.47974085807800293, 0.5380035638809204, 0.5962662100791931, 0.6545288562774658, 0.7127915620803833, 0.771054208278656, 0.8293168544769287, 0.8875795602798462, 0.9458422064781189, 1.0041048526763916, 1.062367558479309, 1.1206302642822266, 1.1788928508758545, 1.237155556678772, 1.2954182624816895, 1.3536808490753174, 1.4119435548782349, 1.4702062606811523, 1.5284688472747803, 1.5867315530776978, 1.6449941396713257, 1.7032568454742432, 1.7615195512771606, 1.8197822570800781, 1.878044843673706, 1.9363075494766235, 1.994570255279541]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 11.0, 14.0, 29.0, 39.0, 86.0, 164.0, 220.0, 390.0, 604.0, 1095.0, 1785.0, 3161.0, 6031.0, 10358.0, 19464.0, 36833.0, 68971.0, 124869.0, 194771.0, 218822.0, 159262.0, 93230.0, 49961.0, 26749.0, 13998.0, 7681.0, 4259.0, 2444.0, 1315.0, 747.0, 467.0, 295.0, 169.0, 93.0, 52.0, 38.0, 29.0, 9.0, 5.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.4033203125, -0.3921928405761719, -0.38106536865234375, -0.3699378967285156, -0.3588104248046875, -0.3476829528808594, -0.33655548095703125, -0.3254280090332031, -0.314300537109375, -0.3031730651855469, -0.29204559326171875, -0.2809181213378906, -0.2697906494140625, -0.2586631774902344, -0.24753570556640625, -0.23640823364257812, -0.22528076171875, -0.21415328979492188, -0.20302581787109375, -0.19189834594726562, -0.1807708740234375, -0.16964340209960938, -0.15851593017578125, -0.14738845825195312, -0.136260986328125, -0.12513351440429688, -0.11400604248046875, -0.10287857055664062, -0.0917510986328125, -0.08062362670898438, -0.06949615478515625, -0.058368682861328125, -0.0472412109375, -0.036113739013671875, -0.02498626708984375, -0.013858795166015625, -0.0027313232421875, 0.008396148681640625, 0.01952362060546875, 0.030651092529296875, 0.041778564453125, 0.052906036376953125, 0.06403350830078125, 0.07516098022460938, 0.0862884521484375, 0.09741592407226562, 0.10854339599609375, 0.11967086791992188, 0.13079833984375, 0.14192581176757812, 0.15305328369140625, 0.16418075561523438, 0.1753082275390625, 0.18643569946289062, 0.19756317138671875, 0.20869064331054688, 0.219818115234375, 0.23094558715820312, 0.24207305908203125, 0.2532005310058594, 0.2643280029296875, 0.2754554748535156, 0.28658294677734375, 0.2977104187011719, 0.308837890625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 6.0, 15.0, 9.0, 16.0, 12.0, 15.0, 34.0, 25.0, 26.0, 24.0, 29.0, 28.0, 27.0, 34.0, 34.0, 31.0, 30.0, 35.0, 35.0, 34.0, 41.0, 35.0, 27.0, 30.0, 27.0, 33.0, 23.0, 32.0, 21.0, 28.0, 21.0, 24.0, 21.0, 12.0, 23.0, 10.0, 9.0, 8.0, 12.0, 5.0, 6.0, 11.0, 4.0, 2.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8076171875, -1.7475433349609375, -1.687469482421875, -1.6273956298828125, -1.56732177734375, -1.5072479248046875, -1.447174072265625, -1.3871002197265625, -1.3270263671875, -1.2669525146484375, -1.206878662109375, -1.1468048095703125, -1.08673095703125, -1.0266571044921875, -0.966583251953125, -0.9065093994140625, -0.846435546875, -0.7863616943359375, -0.726287841796875, -0.6662139892578125, -0.60614013671875, -0.5460662841796875, -0.485992431640625, -0.4259185791015625, -0.3658447265625, -0.3057708740234375, -0.245697021484375, -0.1856231689453125, -0.12554931640625, -0.0654754638671875, -0.005401611328125, 0.0546722412109375, 0.11474609375, 0.1748199462890625, 0.234893798828125, 0.2949676513671875, 0.35504150390625, 0.4151153564453125, 0.475189208984375, 0.5352630615234375, 0.5953369140625, 0.6554107666015625, 0.715484619140625, 0.7755584716796875, 0.83563232421875, 0.8957061767578125, 0.955780029296875, 1.0158538818359375, 1.075927734375, 1.1360015869140625, 1.196075439453125, 1.2561492919921875, 1.31622314453125, 1.3762969970703125, 1.436370849609375, 1.4964447021484375, 1.5565185546875, 1.6165924072265625, 1.676666259765625, 1.7367401123046875, 1.79681396484375, 1.8568878173828125, 1.916961669921875, 1.9770355224609375, 2.037109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 13.0, 7.0, 10.0, 9.0, 23.0, 27.0, 35.0, 45.0, 62.0, 86.0, 107.0, 171.0, 212.0, 367.0, 511.0, 798.0, 1344.0, 2176.0, 4090.0, 7837.0, 17034.0, 45426.0, 817685.0, 104685.0, 23152.0, 10193.0, 5227.0, 2753.0, 1623.0, 908.0, 581.0, 401.0, 277.0, 177.0, 142.0, 94.0, 61.0, 55.0, 40.0, 30.0, 19.0, 14.0, 16.0, 11.0, 7.0, 1.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.8077774047851562, -0.7796173095703125, -0.7514572143554688, -0.723297119140625, -0.6951370239257812, -0.6669769287109375, -0.6388168334960938, -0.61065673828125, -0.5824966430664062, -0.5543365478515625, -0.5261764526367188, -0.498016357421875, -0.46985626220703125, -0.4416961669921875, -0.41353607177734375, -0.3853759765625, -0.35721588134765625, -0.3290557861328125, -0.30089569091796875, -0.272735595703125, -0.24457550048828125, -0.2164154052734375, -0.18825531005859375, -0.16009521484375, -0.13193511962890625, -0.1037750244140625, -0.07561492919921875, -0.047454833984375, -0.01929473876953125, 0.0088653564453125, 0.03702545166015625, 0.065185546875, 0.09334564208984375, 0.1215057373046875, 0.14966583251953125, 0.177825927734375, 0.20598602294921875, 0.2341461181640625, 0.26230621337890625, 0.29046630859375, 0.31862640380859375, 0.3467864990234375, 0.37494659423828125, 0.403106689453125, 0.43126678466796875, 0.4594268798828125, 0.48758697509765625, 0.5157470703125, 0.5439071655273438, 0.5720672607421875, 0.6002273559570312, 0.628387451171875, 0.6565475463867188, 0.6847076416015625, 0.7128677368164062, 0.74102783203125, 0.7691879272460938, 0.7973480224609375, 0.8255081176757812, 0.853668212890625, 0.8818283081054688, 0.9099884033203125, 0.9381484985351562, 0.96630859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 9.0, 14.0, 13.0, 14.0, 9.0, 12.0, 18.0, 28.0, 31.0, 23.0, 37.0, 38.0, 32.0, 36.0, 41.0, 36.0, 31.0, 38.0, 46.0, 41.0, 30.0, 33.0, 34.0, 37.0, 30.0, 31.0, 29.0, 18.0, 20.0, 22.0, 24.0, 12.0, 20.0, 12.0, 12.0, 10.0, 8.0, 8.0, 13.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2724609375, -1.230499267578125, -1.18853759765625, -1.146575927734375, -1.1046142578125, -1.062652587890625, -1.02069091796875, -0.978729248046875, -0.936767578125, -0.894805908203125, -0.85284423828125, -0.810882568359375, -0.7689208984375, -0.726959228515625, -0.68499755859375, -0.643035888671875, -0.60107421875, -0.559112548828125, -0.51715087890625, -0.475189208984375, -0.4332275390625, -0.391265869140625, -0.34930419921875, -0.307342529296875, -0.265380859375, -0.223419189453125, -0.18145751953125, -0.139495849609375, -0.0975341796875, -0.055572509765625, -0.01361083984375, 0.028350830078125, 0.0703125, 0.112274169921875, 0.15423583984375, 0.196197509765625, 0.2381591796875, 0.280120849609375, 0.32208251953125, 0.364044189453125, 0.406005859375, 0.447967529296875, 0.48992919921875, 0.531890869140625, 0.5738525390625, 0.615814208984375, 0.65777587890625, 0.699737548828125, 0.74169921875, 0.783660888671875, 0.82562255859375, 0.867584228515625, 0.9095458984375, 0.951507568359375, 0.99346923828125, 1.035430908203125, 1.077392578125, 1.119354248046875, 1.16131591796875, 1.203277587890625, 1.2452392578125, 1.287200927734375, 1.32916259765625, 1.371124267578125, 1.4130859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 15.0, 17.0, 19.0, 35.0, 38.0, 65.0, 96.0, 174.0, 268.0, 418.0, 637.0, 1136.0, 1815.0, 3097.0, 5285.0, 9482.0, 18389.0, 41509.0, 872844.0, 49095.0, 19737.0, 10362.0, 5755.0, 3300.0, 1882.0, 1185.0, 667.0, 465.0, 268.0, 182.0, 93.0, 69.0, 46.0, 41.0, 21.0, 20.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21637725830078125, -0.2097320556640625, -0.20308685302734375, -0.196441650390625, -0.18979644775390625, -0.1831512451171875, -0.17650604248046875, -0.16986083984375, -0.16321563720703125, -0.1565704345703125, -0.14992523193359375, -0.143280029296875, -0.13663482666015625, -0.1299896240234375, -0.12334442138671875, -0.11669921875, -0.11005401611328125, -0.1034088134765625, -0.09676361083984375, -0.090118408203125, -0.08347320556640625, -0.0768280029296875, -0.07018280029296875, -0.06353759765625, -0.05689239501953125, -0.0502471923828125, -0.04360198974609375, -0.036956787109375, -0.03031158447265625, -0.0236663818359375, -0.01702117919921875, -0.0103759765625, -0.00373077392578125, 0.0029144287109375, 0.00955963134765625, 0.016204833984375, 0.02285003662109375, 0.0294952392578125, 0.03614044189453125, 0.04278564453125, 0.04943084716796875, 0.0560760498046875, 0.06272125244140625, 0.069366455078125, 0.07601165771484375, 0.0826568603515625, 0.08930206298828125, 0.095947265625, 0.10259246826171875, 0.1092376708984375, 0.11588287353515625, 0.122528076171875, 0.12917327880859375, 0.1358184814453125, 0.14246368408203125, 0.14910888671875, 0.15575408935546875, 0.1623992919921875, 0.16904449462890625, 0.175689697265625, 0.18233489990234375, 0.1889801025390625, 0.19562530517578125, 0.2022705078125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 4.0, 9.0, 14.0, 23.0, 29.0, 28.0, 39.0, 49.0, 47.0, 64.0, 71.0, 82.0, 71.0, 65.0, 59.0, 63.0, 62.0, 42.0, 39.0, 31.0, 29.0, 15.0, 13.0, 5.0, 9.0, 2.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.7637691497802734e-05, -5.59687614440918e-05, -5.429983139038086e-05, -5.263090133666992e-05, -5.0961971282958984e-05, -4.929304122924805e-05, -4.762411117553711e-05, -4.595518112182617e-05, -4.4286251068115234e-05, -4.26173210144043e-05, -4.094839096069336e-05, -3.927946090698242e-05, -3.7610530853271484e-05, -3.594160079956055e-05, -3.427267074584961e-05, -3.260374069213867e-05, -3.0934810638427734e-05, -2.9265880584716797e-05, -2.759695053100586e-05, -2.5928020477294922e-05, -2.4259090423583984e-05, -2.2590160369873047e-05, -2.092123031616211e-05, -1.9252300262451172e-05, -1.7583370208740234e-05, -1.5914440155029297e-05, -1.424551010131836e-05, -1.2576580047607422e-05, -1.0907649993896484e-05, -9.238719940185547e-06, -7.569789886474609e-06, -5.900859832763672e-06, -4.231929779052734e-06, -2.562999725341797e-06, -8.940696716308594e-07, 7.748603820800781e-07, 2.4437904357910156e-06, 4.112720489501953e-06, 5.781650543212891e-06, 7.450580596923828e-06, 9.119510650634766e-06, 1.0788440704345703e-05, 1.245737075805664e-05, 1.4126300811767578e-05, 1.5795230865478516e-05, 1.7464160919189453e-05, 1.913309097290039e-05, 2.0802021026611328e-05, 2.2470951080322266e-05, 2.4139881134033203e-05, 2.580881118774414e-05, 2.7477741241455078e-05, 2.9146671295166016e-05, 3.081560134887695e-05, 3.248453140258789e-05, 3.415346145629883e-05, 3.5822391510009766e-05, 3.74913215637207e-05, 3.916025161743164e-05, 4.082918167114258e-05, 4.2498111724853516e-05, 4.416704177856445e-05, 4.583597183227539e-05, 4.750490188598633e-05, 4.9173831939697266e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 11.0, 13.0, 16.0, 30.0, 50.0, 59.0, 97.0, 153.0, 254.0, 354.0, 548.0, 887.0, 1365.0, 2205.0, 3612.0, 5744.0, 9350.0, 15719.0, 26414.0, 44122.0, 76052.0, 125850.0, 182444.0, 193555.0, 142334.0, 88334.0, 52021.0, 30322.0, 18254.0, 10655.0, 6620.0, 4070.0, 2552.0, 1611.0, 1051.0, 635.0, 443.0, 251.0, 169.0, 117.0, 67.0, 49.0, 38.0, 15.0, 19.0, 9.0, 4.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.07196044921875, -0.06985282897949219, -0.06774520874023438, -0.06563758850097656, -0.06352996826171875, -0.06142234802246094, -0.059314727783203125, -0.05720710754394531, -0.0550994873046875, -0.05299186706542969, -0.050884246826171875, -0.04877662658691406, -0.04666900634765625, -0.04456138610839844, -0.042453765869140625, -0.04034614562988281, -0.038238525390625, -0.03613090515136719, -0.034023284912109375, -0.03191566467285156, -0.02980804443359375, -0.027700424194335938, -0.025592803955078125, -0.023485183715820312, -0.0213775634765625, -0.019269943237304688, -0.017162322998046875, -0.015054702758789062, -0.01294708251953125, -0.010839462280273438, -0.008731842041015625, -0.0066242218017578125, -0.0045166015625, -0.0024089813232421875, -0.000301361083984375, 0.0018062591552734375, 0.00391387939453125, 0.0060214996337890625, 0.008129119873046875, 0.010236740112304688, 0.0123443603515625, 0.014451980590820312, 0.016559600830078125, 0.018667221069335938, 0.02077484130859375, 0.022882461547851562, 0.024990081787109375, 0.027097702026367188, 0.029205322265625, 0.03131294250488281, 0.033420562744140625, 0.03552818298339844, 0.03763580322265625, 0.03974342346191406, 0.041851043701171875, 0.04395866394042969, 0.0460662841796875, 0.04817390441894531, 0.050281524658203125, 0.05238914489746094, 0.05449676513671875, 0.05660438537597656, 0.058712005615234375, 0.06081962585449219, 0.06292724609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 1.0, 10.0, 5.0, 9.0, 9.0, 9.0, 8.0, 14.0, 16.0, 19.0, 16.0, 22.0, 32.0, 26.0, 34.0, 44.0, 40.0, 57.0, 29.0, 47.0, 56.0, 52.0, 48.0, 51.0, 58.0, 41.0, 47.0, 27.0, 26.0, 27.0, 23.0, 13.0, 16.0, 14.0, 6.0, 9.0, 8.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.017547607421875, -0.017049312591552734, -0.01655101776123047, -0.016052722930908203, -0.015554428100585938, -0.015056133270263672, -0.014557838439941406, -0.01405954360961914, -0.013561248779296875, -0.01306295394897461, -0.012564659118652344, -0.012066364288330078, -0.011568069458007812, -0.011069774627685547, -0.010571479797363281, -0.010073184967041016, -0.00957489013671875, -0.009076595306396484, -0.008578300476074219, -0.008080005645751953, -0.0075817108154296875, -0.007083415985107422, -0.006585121154785156, -0.006086826324462891, -0.005588531494140625, -0.005090236663818359, -0.004591941833496094, -0.004093647003173828, -0.0035953521728515625, -0.003097057342529297, -0.0025987625122070312, -0.0021004676818847656, -0.0016021728515625, -0.0011038780212402344, -0.0006055831909179688, -0.00010728836059570312, 0.0003910064697265625, 0.0008893013000488281, 0.0013875961303710938, 0.0018858909606933594, 0.002384185791015625, 0.0028824806213378906, 0.0033807754516601562, 0.003879070281982422, 0.0043773651123046875, 0.004875659942626953, 0.005373954772949219, 0.005872249603271484, 0.00637054443359375, 0.006868839263916016, 0.007367134094238281, 0.007865428924560547, 0.008363723754882812, 0.008862018585205078, 0.009360313415527344, 0.00985860824584961, 0.010356903076171875, 0.01085519790649414, 0.011353492736816406, 0.011851787567138672, 0.012350082397460938, 0.012848377227783203, 0.013346672058105469, 0.013844966888427734, 0.01434326171875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 13.0, 19.0, 13.0, 26.0, 28.0, 30.0, 39.0, 63.0, 47.0, 54.0, 86.0, 82.0, 57.0, 67.0, 57.0, 68.0, 50.0, 38.0, 29.0, 21.0, 17.0, 16.0, 14.0, 10.0, 9.0, 11.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.529380798339844, -4.3796868324279785, -4.229992866516113, -4.080298900604248, -3.930605173110962, -3.7809112071990967, -3.6312174797058105, -3.4815235137939453, -3.33182954788208, -3.182135581970215, -3.0324416160583496, -2.8827478885650635, -2.7330539226531982, -2.583359956741333, -2.433666229248047, -2.2839722633361816, -2.1342782974243164, -1.9845843315124512, -1.8348904848098755, -1.6851966381072998, -1.5355026721954346, -1.3858087062835693, -1.2361148595809937, -1.086421012878418, -0.9367270469665527, -0.7870331406593323, -0.6373392343521118, -0.48764532804489136, -0.3379514217376709, -0.18825751543045044, -0.03856360912322998, 0.1111302375793457, 0.26082468032836914, 0.4105185866355896, 0.5602124929428101, 0.7099063992500305, 0.859600305557251, 1.0092942714691162, 1.158988118171692, 1.3086819648742676, 1.4583759307861328, 1.608069896697998, 1.7577637434005737, 1.9074575901031494, 2.0571515560150146, 2.20684552192688, 2.356539249420166, 2.5062332153320312, 2.6559271812438965, 2.8056211471557617, 2.955315113067627, 3.105008840560913, 3.2547028064727783, 3.4043967723846436, 3.5540904998779297, 3.703784465789795, 3.85347843170166, 4.003172397613525, 4.152866363525391, 4.302560329437256, 4.452254295349121, 4.601947784423828, 4.751641750335693, 4.901335716247559, 5.051029682159424]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 12.0, 5.0, 16.0, 19.0, 14.0, 17.0, 23.0, 21.0, 25.0, 25.0, 30.0, 26.0, 38.0, 33.0, 28.0, 46.0, 38.0, 43.0, 42.0, 33.0, 26.0, 41.0, 33.0, 33.0, 41.0, 35.0, 27.0, 31.0, 20.0, 16.0, 21.0, 25.0, 19.0, 16.0, 8.0, 15.0, 9.0, 6.0, 6.0, 4.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7494254112243652, -1.6914043426513672, -1.6333832740783691, -1.575362205505371, -1.517341136932373, -1.459320068359375, -1.401298999786377, -1.343277931213379, -1.2852568626403809, -1.2272357940673828, -1.1692147254943848, -1.1111936569213867, -1.0531725883483887, -0.9951515197753906, -0.9371304512023926, -0.8791093826293945, -0.8210883140563965, -0.7630672454833984, -0.7050461769104004, -0.6470251083374023, -0.5890040397644043, -0.5309829711914062, -0.4729619026184082, -0.41494083404541016, -0.3569197654724121, -0.29889869689941406, -0.24087762832641602, -0.18285655975341797, -0.12483549118041992, -0.06681442260742188, -0.008793354034423828, 0.04922771453857422, 0.10724878311157227, 0.1652698516845703, 0.22329092025756836, 0.2813119888305664, 0.33933305740356445, 0.3973541259765625, 0.45537519454956055, 0.5133962631225586, 0.5714173316955566, 0.6294384002685547, 0.6874594688415527, 0.7454805374145508, 0.8035016059875488, 0.8615226745605469, 0.9195437431335449, 0.977564811706543, 1.035585880279541, 1.093606948852539, 1.151628017425537, 1.2096490859985352, 1.2676701545715332, 1.3256912231445312, 1.3837122917175293, 1.4417333602905273, 1.4997544288635254, 1.5577754974365234, 1.6157965660095215, 1.6738176345825195, 1.7318387031555176, 1.7898597717285156, 1.8478808403015137, 1.9059019088745117, 1.9639229774475098]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 13.0, 12.0, 27.0, 38.0, 57.0, 97.0, 163.0, 211.0, 317.0, 554.0, 809.0, 1272.0, 2022.0, 3350.0, 5101.0, 8424.0, 13640.0, 22573.0, 36626.0, 58771.0, 90041.0, 124956.0, 151061.0, 151670.0, 127535.0, 91557.0, 59864.0, 37578.0, 23229.0, 14002.0, 8603.0, 5253.0, 3255.0, 2146.0, 1289.0, 845.0, 549.0, 372.0, 221.0, 155.0, 93.0, 65.0, 51.0, 32.0, 15.0, 10.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.455078125, -2.37841796875, -2.3017578125, -2.22509765625, -2.1484375, -2.07177734375, -1.9951171875, -1.91845703125, -1.841796875, -1.76513671875, -1.6884765625, -1.61181640625, -1.53515625, -1.45849609375, -1.3818359375, -1.30517578125, -1.228515625, -1.15185546875, -1.0751953125, -0.99853515625, -0.921875, -0.84521484375, -0.7685546875, -0.69189453125, -0.615234375, -0.53857421875, -0.4619140625, -0.38525390625, -0.30859375, -0.23193359375, -0.1552734375, -0.07861328125, -0.001953125, 0.07470703125, 0.1513671875, 0.22802734375, 0.3046875, 0.38134765625, 0.4580078125, 0.53466796875, 0.611328125, 0.68798828125, 0.7646484375, 0.84130859375, 0.91796875, 0.99462890625, 1.0712890625, 1.14794921875, 1.224609375, 1.30126953125, 1.3779296875, 1.45458984375, 1.53125, 1.60791015625, 1.6845703125, 1.76123046875, 1.837890625, 1.91455078125, 1.9912109375, 2.06787109375, 2.14453125, 2.22119140625, 2.2978515625, 2.37451171875, 2.451171875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 11.0, 14.0, 18.0, 25.0, 18.0, 22.0, 32.0, 29.0, 27.0, 37.0, 34.0, 23.0, 38.0, 38.0, 51.0, 44.0, 44.0, 40.0, 36.0, 35.0, 36.0, 35.0, 28.0, 29.0, 28.0, 28.0, 25.0, 24.0, 19.0, 14.0, 8.0, 11.0, 15.0, 11.0, 2.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.955596923828125, -1.88775634765625, -1.819915771484375, -1.7520751953125, -1.684234619140625, -1.61639404296875, -1.548553466796875, -1.480712890625, -1.412872314453125, -1.34503173828125, -1.277191162109375, -1.2093505859375, -1.141510009765625, -1.07366943359375, -1.005828857421875, -0.93798828125, -0.870147705078125, -0.80230712890625, -0.734466552734375, -0.6666259765625, -0.598785400390625, -0.53094482421875, -0.463104248046875, -0.395263671875, -0.327423095703125, -0.25958251953125, -0.191741943359375, -0.1239013671875, -0.056060791015625, 0.01177978515625, 0.079620361328125, 0.1474609375, 0.215301513671875, 0.28314208984375, 0.350982666015625, 0.4188232421875, 0.486663818359375, 0.55450439453125, 0.622344970703125, 0.690185546875, 0.758026123046875, 0.82586669921875, 0.893707275390625, 0.9615478515625, 1.029388427734375, 1.09722900390625, 1.165069580078125, 1.23291015625, 1.300750732421875, 1.36859130859375, 1.436431884765625, 1.5042724609375, 1.572113037109375, 1.63995361328125, 1.707794189453125, 1.775634765625, 1.843475341796875, 1.91131591796875, 1.979156494140625, 2.0469970703125, 2.114837646484375, 2.18267822265625, 2.250518798828125, 2.318359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 17.0, 19.0, 41.0, 50.0, 76.0, 105.0, 177.0, 287.0, 352.0, 568.0, 844.0, 1387.0, 2294.0, 3789.0, 6142.0, 10569.0, 17988.0, 30935.0, 52496.0, 83792.0, 123336.0, 157414.0, 165512.0, 137665.0, 98118.0, 62314.0, 37769.0, 22045.0, 12906.0, 7640.0, 4486.0, 2709.0, 1716.0, 1047.0, 666.0, 424.0, 265.0, 201.0, 135.0, 85.0, 44.0, 45.0, 17.0, 18.0, 14.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.527587890625, -2.44384765625, -2.360107421875, -2.2763671875, -2.192626953125, -2.10888671875, -2.025146484375, -1.94140625, -1.857666015625, -1.77392578125, -1.690185546875, -1.6064453125, -1.522705078125, -1.43896484375, -1.355224609375, -1.271484375, -1.187744140625, -1.10400390625, -1.020263671875, -0.9365234375, -0.852783203125, -0.76904296875, -0.685302734375, -0.6015625, -0.517822265625, -0.43408203125, -0.350341796875, -0.2666015625, -0.182861328125, -0.09912109375, -0.015380859375, 0.068359375, 0.152099609375, 0.23583984375, 0.319580078125, 0.4033203125, 0.487060546875, 0.57080078125, 0.654541015625, 0.73828125, 0.822021484375, 0.90576171875, 0.989501953125, 1.0732421875, 1.156982421875, 1.24072265625, 1.324462890625, 1.408203125, 1.491943359375, 1.57568359375, 1.659423828125, 1.7431640625, 1.826904296875, 1.91064453125, 1.994384765625, 2.078125, 2.161865234375, 2.24560546875, 2.329345703125, 2.4130859375, 2.496826171875, 2.58056640625, 2.664306640625, 2.748046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 6.0, 7.0, 5.0, 9.0, 15.0, 15.0, 5.0, 12.0, 16.0, 19.0, 27.0, 23.0, 24.0, 37.0, 25.0, 30.0, 40.0, 32.0, 36.0, 38.0, 36.0, 52.0, 44.0, 36.0, 47.0, 43.0, 35.0, 38.0, 27.0, 20.0, 24.0, 28.0, 29.0, 14.0, 12.0, 19.0, 7.0, 12.0, 7.0, 8.0, 13.0, 5.0, 2.0, 7.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.13092041015625, -1.0899658203125, -1.04901123046875, -1.008056640625, -0.96710205078125, -0.9261474609375, -0.88519287109375, -0.84423828125, -0.80328369140625, -0.7623291015625, -0.72137451171875, -0.680419921875, -0.63946533203125, -0.5985107421875, -0.55755615234375, -0.5166015625, -0.47564697265625, -0.4346923828125, -0.39373779296875, -0.352783203125, -0.31182861328125, -0.2708740234375, -0.22991943359375, -0.18896484375, -0.14801025390625, -0.1070556640625, -0.06610107421875, -0.025146484375, 0.01580810546875, 0.0567626953125, 0.09771728515625, 0.138671875, 0.17962646484375, 0.2205810546875, 0.26153564453125, 0.302490234375, 0.34344482421875, 0.3843994140625, 0.42535400390625, 0.46630859375, 0.50726318359375, 0.5482177734375, 0.58917236328125, 0.630126953125, 0.67108154296875, 0.7120361328125, 0.75299072265625, 0.7939453125, 0.83489990234375, 0.8758544921875, 0.91680908203125, 0.957763671875, 0.99871826171875, 1.0396728515625, 1.08062744140625, 1.12158203125, 1.16253662109375, 1.2034912109375, 1.24444580078125, 1.285400390625, 1.32635498046875, 1.3673095703125, 1.40826416015625, 1.44921875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 12.0, 17.0, 17.0, 36.0, 48.0, 66.0, 123.0, 205.0, 307.0, 504.0, 829.0, 1428.0, 2382.0, 4214.0, 7388.0, 13151.0, 23990.0, 42627.0, 75139.0, 124603.0, 177281.0, 191828.0, 152613.0, 98457.0, 57875.0, 32195.0, 17738.0, 10187.0, 5525.0, 3166.0, 1889.0, 1059.0, 661.0, 383.0, 232.0, 132.0, 91.0, 63.0, 36.0, 32.0, 14.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4732513427734375, -1.421112060546875, -1.3689727783203125, -1.31683349609375, -1.2646942138671875, -1.212554931640625, -1.1604156494140625, -1.1082763671875, -1.0561370849609375, -1.003997802734375, -0.9518585205078125, -0.89971923828125, -0.8475799560546875, -0.795440673828125, -0.7433013916015625, -0.691162109375, -0.6390228271484375, -0.586883544921875, -0.5347442626953125, -0.48260498046875, -0.4304656982421875, -0.378326416015625, -0.3261871337890625, -0.2740478515625, -0.2219085693359375, -0.169769287109375, -0.1176300048828125, -0.06549072265625, -0.0133514404296875, 0.038787841796875, 0.0909271240234375, 0.14306640625, 0.1952056884765625, 0.247344970703125, 0.2994842529296875, 0.35162353515625, 0.4037628173828125, 0.455902099609375, 0.5080413818359375, 0.5601806640625, 0.6123199462890625, 0.664459228515625, 0.7165985107421875, 0.76873779296875, 0.8208770751953125, 0.873016357421875, 0.9251556396484375, 0.977294921875, 1.0294342041015625, 1.081573486328125, 1.1337127685546875, 1.18585205078125, 1.2379913330078125, 1.290130615234375, 1.3422698974609375, 1.3944091796875, 1.4465484619140625, 1.498687744140625, 1.5508270263671875, 1.60296630859375, 1.6551055908203125, 1.707244873046875, 1.7593841552734375, 1.8115234375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 6.0, 9.0, 17.0, 17.0, 28.0, 40.0, 45.0, 52.0, 75.0, 106.0, 101.0, 101.0, 90.0, 76.0, 66.0, 37.0, 43.0, 18.0, 27.0, 13.0, 15.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019490718841552734, -0.00018788687884807587, -0.0001808665692806244, -0.0001738462597131729, -0.00016682595014572144, -0.00015980564057826996, -0.00015278533101081848, -0.000145765021443367, -0.00013874471187591553, -0.00013172440230846405, -0.00012470409274101257, -0.0001176837831735611, -0.00011066347360610962, -0.00010364316403865814, -9.662285447120667e-05, -8.960254490375519e-05, -8.258223533630371e-05, -7.556192576885223e-05, -6.854161620140076e-05, -6.152130663394928e-05, -5.45009970664978e-05, -4.7480687499046326e-05, -4.046037793159485e-05, -3.344006836414337e-05, -2.6419758796691895e-05, -1.9399449229240417e-05, -1.237913966178894e-05, -5.358830094337463e-06, 1.6614794731140137e-06, 8.68178904056549e-06, 1.5702098608016968e-05, 2.2722408175468445e-05, 2.9742717742919922e-05, 3.67630273103714e-05, 4.3783336877822876e-05, 5.080364644527435e-05, 5.782395601272583e-05, 6.484426558017731e-05, 7.186457514762878e-05, 7.888488471508026e-05, 8.590519428253174e-05, 9.292550384998322e-05, 9.994581341743469e-05, 0.00010696612298488617, 0.00011398643255233765, 0.00012100674211978912, 0.0001280270516872406, 0.00013504736125469208, 0.00014206767082214355, 0.00014908798038959503, 0.0001561082899570465, 0.00016312859952449799, 0.00017014890909194946, 0.00017716921865940094, 0.00018418952822685242, 0.0001912098377943039, 0.00019823014736175537, 0.00020525045692920685, 0.00021227076649665833, 0.0002192910760641098, 0.00022631138563156128, 0.00023333169519901276, 0.00024035200476646423, 0.0002473723143339157, 0.0002543926239013672]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 5.0, 13.0, 16.0, 19.0, 38.0, 43.0, 58.0, 124.0, 151.0, 239.0, 352.0, 537.0, 829.0, 1228.0, 1876.0, 2971.0, 4544.0, 7138.0, 11260.0, 17251.0, 27439.0, 42794.0, 65154.0, 94782.0, 127091.0, 147868.0, 142009.0, 115157.0, 82496.0, 55309.0, 36010.0, 22997.0, 14392.0, 9351.0, 6029.0, 3758.0, 2494.0, 1615.0, 1050.0, 699.0, 462.0, 313.0, 183.0, 146.0, 83.0, 52.0, 49.0, 20.0, 15.0, 12.0, 11.0, 6.0, 9.0, 6.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.177734375, -1.1407012939453125, -1.103668212890625, -1.0666351318359375, -1.02960205078125, -0.9925689697265625, -0.955535888671875, -0.9185028076171875, -0.8814697265625, -0.8444366455078125, -0.807403564453125, -0.7703704833984375, -0.73333740234375, -0.6963043212890625, -0.659271240234375, -0.6222381591796875, -0.585205078125, -0.5481719970703125, -0.511138916015625, -0.4741058349609375, -0.43707275390625, -0.4000396728515625, -0.363006591796875, -0.3259735107421875, -0.2889404296875, -0.2519073486328125, -0.214874267578125, -0.1778411865234375, -0.14080810546875, -0.1037750244140625, -0.066741943359375, -0.0297088623046875, 0.00732421875, 0.0443572998046875, 0.081390380859375, 0.1184234619140625, 0.15545654296875, 0.1924896240234375, 0.229522705078125, 0.2665557861328125, 0.3035888671875, 0.3406219482421875, 0.377655029296875, 0.4146881103515625, 0.45172119140625, 0.4887542724609375, 0.525787353515625, 0.5628204345703125, 0.599853515625, 0.6368865966796875, 0.673919677734375, 0.7109527587890625, 0.74798583984375, 0.7850189208984375, 0.822052001953125, 0.8590850830078125, 0.8961181640625, 0.9331512451171875, 0.970184326171875, 1.0072174072265625, 1.04425048828125, 1.0812835693359375, 1.118316650390625, 1.1553497314453125, 1.1923828125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 4.0, 5.0, 10.0, 12.0, 20.0, 16.0, 18.0, 22.0, 23.0, 35.0, 38.0, 41.0, 41.0, 39.0, 48.0, 63.0, 48.0, 49.0, 36.0, 52.0, 42.0, 28.0, 41.0, 34.0, 31.0, 26.0, 24.0, 26.0, 22.0, 13.0, 15.0, 9.0, 8.0, 12.0, 11.0, 1.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.2984199523925781, -0.28775787353515625, -0.2770957946777344, -0.2664337158203125, -0.2557716369628906, -0.24510955810546875, -0.23444747924804688, -0.223785400390625, -0.21312332153320312, -0.20246124267578125, -0.19179916381835938, -0.1811370849609375, -0.17047500610351562, -0.15981292724609375, -0.14915084838867188, -0.13848876953125, -0.12782669067382812, -0.11716461181640625, -0.10650253295898438, -0.0958404541015625, -0.08517837524414062, -0.07451629638671875, -0.06385421752929688, -0.053192138671875, -0.042530059814453125, -0.03186798095703125, -0.021205902099609375, -0.0105438232421875, 0.000118255615234375, 0.01078033447265625, 0.021442413330078125, 0.0321044921875, 0.042766571044921875, 0.05342864990234375, 0.06409072875976562, 0.0747528076171875, 0.08541488647460938, 0.09607696533203125, 0.10673904418945312, 0.117401123046875, 0.12806320190429688, 0.13872528076171875, 0.14938735961914062, 0.1600494384765625, 0.17071151733398438, 0.18137359619140625, 0.19203567504882812, 0.20269775390625, 0.21335983276367188, 0.22402191162109375, 0.23468399047851562, 0.2453460693359375, 0.2560081481933594, 0.26667022705078125, 0.2773323059082031, 0.287994384765625, 0.2986564636230469, 0.30931854248046875, 0.3199806213378906, 0.3306427001953125, 0.3413047790527344, 0.35196685791015625, 0.3626289367675781, 0.373291015625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 15.0, 12.0, 17.0, 15.0, 14.0, 30.0, 39.0, 53.0, 56.0, 61.0, 63.0, 66.0, 76.0, 63.0, 77.0, 54.0, 56.0, 47.0, 37.0, 22.0, 17.0, 23.0, 16.0, 14.0, 9.0, 10.0, 3.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.714277267456055, -4.566986083984375, -4.419694900512695, -4.272403717041016, -4.125112533569336, -3.9778213500976562, -3.8305299282073975, -3.6832387447357178, -3.535947561264038, -3.3886563777923584, -3.2413651943206787, -3.094074010848999, -2.9467825889587402, -2.7994914054870605, -2.652200222015381, -2.504909038543701, -2.3576178550720215, -2.210326671600342, -2.063035488128662, -1.9157441854476929, -1.7684530019760132, -1.6211618185043335, -1.4738705158233643, -1.3265793323516846, -1.1792881488800049, -1.0319969654083252, -0.8847057223320007, -0.7374144792556763, -0.5901232957839966, -0.4428321123123169, -0.29554086923599243, -0.14824962615966797, -0.0009589195251464844, 0.1463322937488556, 0.29362350702285767, 0.44091472029685974, 0.5882059335708618, 0.7354971170425415, 0.882788360118866, 1.0300796031951904, 1.1773707866668701, 1.3246619701385498, 1.4719531536102295, 1.6192444562911987, 1.7665356397628784, 1.913826823234558, 2.0611181259155273, 2.208409309387207, 2.3557004928588867, 2.5029916763305664, 2.650282859802246, 2.797574043273926, 2.9448652267456055, 3.092156410217285, 3.239447832107544, 3.3867390155792236, 3.5340301990509033, 3.681321382522583, 3.8286125659942627, 3.9759037494659424, 4.123195171356201, 4.270486354827881, 4.4177775382995605, 4.56506872177124, 4.71235990524292]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 3.0, 3.0, 4.0, 1.0, 8.0, 8.0, 9.0, 9.0, 11.0, 20.0, 15.0, 10.0, 19.0, 19.0, 24.0, 31.0, 26.0, 25.0, 36.0, 30.0, 28.0, 37.0, 44.0, 50.0, 38.0, 35.0, 38.0, 32.0, 29.0, 24.0, 28.0, 36.0, 25.0, 34.0, 30.0, 26.0, 19.0, 22.0, 24.0, 11.0, 8.0, 10.0, 14.0, 10.0, 7.0, 7.0, 9.0, 3.0, 7.0, 5.0, 0.0, 3.0, 2.0, 6.0, 0.0, 1.0, 2.0], "bins": [-1.959781289100647, -1.899973750114441, -1.8401663303375244, -1.7803587913513184, -1.7205513715744019, -1.6607438325881958, -1.6009364128112793, -1.5411288738250732, -1.4813213348388672, -1.4215137958526611, -1.3617063760757446, -1.3018988370895386, -1.242091417312622, -1.182283878326416, -1.12247633934021, -1.0626689195632935, -1.002861499786377, -0.9430540204048157, -0.8832465410232544, -0.8234390020370483, -0.7636315822601318, -0.7038240432739258, -0.6440165638923645, -0.5842090845108032, -0.5244016051292419, -0.46459412574768066, -0.4047866463661194, -0.3449791371822357, -0.28517165780067444, -0.22536417841911316, -0.1655566692352295, -0.10574918985366821, -0.045941710472106934, 0.013865776360034943, 0.07367326319217682, 0.1334807574748993, 0.19328823685646057, 0.25309571623802185, 0.3129032254219055, 0.3727107048034668, 0.4325181841850281, 0.49232566356658936, 0.5521331429481506, 0.6119406223297119, 0.671748161315918, 0.7315555810928345, 0.7913631200790405, 0.8511705994606018, 0.9109780788421631, 0.9707855582237244, 1.0305930376052856, 1.0904005765914917, 1.1502079963684082, 1.2100155353546143, 1.2698230743408203, 1.3296304941177368, 1.3894379138946533, 1.4492454528808594, 1.5090528726577759, 1.568860411643982, 1.6286678314208984, 1.6884753704071045, 1.7482829093933105, 1.808090329170227, 1.867897868156433]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 9.0, 8.0, 13.0, 24.0, 31.0, 45.0, 81.0, 96.0, 135.0, 206.0, 328.0, 492.0, 762.0, 1116.0, 1753.0, 2804.0, 4488.0, 7367.0, 11936.0, 20540.0, 36259.0, 67500.0, 133005.0, 278507.0, 600425.0, 1037957.0, 969389.0, 520258.0, 242263.0, 117210.0, 60344.0, 32393.0, 18549.0, 10894.0, 6470.0, 3895.0, 2428.0, 1514.0, 1015.0, 598.0, 393.0, 281.0, 179.0, 118.0, 79.0, 44.0, 30.0, 25.0, 13.0, 9.0, 7.0, 5.0, 2.0, 1.0], "bins": [-4.3046875, -4.184783935546875, -4.06488037109375, -3.944976806640625, -3.8250732421875, -3.705169677734375, -3.58526611328125, -3.465362548828125, -3.345458984375, -3.225555419921875, -3.10565185546875, -2.985748291015625, -2.8658447265625, -2.745941162109375, -2.62603759765625, -2.506134033203125, -2.38623046875, -2.266326904296875, -2.14642333984375, -2.026519775390625, -1.9066162109375, -1.786712646484375, -1.66680908203125, -1.546905517578125, -1.427001953125, -1.307098388671875, -1.18719482421875, -1.067291259765625, -0.9473876953125, -0.827484130859375, -0.70758056640625, -0.587677001953125, -0.4677734375, -0.347869873046875, -0.22796630859375, -0.108062744140625, 0.0118408203125, 0.131744384765625, 0.25164794921875, 0.371551513671875, 0.491455078125, 0.611358642578125, 0.73126220703125, 0.851165771484375, 0.9710693359375, 1.090972900390625, 1.21087646484375, 1.330780029296875, 1.45068359375, 1.570587158203125, 1.69049072265625, 1.810394287109375, 1.9302978515625, 2.050201416015625, 2.17010498046875, 2.290008544921875, 2.409912109375, 2.529815673828125, 2.64971923828125, 2.769622802734375, 2.8895263671875, 3.009429931640625, 3.12933349609375, 3.249237060546875, 3.369140625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 14.0, 10.0, 10.0, 10.0, 18.0, 20.0, 20.0, 21.0, 24.0, 31.0, 20.0, 47.0, 35.0, 36.0, 38.0, 31.0, 41.0, 38.0, 47.0, 39.0, 42.0, 48.0, 36.0, 48.0, 28.0, 38.0, 34.0, 29.0, 12.0, 24.0, 7.0, 17.0, 10.0, 19.0, 10.0, 13.0, 6.0, 5.0, 6.0, 1.0, 6.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.87890625, -1.8269805908203125, -1.775054931640625, -1.7231292724609375, -1.67120361328125, -1.6192779541015625, -1.567352294921875, -1.5154266357421875, -1.4635009765625, -1.4115753173828125, -1.359649658203125, -1.3077239990234375, -1.25579833984375, -1.2038726806640625, -1.151947021484375, -1.1000213623046875, -1.048095703125, -0.9961700439453125, -0.944244384765625, -0.8923187255859375, -0.84039306640625, -0.7884674072265625, -0.736541748046875, -0.6846160888671875, -0.6326904296875, -0.5807647705078125, -0.528839111328125, -0.4769134521484375, -0.42498779296875, -0.3730621337890625, -0.321136474609375, -0.2692108154296875, -0.21728515625, -0.1653594970703125, -0.113433837890625, -0.0615081787109375, -0.00958251953125, 0.0423431396484375, 0.094268798828125, 0.1461944580078125, 0.1981201171875, 0.2500457763671875, 0.301971435546875, 0.3538970947265625, 0.40582275390625, 0.4577484130859375, 0.509674072265625, 0.5615997314453125, 0.613525390625, 0.6654510498046875, 0.717376708984375, 0.7693023681640625, 0.82122802734375, 0.8731536865234375, 0.925079345703125, 0.9770050048828125, 1.0289306640625, 1.0808563232421875, 1.132781982421875, 1.1847076416015625, 1.23663330078125, 1.2885589599609375, 1.340484619140625, 1.3924102783203125, 1.4443359375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 8.0, 18.0, 27.0, 45.0, 59.0, 87.0, 145.0, 225.0, 361.0, 564.0, 861.0, 1291.0, 2038.0, 3275.0, 5463.0, 8708.0, 14303.0, 23790.0, 40590.0, 69876.0, 124796.0, 226503.0, 414431.0, 707492.0, 906769.0, 708604.0, 413161.0, 225275.0, 124499.0, 70042.0, 40275.0, 23608.0, 14370.0, 8596.0, 5232.0, 3268.0, 2005.0, 1304.0, 830.0, 520.0, 321.0, 233.0, 120.0, 98.0, 66.0, 50.0, 24.0, 19.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.484375, -3.373748779296875, -3.26312255859375, -3.152496337890625, -3.0418701171875, -2.931243896484375, -2.82061767578125, -2.709991455078125, -2.599365234375, -2.488739013671875, -2.37811279296875, -2.267486572265625, -2.1568603515625, -2.046234130859375, -1.93560791015625, -1.824981689453125, -1.71435546875, -1.603729248046875, -1.49310302734375, -1.382476806640625, -1.2718505859375, -1.161224365234375, -1.05059814453125, -0.939971923828125, -0.829345703125, -0.718719482421875, -0.60809326171875, -0.497467041015625, -0.3868408203125, -0.276214599609375, -0.16558837890625, -0.054962158203125, 0.0556640625, 0.166290283203125, 0.27691650390625, 0.387542724609375, 0.4981689453125, 0.608795166015625, 0.71942138671875, 0.830047607421875, 0.940673828125, 1.051300048828125, 1.16192626953125, 1.272552490234375, 1.3831787109375, 1.493804931640625, 1.60443115234375, 1.715057373046875, 1.82568359375, 1.936309814453125, 2.04693603515625, 2.157562255859375, 2.2681884765625, 2.378814697265625, 2.48944091796875, 2.600067138671875, 2.710693359375, 2.821319580078125, 2.93194580078125, 3.042572021484375, 3.1531982421875, 3.263824462890625, 3.37445068359375, 3.485076904296875, 3.595703125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 12.0, 8.0, 14.0, 21.0, 25.0, 39.0, 30.0, 48.0, 45.0, 60.0, 71.0, 86.0, 99.0, 98.0, 136.0, 139.0, 166.0, 185.0, 198.0, 223.0, 236.0, 217.0, 206.0, 216.0, 205.0, 155.0, 182.0, 130.0, 126.0, 124.0, 98.0, 77.0, 69.0, 68.0, 45.0, 38.0, 37.0, 27.0, 21.0, 14.0, 13.0, 14.0, 8.0, 7.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8623046875, -0.8345413208007812, -0.8067779541015625, -0.7790145874023438, -0.751251220703125, -0.7234878540039062, -0.6957244873046875, -0.6679611206054688, -0.64019775390625, -0.6124343872070312, -0.5846710205078125, -0.5569076538085938, -0.529144287109375, -0.5013809204101562, -0.4736175537109375, -0.44585418701171875, -0.4180908203125, -0.39032745361328125, -0.3625640869140625, -0.33480072021484375, -0.307037353515625, -0.27927398681640625, -0.2515106201171875, -0.22374725341796875, -0.19598388671875, -0.16822052001953125, -0.1404571533203125, -0.11269378662109375, -0.084930419921875, -0.05716705322265625, -0.0294036865234375, -0.00164031982421875, 0.026123046875, 0.05388641357421875, 0.0816497802734375, 0.10941314697265625, 0.137176513671875, 0.16493988037109375, 0.1927032470703125, 0.22046661376953125, 0.24822998046875, 0.27599334716796875, 0.3037567138671875, 0.33152008056640625, 0.359283447265625, 0.38704681396484375, 0.4148101806640625, 0.44257354736328125, 0.4703369140625, 0.49810028076171875, 0.5258636474609375, 0.5536270141601562, 0.581390380859375, 0.6091537475585938, 0.6369171142578125, 0.6646804809570312, 0.69244384765625, 0.7202072143554688, 0.7479705810546875, 0.7757339477539062, 0.803497314453125, 0.8312606811523438, 0.8590240478515625, 0.8867874145507812, 0.91455078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 9.0, 4.0, 6.0, 4.0, 6.0, 13.0, 13.0, 20.0, 27.0, 26.0, 34.0, 52.0, 60.0, 64.0, 67.0, 66.0, 64.0, 71.0, 64.0, 58.0, 60.0, 34.0, 27.0, 28.0, 30.0, 16.0, 20.0, 10.0, 6.0, 7.0, 7.0, 7.0, 6.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.285930633544922, -4.141051292419434, -3.996171712875366, -3.851292133331299, -3.7064127922058105, -3.561533212661743, -3.416653633117676, -3.2717742919921875, -3.12689471244812, -2.9820151329040527, -2.8371357917785645, -2.692256212234497, -2.5473766326904297, -2.4024972915649414, -2.257617712020874, -2.1127381324768066, -1.9678587913513184, -1.8229793310165405, -1.6780998706817627, -1.5332202911376953, -1.3883408308029175, -1.2434613704681396, -1.0985817909240723, -0.9537023305892944, -0.8088228702545166, -0.6639434099197388, -0.5190638899803162, -0.37418439984321594, -0.22930490970611572, -0.08442544937133789, 0.06045407056808472, 0.20533359050750732, 0.35021352767944336, 0.4950930178165436, 0.6399725079536438, 0.7848520278930664, 0.9297314882278442, 1.074610948562622, 1.2194905281066895, 1.3643699884414673, 1.5092494487762451, 1.654128909111023, 1.7990083694458008, 1.9438879489898682, 2.0887675285339355, 2.233646869659424, 2.378526449203491, 2.5234060287475586, 2.668285369873047, 2.8131649494171143, 2.9580442905426025, 3.10292387008667, 3.247803211212158, 3.3926827907562256, 3.537562370300293, 3.6824417114257812, 3.8273212909698486, 3.972200870513916, 4.117080211639404, 4.261959552764893, 4.406839370727539, 4.551718711853027, 4.696598052978516, 4.841477870941162, 4.98635721206665]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 10.0, 13.0, 12.0, 11.0, 12.0, 11.0, 15.0, 21.0, 25.0, 17.0, 23.0, 26.0, 24.0, 31.0, 36.0, 32.0, 37.0, 29.0, 25.0, 37.0, 52.0, 44.0, 32.0, 37.0, 38.0, 40.0, 34.0, 36.0, 33.0, 26.0, 22.0, 23.0, 18.0, 26.0, 13.0, 18.0, 12.0, 8.0, 7.0, 7.0, 7.0, 5.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7316498756408691, -1.6734554767608643, -1.6152609586715698, -1.557066559791565, -1.4988720417022705, -1.4406776428222656, -1.3824831247329712, -1.3242887258529663, -1.2660942077636719, -1.207899808883667, -1.1497052907943726, -1.0915108919143677, -1.0333163738250732, -0.9751219749450684, -0.9169274568557739, -0.858733057975769, -0.8005385994911194, -0.7423441410064697, -0.6841496825218201, -0.6259552240371704, -0.5677607655525208, -0.5095663070678711, -0.4513718783855438, -0.39317741990089417, -0.3349829614162445, -0.27678850293159485, -0.2185940444469452, -0.16039960086345673, -0.10220514237880707, -0.044010698795318604, 0.014183759689331055, 0.07237821817398071, 0.13057267665863037, 0.18876713514328003, 0.2469615936279297, 0.30515605211257935, 0.363350510597229, 0.4215449392795563, 0.47973939776420593, 0.5379338264465332, 0.5961283445358276, 0.6543228030204773, 0.712517261505127, 0.7707117199897766, 0.8289061784744263, 0.8871005773544312, 0.9452950954437256, 1.0034894943237305, 1.0616838932037354, 1.1198782920837402, 1.1780728101730347, 1.2362672090530396, 1.294461727142334, 1.3526561260223389, 1.4108506441116333, 1.4690450429916382, 1.5272395610809326, 1.5854339599609375, 1.643628478050232, 1.7018228769302368, 1.7600173950195312, 1.8182117938995361, 1.8764063119888306, 1.9346007108688354, 1.9927952289581299]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 18.0, 15.0, 23.0, 38.0, 75.0, 123.0, 150.0, 253.0, 431.0, 660.0, 1107.0, 1918.0, 3246.0, 6093.0, 11105.0, 20615.0, 39160.0, 73818.0, 134500.0, 211318.0, 220414.0, 147458.0, 81425.0, 43648.0, 23108.0, 12175.0, 6649.0, 3775.0, 1994.0, 1231.0, 764.0, 483.0, 260.0, 176.0, 113.0, 56.0, 46.0, 33.0, 20.0, 15.0, 12.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.32568359375, -0.3155326843261719, -0.30538177490234375, -0.2952308654785156, -0.2850799560546875, -0.2749290466308594, -0.26477813720703125, -0.2546272277832031, -0.244476318359375, -0.23432540893554688, -0.22417449951171875, -0.21402359008789062, -0.2038726806640625, -0.19372177124023438, -0.18357086181640625, -0.17341995239257812, -0.16326904296875, -0.15311813354492188, -0.14296722412109375, -0.13281631469726562, -0.1226654052734375, -0.11251449584960938, -0.10236358642578125, -0.09221267700195312, -0.082061767578125, -0.07191085815429688, -0.06175994873046875, -0.051609039306640625, -0.0414581298828125, -0.031307220458984375, -0.02115631103515625, -0.011005401611328125, -0.0008544921875, 0.009296417236328125, 0.01944732666015625, 0.029598236083984375, 0.0397491455078125, 0.049900054931640625, 0.06005096435546875, 0.07020187377929688, 0.080352783203125, 0.09050369262695312, 0.10065460205078125, 0.11080551147460938, 0.1209564208984375, 0.13110733032226562, 0.14125823974609375, 0.15140914916992188, 0.16156005859375, 0.17171096801757812, 0.18186187744140625, 0.19201278686523438, 0.2021636962890625, 0.21231460571289062, 0.22246551513671875, 0.23261642456054688, 0.242767333984375, 0.2529182434082031, 0.26306915283203125, 0.2732200622558594, 0.2833709716796875, 0.2935218811035156, 0.30367279052734375, 0.3138236999511719, 0.323974609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 17.0, 5.0, 13.0, 9.0, 11.0, 20.0, 22.0, 19.0, 23.0, 30.0, 34.0, 33.0, 30.0, 18.0, 32.0, 33.0, 48.0, 48.0, 42.0, 51.0, 53.0, 37.0, 42.0, 41.0, 41.0, 39.0, 29.0, 32.0, 18.0, 12.0, 20.0, 17.0, 12.0, 15.0, 6.0, 12.0, 7.0, 7.0, 8.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.25, -2.1741943359375, -2.098388671875, -2.0225830078125, -1.94677734375, -1.8709716796875, -1.795166015625, -1.7193603515625, -1.6435546875, -1.5677490234375, -1.491943359375, -1.4161376953125, -1.34033203125, -1.2645263671875, -1.188720703125, -1.1129150390625, -1.037109375, -0.9613037109375, -0.885498046875, -0.8096923828125, -0.73388671875, -0.6580810546875, -0.582275390625, -0.5064697265625, -0.4306640625, -0.3548583984375, -0.279052734375, -0.2032470703125, -0.12744140625, -0.0516357421875, 0.024169921875, 0.0999755859375, 0.17578125, 0.2515869140625, 0.327392578125, 0.4031982421875, 0.47900390625, 0.5548095703125, 0.630615234375, 0.7064208984375, 0.7822265625, 0.8580322265625, 0.933837890625, 1.0096435546875, 1.08544921875, 1.1612548828125, 1.237060546875, 1.3128662109375, 1.388671875, 1.4644775390625, 1.540283203125, 1.6160888671875, 1.69189453125, 1.7677001953125, 1.843505859375, 1.9193115234375, 1.9951171875, 2.0709228515625, 2.146728515625, 2.2225341796875, 2.29833984375, 2.3741455078125, 2.449951171875, 2.5257568359375, 2.6015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 10.0, 9.0, 9.0, 13.0, 24.0, 39.0, 49.0, 61.0, 70.0, 110.0, 151.0, 201.0, 363.0, 497.0, 749.0, 1258.0, 2142.0, 3781.0, 7894.0, 17018.0, 47203.0, 830002.0, 93310.0, 22229.0, 9632.0, 4901.0, 2628.0, 1528.0, 882.0, 560.0, 390.0, 235.0, 169.0, 111.0, 82.0, 63.0, 36.0, 34.0, 24.0, 20.0, 22.0, 11.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.8016128540039062, -0.7736358642578125, -0.7456588745117188, -0.717681884765625, -0.6897048950195312, -0.6617279052734375, -0.6337509155273438, -0.60577392578125, -0.5777969360351562, -0.5498199462890625, -0.5218429565429688, -0.493865966796875, -0.46588897705078125, -0.4379119873046875, -0.40993499755859375, -0.3819580078125, -0.35398101806640625, -0.3260040283203125, -0.29802703857421875, -0.270050048828125, -0.24207305908203125, -0.2140960693359375, -0.18611907958984375, -0.15814208984375, -0.13016510009765625, -0.1021881103515625, -0.07421112060546875, -0.046234130859375, -0.01825714111328125, 0.0097198486328125, 0.03769683837890625, 0.065673828125, 0.09365081787109375, 0.1216278076171875, 0.14960479736328125, 0.177581787109375, 0.20555877685546875, 0.2335357666015625, 0.26151275634765625, 0.28948974609375, 0.31746673583984375, 0.3454437255859375, 0.37342071533203125, 0.401397705078125, 0.42937469482421875, 0.4573516845703125, 0.48532867431640625, 0.5133056640625, 0.5412826538085938, 0.5692596435546875, 0.5972366333007812, 0.625213623046875, 0.6531906127929688, 0.6811676025390625, 0.7091445922851562, 0.73712158203125, 0.7650985717773438, 0.7930755615234375, 0.8210525512695312, 0.849029541015625, 0.8770065307617188, 0.9049835205078125, 0.9329605102539062, 0.9609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 5.0, 10.0, 11.0, 12.0, 13.0, 13.0, 17.0, 30.0, 29.0, 16.0, 27.0, 30.0, 32.0, 30.0, 30.0, 37.0, 38.0, 34.0, 34.0, 41.0, 42.0, 48.0, 38.0, 36.0, 34.0, 28.0, 23.0, 23.0, 19.0, 23.0, 23.0, 22.0, 24.0, 15.0, 17.0, 10.0, 16.0, 11.0, 7.0, 8.0, 3.0, 4.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2261810302734375, -1.183807373046875, -1.1414337158203125, -1.09906005859375, -1.0566864013671875, -1.014312744140625, -0.9719390869140625, -0.9295654296875, -0.8871917724609375, -0.844818115234375, -0.8024444580078125, -0.76007080078125, -0.7176971435546875, -0.675323486328125, -0.6329498291015625, -0.590576171875, -0.5482025146484375, -0.505828857421875, -0.4634552001953125, -0.42108154296875, -0.3787078857421875, -0.336334228515625, -0.2939605712890625, -0.2515869140625, -0.2092132568359375, -0.166839599609375, -0.1244659423828125, -0.08209228515625, -0.0397186279296875, 0.002655029296875, 0.0450286865234375, 0.08740234375, 0.1297760009765625, 0.172149658203125, 0.2145233154296875, 0.25689697265625, 0.2992706298828125, 0.341644287109375, 0.3840179443359375, 0.4263916015625, 0.4687652587890625, 0.511138916015625, 0.5535125732421875, 0.59588623046875, 0.6382598876953125, 0.680633544921875, 0.7230072021484375, 0.765380859375, 0.8077545166015625, 0.850128173828125, 0.8925018310546875, 0.93487548828125, 0.9772491455078125, 1.019622802734375, 1.0619964599609375, 1.1043701171875, 1.1467437744140625, 1.189117431640625, 1.2314910888671875, 1.27386474609375, 1.3162384033203125, 1.358612060546875, 1.4009857177734375, 1.443359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 9.0, 12.0, 24.0, 15.0, 27.0, 46.0, 59.0, 90.0, 109.0, 210.0, 308.0, 516.0, 731.0, 1193.0, 1766.0, 2802.0, 4689.0, 7983.0, 14481.0, 28652.0, 596362.0, 328898.0, 26547.0, 13487.0, 7548.0, 4452.0, 2775.0, 1746.0, 1026.0, 689.0, 425.0, 308.0, 195.0, 127.0, 73.0, 47.0, 36.0, 31.0, 21.0, 14.0, 7.0, 12.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1768798828125, -0.17181968688964844, -0.16675949096679688, -0.1616992950439453, -0.15663909912109375, -0.1515789031982422, -0.14651870727539062, -0.14145851135253906, -0.1363983154296875, -0.13133811950683594, -0.12627792358398438, -0.12121772766113281, -0.11615753173828125, -0.11109733581542969, -0.10603713989257812, -0.10097694396972656, -0.095916748046875, -0.09085655212402344, -0.08579635620117188, -0.08073616027832031, -0.07567596435546875, -0.07061576843261719, -0.06555557250976562, -0.06049537658691406, -0.0554351806640625, -0.05037498474121094, -0.045314788818359375, -0.04025459289550781, -0.03519439697265625, -0.030134201049804688, -0.025074005126953125, -0.020013809204101562, -0.01495361328125, -0.009893417358398438, -0.004833221435546875, 0.0002269744873046875, 0.00528717041015625, 0.010347366333007812, 0.015407562255859375, 0.020467758178710938, 0.0255279541015625, 0.030588150024414062, 0.035648345947265625, 0.04070854187011719, 0.04576873779296875, 0.05082893371582031, 0.055889129638671875, 0.06094932556152344, 0.066009521484375, 0.07106971740722656, 0.07612991333007812, 0.08119010925292969, 0.08625030517578125, 0.09131050109863281, 0.09637069702148438, 0.10143089294433594, 0.1064910888671875, 0.11155128479003906, 0.11661148071289062, 0.12167167663574219, 0.12673187255859375, 0.1317920684814453, 0.13685226440429688, 0.14191246032714844, 0.14697265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 9.0, 11.0, 17.0, 24.0, 19.0, 38.0, 33.0, 48.0, 46.0, 56.0, 52.0, 67.0, 74.0, 56.0, 63.0, 56.0, 51.0, 43.0, 32.0, 29.0, 38.0, 30.0, 13.0, 17.0, 11.0, 13.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.1313858926296234e-05, -3.0143186450004578e-05, -2.897251397371292e-05, -2.7801841497421265e-05, -2.6631169021129608e-05, -2.546049654483795e-05, -2.4289824068546295e-05, -2.311915159225464e-05, -2.1948479115962982e-05, -2.0777806639671326e-05, -1.960713416337967e-05, -1.8436461687088013e-05, -1.7265789210796356e-05, -1.60951167345047e-05, -1.4924444258213043e-05, -1.3753771781921387e-05, -1.258309930562973e-05, -1.1412426829338074e-05, -1.0241754353046417e-05, -9.07108187675476e-06, -7.900409400463104e-06, -6.729736924171448e-06, -5.559064447879791e-06, -4.388391971588135e-06, -3.2177194952964783e-06, -2.0470470190048218e-06, -8.763745427131653e-07, 2.942979335784912e-07, 1.4649704098701477e-06, 2.635642886161804e-06, 3.8063153624534607e-06, 4.976987838745117e-06, 6.147660315036774e-06, 7.31833279132843e-06, 8.489005267620087e-06, 9.659677743911743e-06, 1.08303502202034e-05, 1.2001022696495056e-05, 1.3171695172786713e-05, 1.4342367649078369e-05, 1.5513040125370026e-05, 1.6683712601661682e-05, 1.785438507795334e-05, 1.9025057554244995e-05, 2.019573003053665e-05, 2.1366402506828308e-05, 2.2537074983119965e-05, 2.370774745941162e-05, 2.4878419935703278e-05, 2.6049092411994934e-05, 2.721976488828659e-05, 2.8390437364578247e-05, 2.9561109840869904e-05, 3.073178231716156e-05, 3.1902454793453217e-05, 3.307312726974487e-05, 3.424379974603653e-05, 3.5414472222328186e-05, 3.658514469861984e-05, 3.77558171749115e-05, 3.8926489651203156e-05, 4.009716212749481e-05, 4.126783460378647e-05, 4.2438507080078125e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 12.0, 29.0, 50.0, 55.0, 88.0, 168.0, 244.0, 338.0, 524.0, 938.0, 1530.0, 2553.0, 4356.0, 7806.0, 14568.0, 27175.0, 51326.0, 97521.0, 170502.0, 231786.0, 192073.0, 113840.0, 60271.0, 31694.0, 17046.0, 9338.0, 5179.0, 3035.0, 1673.0, 1027.0, 678.0, 361.0, 242.0, 156.0, 120.0, 82.0, 50.0, 40.0, 16.0, 18.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058837890625, -0.056708335876464844, -0.05457878112792969, -0.05244922637939453, -0.050319671630859375, -0.04819011688232422, -0.04606056213378906, -0.043931007385253906, -0.04180145263671875, -0.039671897888183594, -0.03754234313964844, -0.03541278839111328, -0.033283233642578125, -0.03115367889404297, -0.029024124145507812, -0.026894569396972656, -0.0247650146484375, -0.022635459899902344, -0.020505905151367188, -0.01837635040283203, -0.016246795654296875, -0.014117240905761719, -0.011987686157226562, -0.009858131408691406, -0.00772857666015625, -0.005599021911621094, -0.0034694671630859375, -0.0013399124145507812, 0.000789642333984375, 0.0029191970825195312, 0.0050487518310546875, 0.007178306579589844, 0.009307861328125, 0.011437416076660156, 0.013566970825195312, 0.01569652557373047, 0.017826080322265625, 0.01995563507080078, 0.022085189819335938, 0.024214744567871094, 0.02634429931640625, 0.028473854064941406, 0.030603408813476562, 0.03273296356201172, 0.034862518310546875, 0.03699207305908203, 0.03912162780761719, 0.041251182556152344, 0.0433807373046875, 0.045510292053222656, 0.04763984680175781, 0.04976940155029297, 0.051898956298828125, 0.05402851104736328, 0.05615806579589844, 0.058287620544433594, 0.06041717529296875, 0.0625467300415039, 0.06467628479003906, 0.06680583953857422, 0.06893539428710938, 0.07106494903564453, 0.07319450378417969, 0.07532405853271484, 0.07745361328125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 10.0, 9.0, 12.0, 7.0, 18.0, 27.0, 21.0, 32.0, 39.0, 27.0, 48.0, 53.0, 61.0, 61.0, 70.0, 60.0, 54.0, 56.0, 49.0, 39.0, 40.0, 31.0, 37.0, 26.0, 15.0, 13.0, 9.0, 10.0, 12.0, 7.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0193328857421875, -0.018761157989501953, -0.018189430236816406, -0.01761770248413086, -0.017045974731445312, -0.016474246978759766, -0.01590251922607422, -0.015330791473388672, -0.014759063720703125, -0.014187335968017578, -0.013615608215332031, -0.013043880462646484, -0.012472152709960938, -0.01190042495727539, -0.011328697204589844, -0.010756969451904297, -0.01018524169921875, -0.009613513946533203, -0.009041786193847656, -0.00847005844116211, -0.007898330688476562, -0.007326602935791016, -0.006754875183105469, -0.006183147430419922, -0.005611419677734375, -0.005039691925048828, -0.004467964172363281, -0.0038962364196777344, -0.0033245086669921875, -0.0027527809143066406, -0.0021810531616210938, -0.0016093254089355469, -0.00103759765625, -0.0004658699035644531, 0.00010585784912109375, 0.0006775856018066406, 0.0012493133544921875, 0.0018210411071777344, 0.0023927688598632812, 0.002964496612548828, 0.003536224365234375, 0.004107952117919922, 0.004679679870605469, 0.005251407623291016, 0.0058231353759765625, 0.006394863128662109, 0.006966590881347656, 0.007538318634033203, 0.00811004638671875, 0.008681774139404297, 0.009253501892089844, 0.00982522964477539, 0.010396957397460938, 0.010968685150146484, 0.011540412902832031, 0.012112140655517578, 0.012683868408203125, 0.013255596160888672, 0.013827323913574219, 0.014399051666259766, 0.014970779418945312, 0.01554250717163086, 0.016114234924316406, 0.016685962677001953, 0.0172576904296875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 9.0, 3.0, 7.0, 4.0, 4.0, 17.0, 13.0, 21.0, 28.0, 27.0, 34.0, 51.0, 57.0, 70.0, 62.0, 64.0, 70.0, 73.0, 66.0, 61.0, 52.0, 34.0, 27.0, 28.0, 26.0, 20.0, 16.0, 9.0, 8.0, 6.0, 7.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.278392314910889, -4.133045196533203, -3.9876976013183594, -3.842350482940674, -3.697003126144409, -3.5516557693481445, -3.406308650970459, -3.2609612941741943, -3.1156139373779297, -2.970266580581665, -2.8249192237854004, -2.679572105407715, -2.53422474861145, -2.3888773918151855, -2.2435302734375, -2.0981829166412354, -1.9528355598449707, -1.807488203048706, -1.662140965461731, -1.5167937278747559, -1.3714463710784912, -1.2260990142822266, -1.0807517766952515, -0.9354045391082764, -0.7900571823120117, -0.6447098851203918, -0.499362587928772, -0.3540152907371521, -0.20866799354553223, -0.06332069635391235, 0.08202660083770752, 0.22737383842468262, 0.37272071838378906, 0.5180680155754089, 0.6634153127670288, 0.8087626099586487, 0.9541099071502686, 1.0994572639465332, 1.2448045015335083, 1.3901517391204834, 1.535499095916748, 1.6808464527130127, 1.8261936902999878, 1.971540927886963, 2.1168882846832275, 2.262235641479492, 2.4075827598571777, 2.5529301166534424, 2.698277473449707, 2.8436248302459717, 2.9889721870422363, 3.134319305419922, 3.2796666622161865, 3.425014019012451, 3.5703611373901367, 3.7157084941864014, 3.861055850982666, 4.006402969360352, 4.151750564575195, 4.297097682952881, 4.442444801330566, 4.58779239654541, 4.733139514923096, 4.878486633300781, 5.023834228515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 10.0, 11.0, 11.0, 16.0, 8.0, 13.0, 17.0, 18.0, 25.0, 22.0, 19.0, 28.0, 26.0, 33.0, 28.0, 33.0, 37.0, 31.0, 27.0, 35.0, 54.0, 41.0, 35.0, 40.0, 30.0, 41.0, 38.0, 34.0, 30.0, 27.0, 23.0, 23.0, 18.0, 24.0, 12.0, 19.0, 11.0, 8.0, 10.0, 4.0, 9.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7050451040267944, -1.6472798585891724, -1.5895144939422607, -1.5317492485046387, -1.473983883857727, -1.416218638420105, -1.3584532737731934, -1.3006880283355713, -1.2429227828979492, -1.1851575374603271, -1.1273921728134155, -1.0696269273757935, -1.0118615627288818, -0.9540963172912598, -0.8963310122489929, -0.8385657072067261, -0.7808003425598145, -0.7230350375175476, -0.6652697324752808, -0.6075044870376587, -0.5497391223907471, -0.4919738471508026, -0.43420857191085815, -0.3764432668685913, -0.31867796182632446, -0.2609126567840576, -0.20314736664295197, -0.1453820765018463, -0.08761677145957947, -0.029851466417312622, 0.027913808822631836, 0.08567911386489868, 0.14344441890716553, 0.20120972394943237, 0.2589750289916992, 0.3167403042316437, 0.3745056092739105, 0.43227091431617737, 0.4900361895561218, 0.5478014945983887, 0.6055667996406555, 0.6633321046829224, 0.7210974097251892, 0.778862714767456, 0.8366279602050781, 0.8943933248519897, 0.9521585702896118, 1.0099239349365234, 1.0676891803741455, 1.1254544258117676, 1.1832197904586792, 1.2409850358963013, 1.298750400543213, 1.356515645980835, 1.414280891418457, 1.4720462560653687, 1.5298116207122803, 1.5875768661499023, 1.645342230796814, 1.703107476234436, 1.7608728408813477, 1.8186380863189697, 1.8764033317565918, 1.9341686964035034, 1.9919339418411255]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 11.0, 20.0, 20.0, 42.0, 77.0, 98.0, 128.0, 218.0, 349.0, 585.0, 975.0, 1551.0, 2663.0, 4779.0, 8291.0, 14726.0, 26864.0, 48478.0, 82217.0, 130019.0, 174190.0, 180841.0, 144901.0, 96157.0, 57218.0, 31781.0, 18156.0, 9759.0, 5586.0, 3123.0, 1839.0, 1040.0, 675.0, 428.0, 264.0, 179.0, 106.0, 79.0, 32.0, 18.0, 24.0, 12.0, 10.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.412353515625, -2.32666015625, -2.240966796875, -2.1552734375, -2.069580078125, -1.98388671875, -1.898193359375, -1.8125, -1.726806640625, -1.64111328125, -1.555419921875, -1.4697265625, -1.384033203125, -1.29833984375, -1.212646484375, -1.126953125, -1.041259765625, -0.95556640625, -0.869873046875, -0.7841796875, -0.698486328125, -0.61279296875, -0.527099609375, -0.44140625, -0.355712890625, -0.27001953125, -0.184326171875, -0.0986328125, -0.012939453125, 0.07275390625, 0.158447265625, 0.244140625, 0.329833984375, 0.41552734375, 0.501220703125, 0.5869140625, 0.672607421875, 0.75830078125, 0.843994140625, 0.9296875, 1.015380859375, 1.10107421875, 1.186767578125, 1.2724609375, 1.358154296875, 1.44384765625, 1.529541015625, 1.615234375, 1.700927734375, 1.78662109375, 1.872314453125, 1.9580078125, 2.043701171875, 2.12939453125, 2.215087890625, 2.30078125, 2.386474609375, 2.47216796875, 2.557861328125, 2.6435546875, 2.729248046875, 2.81494140625, 2.900634765625, 2.986328125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 13.0, 6.0, 16.0, 13.0, 17.0, 26.0, 24.0, 15.0, 14.0, 27.0, 22.0, 29.0, 26.0, 36.0, 29.0, 39.0, 33.0, 33.0, 33.0, 30.0, 40.0, 45.0, 43.0, 40.0, 37.0, 35.0, 35.0, 31.0, 30.0, 18.0, 27.0, 23.0, 19.0, 17.0, 7.0, 13.0, 15.0, 10.0, 3.0, 4.0, 8.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.09765625, -2.0311279296875, -1.964599609375, -1.8980712890625, -1.83154296875, -1.7650146484375, -1.698486328125, -1.6319580078125, -1.5654296875, -1.4989013671875, -1.432373046875, -1.3658447265625, -1.29931640625, -1.2327880859375, -1.166259765625, -1.0997314453125, -1.033203125, -0.9666748046875, -0.900146484375, -0.8336181640625, -0.76708984375, -0.7005615234375, -0.634033203125, -0.5675048828125, -0.5009765625, -0.4344482421875, -0.367919921875, -0.3013916015625, -0.23486328125, -0.1683349609375, -0.101806640625, -0.0352783203125, 0.03125, 0.0977783203125, 0.164306640625, 0.2308349609375, 0.29736328125, 0.3638916015625, 0.430419921875, 0.4969482421875, 0.5634765625, 0.6300048828125, 0.696533203125, 0.7630615234375, 0.82958984375, 0.8961181640625, 0.962646484375, 1.0291748046875, 1.095703125, 1.1622314453125, 1.228759765625, 1.2952880859375, 1.36181640625, 1.4283447265625, 1.494873046875, 1.5614013671875, 1.6279296875, 1.6944580078125, 1.760986328125, 1.8275146484375, 1.89404296875, 1.9605712890625, 2.027099609375, 2.0936279296875, 2.16015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 7.0, 8.0, 15.0, 18.0, 46.0, 42.0, 68.0, 98.0, 179.0, 226.0, 350.0, 587.0, 903.0, 1424.0, 2294.0, 3856.0, 6355.0, 10891.0, 18187.0, 30565.0, 49960.0, 79273.0, 115614.0, 149237.0, 159552.0, 139697.0, 103913.0, 68673.0, 42416.0, 25448.0, 15387.0, 8994.0, 5552.0, 3264.0, 1986.0, 1254.0, 737.0, 485.0, 335.0, 210.0, 140.0, 96.0, 62.0, 50.0, 34.0, 18.0, 10.0, 16.0, 12.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.443359375, -2.365386962890625, -2.28741455078125, -2.209442138671875, -2.1314697265625, -2.053497314453125, -1.97552490234375, -1.897552490234375, -1.819580078125, -1.741607666015625, -1.66363525390625, -1.585662841796875, -1.5076904296875, -1.429718017578125, -1.35174560546875, -1.273773193359375, -1.19580078125, -1.117828369140625, -1.03985595703125, -0.961883544921875, -0.8839111328125, -0.805938720703125, -0.72796630859375, -0.649993896484375, -0.572021484375, -0.494049072265625, -0.41607666015625, -0.338104248046875, -0.2601318359375, -0.182159423828125, -0.10418701171875, -0.026214599609375, 0.0517578125, 0.129730224609375, 0.20770263671875, 0.285675048828125, 0.3636474609375, 0.441619873046875, 0.51959228515625, 0.597564697265625, 0.675537109375, 0.753509521484375, 0.83148193359375, 0.909454345703125, 0.9874267578125, 1.065399169921875, 1.14337158203125, 1.221343994140625, 1.29931640625, 1.377288818359375, 1.45526123046875, 1.533233642578125, 1.6112060546875, 1.689178466796875, 1.76715087890625, 1.845123291015625, 1.923095703125, 2.001068115234375, 2.07904052734375, 2.157012939453125, 2.2349853515625, 2.312957763671875, 2.39093017578125, 2.468902587890625, 2.546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 6.0, 13.0, 14.0, 14.0, 19.0, 22.0, 18.0, 22.0, 28.0, 17.0, 16.0, 23.0, 30.0, 30.0, 42.0, 32.0, 45.0, 34.0, 24.0, 37.0, 41.0, 39.0, 45.0, 37.0, 29.0, 51.0, 32.0, 34.0, 21.0, 21.0, 19.0, 17.0, 13.0, 16.0, 13.0, 15.0, 10.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2705078125, -1.2288055419921875, -1.187103271484375, -1.1454010009765625, -1.10369873046875, -1.0619964599609375, -1.020294189453125, -0.9785919189453125, -0.9368896484375, -0.8951873779296875, -0.853485107421875, -0.8117828369140625, -0.77008056640625, -0.7283782958984375, -0.686676025390625, -0.6449737548828125, -0.603271484375, -0.5615692138671875, -0.519866943359375, -0.4781646728515625, -0.43646240234375, -0.3947601318359375, -0.353057861328125, -0.3113555908203125, -0.2696533203125, -0.2279510498046875, -0.186248779296875, -0.1445465087890625, -0.10284423828125, -0.0611419677734375, -0.019439697265625, 0.0222625732421875, 0.06396484375, 0.1056671142578125, 0.147369384765625, 0.1890716552734375, 0.23077392578125, 0.2724761962890625, 0.314178466796875, 0.3558807373046875, 0.3975830078125, 0.4392852783203125, 0.480987548828125, 0.5226898193359375, 0.56439208984375, 0.6060943603515625, 0.647796630859375, 0.6894989013671875, 0.731201171875, 0.7729034423828125, 0.814605712890625, 0.8563079833984375, 0.89801025390625, 0.9397125244140625, 0.981414794921875, 1.0231170654296875, 1.0648193359375, 1.1065216064453125, 1.148223876953125, 1.1899261474609375, 1.23162841796875, 1.2733306884765625, 1.315032958984375, 1.3567352294921875, 1.3984375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 4.0, 15.0, 12.0, 16.0, 18.0, 34.0, 52.0, 95.0, 112.0, 180.0, 260.0, 425.0, 645.0, 1055.0, 1622.0, 2684.0, 4336.0, 7315.0, 12311.0, 21421.0, 38694.0, 68384.0, 118096.0, 177524.0, 201459.0, 158868.0, 99524.0, 56996.0, 31973.0, 18074.0, 10507.0, 6053.0, 3822.0, 2150.0, 1345.0, 907.0, 549.0, 307.0, 249.0, 162.0, 103.0, 63.0, 35.0, 33.0, 24.0, 14.0, 10.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2935028076171875, -1.246185302734375, -1.1988677978515625, -1.15155029296875, -1.1042327880859375, -1.056915283203125, -1.0095977783203125, -0.9622802734375, -0.9149627685546875, -0.867645263671875, -0.8203277587890625, -0.77301025390625, -0.7256927490234375, -0.678375244140625, -0.6310577392578125, -0.583740234375, -0.5364227294921875, -0.489105224609375, -0.4417877197265625, -0.39447021484375, -0.3471527099609375, -0.299835205078125, -0.2525177001953125, -0.2052001953125, -0.1578826904296875, -0.110565185546875, -0.0632476806640625, -0.01593017578125, 0.0313873291015625, 0.078704833984375, 0.1260223388671875, 0.17333984375, 0.2206573486328125, 0.267974853515625, 0.3152923583984375, 0.36260986328125, 0.4099273681640625, 0.457244873046875, 0.5045623779296875, 0.5518798828125, 0.5991973876953125, 0.646514892578125, 0.6938323974609375, 0.74114990234375, 0.7884674072265625, 0.835784912109375, 0.8831024169921875, 0.930419921875, 0.9777374267578125, 1.025054931640625, 1.0723724365234375, 1.11968994140625, 1.1670074462890625, 1.214324951171875, 1.2616424560546875, 1.3089599609375, 1.3562774658203125, 1.403594970703125, 1.4509124755859375, 1.49822998046875, 1.5455474853515625, 1.592864990234375, 1.6401824951171875, 1.6875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 10.0, 17.0, 16.0, 20.0, 28.0, 40.0, 36.0, 47.0, 67.0, 83.0, 69.0, 79.0, 76.0, 71.0, 69.0, 49.0, 51.0, 35.0, 27.0, 27.0, 11.0, 18.0, 10.0, 10.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017762184143066406, -0.00017231516540050507, -0.00016700848937034607, -0.00016170181334018707, -0.00015639513731002808, -0.00015108846127986908, -0.00014578178524971008, -0.00014047510921955109, -0.0001351684331893921, -0.0001298617571592331, -0.0001245550811290741, -0.0001192484050989151, -0.0001139417290687561, -0.00010863505303859711, -0.00010332837700843811, -9.802170097827911e-05, -9.271502494812012e-05, -8.740834891796112e-05, -8.210167288780212e-05, -7.679499685764313e-05, -7.148832082748413e-05, -6.618164479732513e-05, -6.087496876716614e-05, -5.556829273700714e-05, -5.0261616706848145e-05, -4.495494067668915e-05, -3.964826464653015e-05, -3.4341588616371155e-05, -2.9034912586212158e-05, -2.372823655605316e-05, -1.8421560525894165e-05, -1.3114884495735168e-05, -7.808208465576172e-06, -2.5015324354171753e-06, 2.8051435947418213e-06, 8.111819624900818e-06, 1.3418495655059814e-05, 1.872517168521881e-05, 2.4031847715377808e-05, 2.9338523745536804e-05, 3.46451997756958e-05, 3.99518758058548e-05, 4.5258551836013794e-05, 5.056522786617279e-05, 5.587190389633179e-05, 6.117857992649078e-05, 6.648525595664978e-05, 7.179193198680878e-05, 7.709860801696777e-05, 8.240528404712677e-05, 8.771196007728577e-05, 9.301863610744476e-05, 9.832531213760376e-05, 0.00010363198816776276, 0.00010893866419792175, 0.00011424534022808075, 0.00011955201625823975, 0.00012485869228839874, 0.00013016536831855774, 0.00013547204434871674, 0.00014077872037887573, 0.00014608539640903473, 0.00015139207243919373, 0.00015669874846935272, 0.00016200542449951172]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 5.0, 9.0, 17.0, 30.0, 50.0, 66.0, 84.0, 142.0, 216.0, 305.0, 439.0, 595.0, 956.0, 1435.0, 2398.0, 3601.0, 5798.0, 9505.0, 15782.0, 26081.0, 44170.0, 73606.0, 115551.0, 160099.0, 175035.0, 148360.0, 103196.0, 64003.0, 37971.0, 22636.0, 13627.0, 8365.0, 5224.0, 3295.0, 2029.0, 1322.0, 851.0, 585.0, 334.0, 289.0, 146.0, 115.0, 77.0, 39.0, 28.0, 29.0, 15.0, 13.0, 11.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.3056640625, -1.2665252685546875, -1.227386474609375, -1.1882476806640625, -1.14910888671875, -1.1099700927734375, -1.070831298828125, -1.0316925048828125, -0.9925537109375, -0.9534149169921875, -0.914276123046875, -0.8751373291015625, -0.83599853515625, -0.7968597412109375, -0.757720947265625, -0.7185821533203125, -0.679443359375, -0.6403045654296875, -0.601165771484375, -0.5620269775390625, -0.52288818359375, -0.4837493896484375, -0.444610595703125, -0.4054718017578125, -0.3663330078125, -0.3271942138671875, -0.288055419921875, -0.2489166259765625, -0.20977783203125, -0.1706390380859375, -0.131500244140625, -0.0923614501953125, -0.05322265625, -0.0140838623046875, 0.025054931640625, 0.0641937255859375, 0.10333251953125, 0.1424713134765625, 0.181610107421875, 0.2207489013671875, 0.2598876953125, 0.2990264892578125, 0.338165283203125, 0.3773040771484375, 0.41644287109375, 0.4555816650390625, 0.494720458984375, 0.5338592529296875, 0.572998046875, 0.6121368408203125, 0.651275634765625, 0.6904144287109375, 0.72955322265625, 0.7686920166015625, 0.807830810546875, 0.8469696044921875, 0.8861083984375, 0.9252471923828125, 0.964385986328125, 1.0035247802734375, 1.04266357421875, 1.0818023681640625, 1.120941162109375, 1.1600799560546875, 1.19921875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 3.0, 5.0, 9.0, 16.0, 24.0, 17.0, 20.0, 42.0, 36.0, 49.0, 52.0, 55.0, 57.0, 72.0, 55.0, 66.0, 74.0, 51.0, 50.0, 39.0, 44.0, 26.0, 22.0, 23.0, 25.0, 17.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2727622985839844, -0.26061248779296875, -0.24846267700195312, -0.2363128662109375, -0.22416305541992188, -0.21201324462890625, -0.19986343383789062, -0.187713623046875, -0.17556381225585938, -0.16341400146484375, -0.15126419067382812, -0.1391143798828125, -0.12696456909179688, -0.11481475830078125, -0.10266494750976562, -0.09051513671875, -0.07836532592773438, -0.06621551513671875, -0.054065704345703125, -0.0419158935546875, -0.029766082763671875, -0.01761627197265625, -0.005466461181640625, 0.006683349609375, 0.018833160400390625, 0.03098297119140625, 0.043132781982421875, 0.0552825927734375, 0.06743240356445312, 0.07958221435546875, 0.09173202514648438, 0.1038818359375, 0.11603164672851562, 0.12818145751953125, 0.14033126831054688, 0.1524810791015625, 0.16463088989257812, 0.17678070068359375, 0.18893051147460938, 0.201080322265625, 0.21323013305664062, 0.22537994384765625, 0.23752975463867188, 0.2496795654296875, 0.2618293762207031, 0.27397918701171875, 0.2861289978027344, 0.29827880859375, 0.3104286193847656, 0.32257843017578125, 0.3347282409667969, 0.3468780517578125, 0.3590278625488281, 0.37117767333984375, 0.3833274841308594, 0.395477294921875, 0.4076271057128906, 0.41977691650390625, 0.4319267272949219, 0.4440765380859375, 0.4562263488769531, 0.46837615966796875, 0.4805259704589844, 0.49267578125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 9.0, 9.0, 16.0, 18.0, 29.0, 26.0, 33.0, 43.0, 46.0, 64.0, 60.0, 61.0, 64.0, 71.0, 64.0, 72.0, 57.0, 47.0, 37.0, 28.0, 17.0, 29.0, 24.0, 11.0, 9.0, 4.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.868194103240967, -4.724942207336426, -4.581690311431885, -4.438438415527344, -4.2951860427856445, -4.1519341468811035, -4.0086822509765625, -3.8654303550720215, -3.7221784591674805, -3.5789265632629395, -3.4356744289398193, -3.2924225330352783, -3.1491706371307373, -3.005918502807617, -2.862666606903076, -2.719414710998535, -2.576162576675415, -2.432910680770874, -2.289658546447754, -2.146406650543213, -2.003154754638672, -1.8599027395248413, -1.7166507244110107, -1.5733988285064697, -1.4301468133926392, -1.2868947982788086, -1.1436429023742676, -1.000390887260437, -0.8571389317512512, -0.7138869762420654, -0.5706349611282349, -0.42738306522369385, -0.2841310501098633, -0.1408790796995163, 0.0023728907108306885, 0.14562487602233887, 0.28887683153152466, 0.43212878704071045, 0.575380802154541, 0.718632698059082, 0.8618847131729126, 1.0051367282867432, 1.1483886241912842, 1.2916406393051147, 1.4348926544189453, 1.5781445503234863, 1.721396565437317, 1.864648461341858, 2.0079004764556885, 2.1511523723602295, 2.2944045066833496, 2.4376564025878906, 2.5809082984924316, 2.7241601943969727, 2.8674123287200928, 3.010664224624634, 3.153916358947754, 3.297168254852295, 3.440420389175415, 3.583672285079956, 3.726924180984497, 3.870176315307617, 4.013428211212158, 4.156680107116699, 4.29993200302124]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 7.0, 6.0, 12.0, 11.0, 12.0, 16.0, 12.0, 18.0, 27.0, 19.0, 14.0, 22.0, 22.0, 36.0, 39.0, 24.0, 26.0, 36.0, 34.0, 46.0, 41.0, 39.0, 47.0, 36.0, 36.0, 38.0, 37.0, 27.0, 31.0, 37.0, 25.0, 26.0, 24.0, 21.0, 16.0, 10.0, 14.0, 7.0, 8.0, 13.0, 5.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.992197871208191, -1.9318187236785889, -1.8714396953582764, -1.8110605478286743, -1.7506814002990723, -1.6903023719787598, -1.6299232244491577, -1.5695440769195557, -1.5091650485992432, -1.4487859010696411, -1.3884068727493286, -1.3280277252197266, -1.2676485776901245, -1.2072694301605225, -1.14689040184021, -1.086511254310608, -1.0261321067810059, -0.9657530188560486, -0.9053738713264465, -0.8449947834014893, -0.7846156358718872, -0.7242365479469299, -0.6638574600219727, -0.6034783124923706, -0.5430992245674133, -0.48272010684013367, -0.422340989112854, -0.36196190118789673, -0.30158278346061707, -0.2412036657333374, -0.18082457780838013, -0.12044546008110046, -0.06006622314453125, 0.00031288713216781616, 0.06069199740886688, 0.12107110023498535, 0.18145021796226501, 0.24182933568954468, 0.30220842361450195, 0.3625875413417816, 0.4229666590690613, 0.48334577679634094, 0.5437248945236206, 0.6041039824485779, 0.6644830703735352, 0.7248622179031372, 0.7852413058280945, 0.8456203937530518, 0.9059995412826538, 0.9663786292076111, 1.0267577171325684, 1.0871368646621704, 1.1475160121917725, 1.207895040512085, 1.268274188041687, 1.328653335571289, 1.3890323638916016, 1.4494115114212036, 1.5097905397415161, 1.5701696872711182, 1.6305488348007202, 1.6909279823303223, 1.7513070106506348, 1.8116861581802368, 1.8720653057098389]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 12.0, 17.0, 18.0, 22.0, 43.0, 74.0, 133.0, 199.0, 298.0, 498.0, 832.0, 1419.0, 2618.0, 4620.0, 8675.0, 16585.0, 34867.0, 79247.0, 198938.0, 562609.0, 1347464.0, 1192420.0, 452143.0, 162392.0, 66632.0, 30030.0, 14683.0, 7471.0, 3989.0, 2204.0, 1272.0, 765.0, 438.0, 247.0, 158.0, 101.0, 58.0, 33.0, 26.0, 10.0, 11.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.64776611328125, -4.4869384765625, -4.32611083984375, -4.165283203125, -4.00445556640625, -3.8436279296875, -3.68280029296875, -3.52197265625, -3.36114501953125, -3.2003173828125, -3.03948974609375, -2.878662109375, -2.71783447265625, -2.5570068359375, -2.39617919921875, -2.2353515625, -2.07452392578125, -1.9136962890625, -1.75286865234375, -1.592041015625, -1.43121337890625, -1.2703857421875, -1.10955810546875, -0.94873046875, -0.78790283203125, -0.6270751953125, -0.46624755859375, -0.305419921875, -0.14459228515625, 0.0162353515625, 0.17706298828125, 0.337890625, 0.49871826171875, 0.6595458984375, 0.82037353515625, 0.981201171875, 1.14202880859375, 1.3028564453125, 1.46368408203125, 1.62451171875, 1.78533935546875, 1.9461669921875, 2.10699462890625, 2.267822265625, 2.42864990234375, 2.5894775390625, 2.75030517578125, 2.9111328125, 3.07196044921875, 3.2327880859375, 3.39361572265625, 3.554443359375, 3.71527099609375, 3.8760986328125, 4.03692626953125, 4.19775390625, 4.35858154296875, 4.5194091796875, 4.68023681640625, 4.841064453125, 5.00189208984375, 5.1627197265625, 5.32354736328125, 5.484375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 8.0, 7.0, 13.0, 9.0, 19.0, 17.0, 20.0, 17.0, 11.0, 31.0, 20.0, 38.0, 29.0, 34.0, 44.0, 41.0, 42.0, 38.0, 41.0, 48.0, 35.0, 40.0, 36.0, 49.0, 30.0, 41.0, 32.0, 34.0, 22.0, 30.0, 18.0, 24.0, 15.0, 13.0, 8.0, 11.0, 10.0, 8.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.8583984375, -1.8057098388671875, -1.753021240234375, -1.7003326416015625, -1.64764404296875, -1.5949554443359375, -1.542266845703125, -1.4895782470703125, -1.4368896484375, -1.3842010498046875, -1.331512451171875, -1.2788238525390625, -1.22613525390625, -1.1734466552734375, -1.120758056640625, -1.0680694580078125, -1.015380859375, -0.9626922607421875, -0.910003662109375, -0.8573150634765625, -0.80462646484375, -0.7519378662109375, -0.699249267578125, -0.6465606689453125, -0.5938720703125, -0.5411834716796875, -0.488494873046875, -0.4358062744140625, -0.38311767578125, -0.3304290771484375, -0.277740478515625, -0.2250518798828125, -0.17236328125, -0.1196746826171875, -0.066986083984375, -0.0142974853515625, 0.03839111328125, 0.0910797119140625, 0.143768310546875, 0.1964569091796875, 0.2491455078125, 0.3018341064453125, 0.354522705078125, 0.4072113037109375, 0.45989990234375, 0.5125885009765625, 0.565277099609375, 0.6179656982421875, 0.670654296875, 0.7233428955078125, 0.776031494140625, 0.8287200927734375, 0.88140869140625, 0.9340972900390625, 0.986785888671875, 1.0394744873046875, 1.0921630859375, 1.1448516845703125, 1.197540283203125, 1.2502288818359375, 1.30291748046875, 1.3556060791015625, 1.408294677734375, 1.4609832763671875, 1.513671875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 8.0, 15.0, 20.0, 31.0, 33.0, 54.0, 86.0, 126.0, 180.0, 296.0, 420.0, 613.0, 970.0, 1446.0, 2363.0, 4023.0, 6676.0, 11517.0, 20180.0, 37937.0, 72101.0, 141521.0, 287879.0, 578844.0, 980187.0, 950174.0, 543755.0, 269077.0, 133547.0, 67561.0, 35751.0, 19595.0, 10842.0, 6314.0, 3635.0, 2349.0, 1418.0, 925.0, 592.0, 385.0, 253.0, 174.0, 123.0, 86.0, 62.0, 34.0, 24.0, 20.0, 16.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-4.07421875, -3.94671630859375, -3.8192138671875, -3.69171142578125, -3.564208984375, -3.43670654296875, -3.3092041015625, -3.18170166015625, -3.05419921875, -2.92669677734375, -2.7991943359375, -2.67169189453125, -2.544189453125, -2.41668701171875, -2.2891845703125, -2.16168212890625, -2.0341796875, -1.90667724609375, -1.7791748046875, -1.65167236328125, -1.524169921875, -1.39666748046875, -1.2691650390625, -1.14166259765625, -1.01416015625, -0.88665771484375, -0.7591552734375, -0.63165283203125, -0.504150390625, -0.37664794921875, -0.2491455078125, -0.12164306640625, 0.005859375, 0.13336181640625, 0.2608642578125, 0.38836669921875, 0.515869140625, 0.64337158203125, 0.7708740234375, 0.89837646484375, 1.02587890625, 1.15338134765625, 1.2808837890625, 1.40838623046875, 1.535888671875, 1.66339111328125, 1.7908935546875, 1.91839599609375, 2.0458984375, 2.17340087890625, 2.3009033203125, 2.42840576171875, 2.555908203125, 2.68341064453125, 2.8109130859375, 2.93841552734375, 3.06591796875, 3.19342041015625, 3.3209228515625, 3.44842529296875, 3.575927734375, 3.70343017578125, 3.8309326171875, 3.95843505859375, 4.0859375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 7.0, 11.0, 7.0, 10.0, 12.0, 16.0, 25.0, 24.0, 51.0, 51.0, 73.0, 68.0, 77.0, 107.0, 114.0, 135.0, 164.0, 200.0, 215.0, 219.0, 247.0, 272.0, 272.0, 241.0, 227.0, 205.0, 181.0, 159.0, 144.0, 105.0, 98.0, 61.0, 51.0, 47.0, 42.0, 36.0, 27.0, 12.0, 15.0, 13.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8853073120117188, -0.8531341552734375, -0.8209609985351562, -0.788787841796875, -0.7566146850585938, -0.7244415283203125, -0.6922683715820312, -0.66009521484375, -0.6279220581054688, -0.5957489013671875, -0.5635757446289062, -0.531402587890625, -0.49922943115234375, -0.4670562744140625, -0.43488311767578125, -0.4027099609375, -0.37053680419921875, -0.3383636474609375, -0.30619049072265625, -0.274017333984375, -0.24184417724609375, -0.2096710205078125, -0.17749786376953125, -0.14532470703125, -0.11315155029296875, -0.0809783935546875, -0.04880523681640625, -0.016632080078125, 0.01554107666015625, 0.0477142333984375, 0.07988739013671875, 0.112060546875, 0.14423370361328125, 0.1764068603515625, 0.20858001708984375, 0.240753173828125, 0.27292633056640625, 0.3050994873046875, 0.33727264404296875, 0.36944580078125, 0.40161895751953125, 0.4337921142578125, 0.46596527099609375, 0.498138427734375, 0.5303115844726562, 0.5624847412109375, 0.5946578979492188, 0.6268310546875, 0.6590042114257812, 0.6911773681640625, 0.7233505249023438, 0.755523681640625, 0.7876968383789062, 0.8198699951171875, 0.8520431518554688, 0.88421630859375, 0.9163894653320312, 0.9485626220703125, 0.9807357788085938, 1.012908935546875, 1.0450820922851562, 1.0772552490234375, 1.1094284057617188, 1.1416015625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 0.0, 6.0, 7.0, 11.0, 14.0, 18.0, 26.0, 41.0, 37.0, 50.0, 53.0, 86.0, 95.0, 67.0, 86.0, 84.0, 51.0, 59.0, 59.0, 33.0, 25.0, 19.0, 16.0, 13.0, 12.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.172397613525391, -6.000027179718018, -5.8276567459106445, -5.655285835266113, -5.48291540145874, -5.310544967651367, -5.138174533843994, -4.965804100036621, -4.79343318939209, -4.621062755584717, -4.448692321777344, -4.2763214111328125, -4.1039509773254395, -3.9315805435180664, -3.7592101097106934, -3.5868396759033203, -3.4144692420959473, -3.242098808288574, -3.069728136062622, -2.897357702255249, -2.724987030029297, -2.552616596221924, -2.380246162414551, -2.2078757286071777, -2.0355050563812256, -1.863134503364563, -1.6907639503479004, -1.5183935165405273, -1.3460229635238647, -1.1736524105072021, -1.001281976699829, -0.8289114236831665, -0.6565403938293457, -0.4841698706150055, -0.3117993474006653, -0.13942885398864746, 0.03294169902801514, 0.20531225204467773, 0.3776826858520508, 0.5500532388687134, 0.722423791885376, 0.8947943449020386, 1.0671648979187012, 1.2395353317260742, 1.4119058847427368, 1.5842764377593994, 1.7566468715667725, 1.929017424583435, 2.1013879776000977, 2.2737584114074707, 2.446129083633423, 2.618499517440796, 2.790870189666748, 2.963240623474121, 3.135611057281494, 3.307981491088867, 3.4803521633148193, 3.6527225971221924, 3.8250932693481445, 3.9974637031555176, 4.169834136962891, 4.342205047607422, 4.514575004577637, 4.686945915222168, 4.859316349029541]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 12.0, 10.0, 5.0, 16.0, 14.0, 19.0, 24.0, 11.0, 20.0, 18.0, 19.0, 20.0, 33.0, 30.0, 33.0, 32.0, 34.0, 28.0, 40.0, 35.0, 31.0, 40.0, 42.0, 44.0, 33.0, 25.0, 30.0, 35.0, 24.0, 21.0, 30.0, 26.0, 25.0, 26.0, 11.0, 11.0, 11.0, 8.0, 10.0, 9.0, 2.0, 8.0, 11.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.6643472909927368, -1.6124193668365479, -1.5604914426803589, -1.50856351852417, -1.4566354751586914, -1.4047075510025024, -1.3527796268463135, -1.3008517026901245, -1.2489237785339355, -1.1969958543777466, -1.1450679302215576, -1.093139886856079, -1.0412119626998901, -0.9892840385437012, -0.9373561143875122, -0.8854281902313232, -0.8335001468658447, -0.7815722227096558, -0.729644238948822, -0.6777163147926331, -0.6257883310317993, -0.5738604068756104, -0.5219324827194214, -0.47000452876091003, -0.4180765748023987, -0.36614862084388733, -0.314220666885376, -0.262292742729187, -0.21036478877067566, -0.1584368348121643, -0.10650891065597534, -0.05458095669746399, -0.0026531219482421875, 0.04927482455968857, 0.10120277106761932, 0.15313071012496948, 0.20505866408348083, 0.2569866180419922, 0.30891454219818115, 0.3608424961566925, 0.41277045011520386, 0.4646984040737152, 0.5166263580322266, 0.5685542821884155, 0.6204822063446045, 0.6724101901054382, 0.7243381142616272, 0.7762660980224609, 0.8281940221786499, 0.8801219463348389, 0.9320499300956726, 0.9839778542518616, 1.0359058380126953, 1.0878337621688843, 1.1397616863250732, 1.1916896104812622, 1.2436175346374512, 1.2955454587936401, 1.347473382949829, 1.3994014263153076, 1.4513293504714966, 1.5032572746276855, 1.5551851987838745, 1.6071131229400635, 1.659041166305542]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 22.0, 31.0, 37.0, 36.0, 70.0, 101.0, 195.0, 276.0, 458.0, 765.0, 1103.0, 1784.0, 2949.0, 4554.0, 7714.0, 12976.0, 22532.0, 39025.0, 68688.0, 119159.0, 180762.0, 204086.0, 156394.0, 94745.0, 54244.0, 31093.0, 17896.0, 10541.0, 6200.0, 3717.0, 2431.0, 1392.0, 928.0, 577.0, 410.0, 250.0, 128.0, 94.0, 58.0, 46.0, 23.0, 20.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.25749969482421875, -0.2483978271484375, -0.23929595947265625, -0.230194091796875, -0.22109222412109375, -0.2119903564453125, -0.20288848876953125, -0.19378662109375, -0.18468475341796875, -0.1755828857421875, -0.16648101806640625, -0.157379150390625, -0.14827728271484375, -0.1391754150390625, -0.13007354736328125, -0.1209716796875, -0.11186981201171875, -0.1027679443359375, -0.09366607666015625, -0.084564208984375, -0.07546234130859375, -0.0663604736328125, -0.05725860595703125, -0.04815673828125, -0.03905487060546875, -0.0299530029296875, -0.02085113525390625, -0.011749267578125, -0.00264739990234375, 0.0064544677734375, 0.01555633544921875, 0.024658203125, 0.03376007080078125, 0.0428619384765625, 0.05196380615234375, 0.061065673828125, 0.07016754150390625, 0.0792694091796875, 0.08837127685546875, 0.09747314453125, 0.10657501220703125, 0.1156768798828125, 0.12477874755859375, 0.133880615234375, 0.14298248291015625, 0.1520843505859375, 0.16118621826171875, 0.1702880859375, 0.17938995361328125, 0.1884918212890625, 0.19759368896484375, 0.206695556640625, 0.21579742431640625, 0.2248992919921875, 0.23400115966796875, 0.24310302734375, 0.25220489501953125, 0.2613067626953125, 0.27040863037109375, 0.279510498046875, 0.28861236572265625, 0.2977142333984375, 0.30681610107421875, 0.31591796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 8.0, 10.0, 12.0, 14.0, 10.0, 15.0, 19.0, 16.0, 22.0, 31.0, 23.0, 37.0, 47.0, 32.0, 45.0, 39.0, 44.0, 33.0, 32.0, 47.0, 55.0, 47.0, 36.0, 38.0, 40.0, 30.0, 33.0, 25.0, 32.0, 20.0, 23.0, 13.0, 9.0, 17.0, 7.0, 11.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.087554931640625, -2.01495361328125, -1.942352294921875, -1.8697509765625, -1.797149658203125, -1.72454833984375, -1.651947021484375, -1.579345703125, -1.506744384765625, -1.43414306640625, -1.361541748046875, -1.2889404296875, -1.216339111328125, -1.14373779296875, -1.071136474609375, -0.99853515625, -0.925933837890625, -0.85333251953125, -0.780731201171875, -0.7081298828125, -0.635528564453125, -0.56292724609375, -0.490325927734375, -0.417724609375, -0.345123291015625, -0.27252197265625, -0.199920654296875, -0.1273193359375, -0.054718017578125, 0.01788330078125, 0.090484619140625, 0.1630859375, 0.235687255859375, 0.30828857421875, 0.380889892578125, 0.4534912109375, 0.526092529296875, 0.59869384765625, 0.671295166015625, 0.743896484375, 0.816497802734375, 0.88909912109375, 0.961700439453125, 1.0343017578125, 1.106903076171875, 1.17950439453125, 1.252105712890625, 1.32470703125, 1.397308349609375, 1.46990966796875, 1.542510986328125, 1.6151123046875, 1.687713623046875, 1.76031494140625, 1.832916259765625, 1.905517578125, 1.978118896484375, 2.05072021484375, 2.123321533203125, 2.1959228515625, 2.268524169921875, 2.34112548828125, 2.413726806640625, 2.486328125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 13.0, 13.0, 16.0, 26.0, 33.0, 38.0, 63.0, 88.0, 136.0, 176.0, 337.0, 570.0, 958.0, 1697.0, 3674.0, 8331.0, 23168.0, 211303.0, 747447.0, 30491.0, 10686.0, 4421.0, 2013.0, 1126.0, 582.0, 397.0, 259.0, 139.0, 92.0, 74.0, 59.0, 31.0, 25.0, 18.0, 8.0, 13.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.21484375, -1.1770172119140625, -1.139190673828125, -1.1013641357421875, -1.06353759765625, -1.0257110595703125, -0.987884521484375, -0.9500579833984375, -0.9122314453125, -0.8744049072265625, -0.836578369140625, -0.7987518310546875, -0.76092529296875, -0.7230987548828125, -0.685272216796875, -0.6474456787109375, -0.609619140625, -0.5717926025390625, -0.533966064453125, -0.4961395263671875, -0.45831298828125, -0.4204864501953125, -0.382659912109375, -0.3448333740234375, -0.3070068359375, -0.2691802978515625, -0.231353759765625, -0.1935272216796875, -0.15570068359375, -0.1178741455078125, -0.080047607421875, -0.0422210693359375, -0.00439453125, 0.0334320068359375, 0.071258544921875, 0.1090850830078125, 0.14691162109375, 0.1847381591796875, 0.222564697265625, 0.2603912353515625, 0.2982177734375, 0.3360443115234375, 0.373870849609375, 0.4116973876953125, 0.44952392578125, 0.4873504638671875, 0.525177001953125, 0.5630035400390625, 0.600830078125, 0.6386566162109375, 0.676483154296875, 0.7143096923828125, 0.75213623046875, 0.7899627685546875, 0.827789306640625, 0.8656158447265625, 0.9034423828125, 0.9412689208984375, 0.979095458984375, 1.0169219970703125, 1.05474853515625, 1.0925750732421875, 1.130401611328125, 1.1682281494140625, 1.2060546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 6.0, 11.0, 11.0, 17.0, 11.0, 22.0, 18.0, 24.0, 30.0, 36.0, 30.0, 30.0, 42.0, 37.0, 32.0, 31.0, 40.0, 45.0, 51.0, 41.0, 34.0, 45.0, 47.0, 40.0, 38.0, 38.0, 28.0, 21.0, 19.0, 24.0, 16.0, 12.0, 13.0, 9.0, 5.0, 10.0, 4.0, 4.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.2974853515625, -1.250244140625, -1.2030029296875, -1.15576171875, -1.1085205078125, -1.061279296875, -1.0140380859375, -0.966796875, -0.9195556640625, -0.872314453125, -0.8250732421875, -0.77783203125, -0.7305908203125, -0.683349609375, -0.6361083984375, -0.5888671875, -0.5416259765625, -0.494384765625, -0.4471435546875, -0.39990234375, -0.3526611328125, -0.305419921875, -0.2581787109375, -0.2109375, -0.1636962890625, -0.116455078125, -0.0692138671875, -0.02197265625, 0.0252685546875, 0.072509765625, 0.1197509765625, 0.1669921875, 0.2142333984375, 0.261474609375, 0.3087158203125, 0.35595703125, 0.4031982421875, 0.450439453125, 0.4976806640625, 0.544921875, 0.5921630859375, 0.639404296875, 0.6866455078125, 0.73388671875, 0.7811279296875, 0.828369140625, 0.8756103515625, 0.9228515625, 0.9700927734375, 1.017333984375, 1.0645751953125, 1.11181640625, 1.1590576171875, 1.206298828125, 1.2535400390625, 1.30078125, 1.3480224609375, 1.395263671875, 1.4425048828125, 1.48974609375, 1.5369873046875, 1.584228515625, 1.6314697265625, 1.6787109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 12.0, 7.0, 5.0, 8.0, 28.0, 32.0, 37.0, 60.0, 96.0, 124.0, 204.0, 299.0, 461.0, 809.0, 1405.0, 2594.0, 4836.0, 10603.0, 26809.0, 790727.0, 168339.0, 22337.0, 9116.0, 4222.0, 2181.0, 1224.0, 728.0, 478.0, 272.0, 161.0, 90.0, 66.0, 49.0, 43.0, 21.0, 23.0, 17.0, 8.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26624298095703125, -0.2573394775390625, -0.24843597412109375, -0.239532470703125, -0.23062896728515625, -0.2217254638671875, -0.21282196044921875, -0.20391845703125, -0.19501495361328125, -0.1861114501953125, -0.17720794677734375, -0.168304443359375, -0.15940093994140625, -0.1504974365234375, -0.14159393310546875, -0.1326904296875, -0.12378692626953125, -0.1148834228515625, -0.10597991943359375, -0.097076416015625, -0.08817291259765625, -0.0792694091796875, -0.07036590576171875, -0.06146240234375, -0.05255889892578125, -0.0436553955078125, -0.03475189208984375, -0.025848388671875, -0.01694488525390625, -0.0080413818359375, 0.00086212158203125, 0.009765625, 0.01866912841796875, 0.0275726318359375, 0.03647613525390625, 0.045379638671875, 0.05428314208984375, 0.0631866455078125, 0.07209014892578125, 0.08099365234375, 0.08989715576171875, 0.0988006591796875, 0.10770416259765625, 0.116607666015625, 0.12551116943359375, 0.1344146728515625, 0.14331817626953125, 0.1522216796875, 0.16112518310546875, 0.1700286865234375, 0.17893218994140625, 0.187835693359375, 0.19673919677734375, 0.2056427001953125, 0.21454620361328125, 0.22344970703125, 0.23235321044921875, 0.2412567138671875, 0.25016021728515625, 0.259063720703125, 0.26796722412109375, 0.2768707275390625, 0.28577423095703125, 0.294677734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 2.0, 4.0, 7.0, 14.0, 11.0, 13.0, 13.0, 22.0, 21.0, 18.0, 18.0, 29.0, 36.0, 44.0, 35.0, 49.0, 43.0, 41.0, 61.0, 51.0, 54.0, 41.0, 56.0, 41.0, 45.0, 28.0, 41.0, 21.0, 21.0, 26.0, 13.0, 18.0, 9.0, 9.0, 9.0, 3.0, 8.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.184246063232422e-05, -4.0601007640361786e-05, -3.935955464839935e-05, -3.811810165643692e-05, -3.687664866447449e-05, -3.5635195672512054e-05, -3.439374268054962e-05, -3.315228968858719e-05, -3.1910836696624756e-05, -3.066938370466232e-05, -2.942793071269989e-05, -2.8186477720737457e-05, -2.6945024728775024e-05, -2.570357173681259e-05, -2.446211874485016e-05, -2.3220665752887726e-05, -2.1979212760925293e-05, -2.073775976896286e-05, -1.9496306777000427e-05, -1.8254853785037994e-05, -1.701340079307556e-05, -1.577194780111313e-05, -1.4530494809150696e-05, -1.3289041817188263e-05, -1.204758882522583e-05, -1.0806135833263397e-05, -9.564682841300964e-06, -8.323229849338531e-06, -7.081776857376099e-06, -5.840323865413666e-06, -4.598870873451233e-06, -3.3574178814888e-06, -2.115964889526367e-06, -8.745118975639343e-07, 3.6694109439849854e-07, 1.6083940863609314e-06, 2.8498470783233643e-06, 4.091300070285797e-06, 5.33275306224823e-06, 6.574206054210663e-06, 7.815659046173096e-06, 9.057112038135529e-06, 1.0298565030097961e-05, 1.1540018022060394e-05, 1.2781471014022827e-05, 1.402292400598526e-05, 1.5264376997947693e-05, 1.6505829989910126e-05, 1.774728298187256e-05, 1.898873597383499e-05, 2.0230188965797424e-05, 2.1471641957759857e-05, 2.271309494972229e-05, 2.3954547941684723e-05, 2.5196000933647156e-05, 2.643745392560959e-05, 2.767890691757202e-05, 2.8920359909534454e-05, 3.0161812901496887e-05, 3.140326589345932e-05, 3.264471888542175e-05, 3.3886171877384186e-05, 3.512762486934662e-05, 3.636907786130905e-05, 3.7610530853271484e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [6.0, 5.0, 5.0, 4.0, 8.0, 14.0, 20.0, 23.0, 24.0, 39.0, 44.0, 77.0, 122.0, 153.0, 210.0, 279.0, 416.0, 558.0, 771.0, 1094.0, 1661.0, 2290.0, 3371.0, 5129.0, 7983.0, 13040.0, 21359.0, 37246.0, 66164.0, 116637.0, 185253.0, 213896.0, 153189.0, 90693.0, 50861.0, 28460.0, 16905.0, 10218.0, 6586.0, 4299.0, 2760.0, 1956.0, 1309.0, 965.0, 726.0, 506.0, 366.0, 227.0, 168.0, 129.0, 113.0, 67.0, 50.0, 34.0, 16.0, 21.0, 15.0, 12.0, 6.0, 9.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.0679931640625, -0.06581878662109375, -0.0636444091796875, -0.06147003173828125, -0.059295654296875, -0.05712127685546875, -0.0549468994140625, -0.05277252197265625, -0.05059814453125, -0.04842376708984375, -0.0462493896484375, -0.04407501220703125, -0.041900634765625, -0.03972625732421875, -0.0375518798828125, -0.03537750244140625, -0.033203125, -0.03102874755859375, -0.0288543701171875, -0.02667999267578125, -0.024505615234375, -0.02233123779296875, -0.0201568603515625, -0.01798248291015625, -0.01580810546875, -0.01363372802734375, -0.0114593505859375, -0.00928497314453125, -0.007110595703125, -0.00493621826171875, -0.0027618408203125, -0.00058746337890625, 0.0015869140625, 0.00376129150390625, 0.0059356689453125, 0.00811004638671875, 0.010284423828125, 0.01245880126953125, 0.0146331787109375, 0.01680755615234375, 0.01898193359375, 0.02115631103515625, 0.0233306884765625, 0.02550506591796875, 0.027679443359375, 0.02985382080078125, 0.0320281982421875, 0.03420257568359375, 0.036376953125, 0.03855133056640625, 0.0407257080078125, 0.04290008544921875, 0.045074462890625, 0.04724884033203125, 0.0494232177734375, 0.05159759521484375, 0.05377197265625, 0.05594635009765625, 0.0581207275390625, 0.06029510498046875, 0.062469482421875, 0.06464385986328125, 0.0668182373046875, 0.06899261474609375, 0.0711669921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 8.0, 6.0, 11.0, 13.0, 17.0, 28.0, 28.0, 39.0, 42.0, 72.0, 44.0, 61.0, 62.0, 90.0, 73.0, 66.0, 68.0, 50.0, 46.0, 46.0, 31.0, 21.0, 23.0, 14.0, 9.0, 10.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023406982421875, -0.022638797760009766, -0.02187061309814453, -0.021102428436279297, -0.020334243774414062, -0.019566059112548828, -0.018797874450683594, -0.01802968978881836, -0.017261505126953125, -0.01649332046508789, -0.015725135803222656, -0.014956951141357422, -0.014188766479492188, -0.013420581817626953, -0.012652397155761719, -0.011884212493896484, -0.01111602783203125, -0.010347843170166016, -0.009579658508300781, -0.008811473846435547, -0.008043289184570312, -0.007275104522705078, -0.006506919860839844, -0.005738735198974609, -0.004970550537109375, -0.004202365875244141, -0.0034341812133789062, -0.002665996551513672, -0.0018978118896484375, -0.0011296272277832031, -0.00036144256591796875, 0.0004067420959472656, 0.0011749267578125, 0.0019431114196777344, 0.0027112960815429688, 0.003479480743408203, 0.0042476654052734375, 0.005015850067138672, 0.005784034729003906, 0.006552219390869141, 0.007320404052734375, 0.00808858871459961, 0.008856773376464844, 0.009624958038330078, 0.010393142700195312, 0.011161327362060547, 0.011929512023925781, 0.012697696685791016, 0.01346588134765625, 0.014234066009521484, 0.015002250671386719, 0.015770435333251953, 0.016538619995117188, 0.017306804656982422, 0.018074989318847656, 0.01884317398071289, 0.019611358642578125, 0.02037954330444336, 0.021147727966308594, 0.021915912628173828, 0.022684097290039062, 0.023452281951904297, 0.02422046661376953, 0.024988651275634766, 0.0257568359375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 5.0, 8.0, 11.0, 17.0, 21.0, 31.0, 32.0, 47.0, 47.0, 58.0, 89.0, 99.0, 63.0, 95.0, 73.0, 57.0, 50.0, 59.0, 27.0, 23.0, 20.0, 17.0, 11.0, 9.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.15084171295166, -5.977791786193848, -5.804741859436035, -5.631691932678223, -5.45864200592041, -5.285592079162598, -5.112542152404785, -4.939492702484131, -4.766442775726318, -4.593392848968506, -4.420342922210693, -4.247292995452881, -4.074243068695068, -3.901193380355835, -3.7281434535980225, -3.555093765258789, -3.3820436000823975, -3.208993673324585, -3.0359437465667725, -2.862894058227539, -2.6898441314697266, -2.516794204711914, -2.3437442779541016, -2.170694351196289, -1.9976445436477661, -1.8245946168899536, -1.6515448093414307, -1.4784948825836182, -1.3054449558258057, -1.1323951482772827, -0.9593452215194702, -0.7862954139709473, -0.6132454872131348, -0.44019562005996704, -0.26714572310447693, -0.09409582614898682, 0.07895404100418091, 0.25200390815734863, 0.42505383491516113, 0.5981036424636841, 0.7711535692214966, 0.9442034363746643, 1.117253303527832, 1.2903032302856445, 1.463353157043457, 1.63640296459198, 1.8094528913497925, 1.9825026988983154, 2.155552625656128, 2.3286025524139404, 2.501652479171753, 2.6747021675109863, 2.847752094268799, 3.0208020210266113, 3.193851947784424, 3.3669018745422363, 3.539951801300049, 3.7130017280578613, 3.886051654815674, 4.059101581573486, 4.232151508331299, 4.405200958251953, 4.578250885009766, 4.751300811767578, 4.924350738525391]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 11.0, 11.0, 6.0, 13.0, 15.0, 21.0, 23.0, 11.0, 20.0, 19.0, 16.0, 20.0, 36.0, 28.0, 32.0, 31.0, 40.0, 26.0, 39.0, 33.0, 32.0, 40.0, 42.0, 40.0, 35.0, 27.0, 28.0, 35.0, 28.0, 20.0, 25.0, 31.0, 24.0, 27.0, 10.0, 11.0, 10.0, 10.0, 8.0, 11.0, 1.0, 9.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0], "bins": [-1.6304569244384766, -1.5789599418640137, -1.5274629592895508, -1.4759658575057983, -1.4244688749313354, -1.3729718923568726, -1.3214747905731201, -1.2699778079986572, -1.2184808254241943, -1.1669838428497314, -1.1154868602752686, -1.0639897584915161, -1.0124927759170532, -0.9609957933425903, -0.9094987511634827, -0.858001708984375, -0.8065047264099121, -0.7550077438354492, -0.7035107016563416, -0.6520136594772339, -0.600516676902771, -0.5490196943283081, -0.49752265214920044, -0.44602563977241516, -0.3945286273956299, -0.3430316150188446, -0.2915346026420593, -0.24003759026527405, -0.18854057788848877, -0.1370435655117035, -0.08554655313491821, -0.034049540758132935, 0.017447471618652344, 0.06894448399543762, 0.1204414963722229, 0.17193850874900818, 0.22343552112579346, 0.27493253350257874, 0.326429545879364, 0.3779265582561493, 0.42942357063293457, 0.48092058300971985, 0.5324175953865051, 0.5839146375656128, 0.6354116201400757, 0.6869086027145386, 0.7384056448936462, 0.7899026870727539, 0.8413996696472168, 0.8928966522216797, 0.9443936944007874, 0.995890736579895, 1.047387719154358, 1.0988847017288208, 1.1503818035125732, 1.2018787860870361, 1.253375768661499, 1.304872751235962, 1.3563697338104248, 1.4078668355941772, 1.4593638181686401, 1.510860800743103, 1.5623579025268555, 1.6138548851013184, 1.6653518676757812]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 8.0, 2.0, 5.0, 13.0, 18.0, 23.0, 37.0, 41.0, 56.0, 83.0, 150.0, 159.0, 291.0, 432.0, 645.0, 1065.0, 1710.0, 3032.0, 5445.0, 10351.0, 19737.0, 38136.0, 72313.0, 125851.0, 184243.0, 202256.0, 161700.0, 101738.0, 56245.0, 29273.0, 14963.0, 7892.0, 4297.0, 2458.0, 1449.0, 853.0, 527.0, 359.0, 228.0, 140.0, 98.0, 63.0, 49.0, 35.0, 26.0, 19.0, 17.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.876953125, -2.77874755859375, -2.6805419921875, -2.58233642578125, -2.484130859375, -2.38592529296875, -2.2877197265625, -2.18951416015625, -2.09130859375, -1.99310302734375, -1.8948974609375, -1.79669189453125, -1.698486328125, -1.60028076171875, -1.5020751953125, -1.40386962890625, -1.3056640625, -1.20745849609375, -1.1092529296875, -1.01104736328125, -0.912841796875, -0.81463623046875, -0.7164306640625, -0.61822509765625, -0.52001953125, -0.42181396484375, -0.3236083984375, -0.22540283203125, -0.127197265625, -0.02899169921875, 0.0692138671875, 0.16741943359375, 0.265625, 0.36383056640625, 0.4620361328125, 0.56024169921875, 0.658447265625, 0.75665283203125, 0.8548583984375, 0.95306396484375, 1.05126953125, 1.14947509765625, 1.2476806640625, 1.34588623046875, 1.444091796875, 1.54229736328125, 1.6405029296875, 1.73870849609375, 1.8369140625, 1.93511962890625, 2.0333251953125, 2.13153076171875, 2.229736328125, 2.32794189453125, 2.4261474609375, 2.52435302734375, 2.62255859375, 2.72076416015625, 2.8189697265625, 2.91717529296875, 3.015380859375, 3.11358642578125, 3.2117919921875, 3.30999755859375, 3.408203125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 5.0, 7.0, 10.0, 8.0, 13.0, 8.0, 10.0, 20.0, 16.0, 20.0, 26.0, 24.0, 26.0, 22.0, 26.0, 34.0, 36.0, 37.0, 35.0, 43.0, 48.0, 39.0, 39.0, 34.0, 41.0, 30.0, 29.0, 26.0, 33.0, 29.0, 24.0, 20.0, 27.0, 27.0, 22.0, 13.0, 11.0, 14.0, 6.0, 11.0, 3.0, 8.0, 5.0, 10.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.11328125, -2.0505828857421875, -1.987884521484375, -1.9251861572265625, -1.86248779296875, -1.7997894287109375, -1.737091064453125, -1.6743927001953125, -1.6116943359375, -1.5489959716796875, -1.486297607421875, -1.4235992431640625, -1.36090087890625, -1.2982025146484375, -1.235504150390625, -1.1728057861328125, -1.110107421875, -1.0474090576171875, -0.984710693359375, -0.9220123291015625, -0.85931396484375, -0.7966156005859375, -0.733917236328125, -0.6712188720703125, -0.6085205078125, -0.5458221435546875, -0.483123779296875, -0.4204254150390625, -0.35772705078125, -0.2950286865234375, -0.232330322265625, -0.1696319580078125, -0.10693359375, -0.0442352294921875, 0.018463134765625, 0.0811614990234375, 0.14385986328125, 0.2065582275390625, 0.269256591796875, 0.3319549560546875, 0.3946533203125, 0.4573516845703125, 0.520050048828125, 0.5827484130859375, 0.64544677734375, 0.7081451416015625, 0.770843505859375, 0.8335418701171875, 0.896240234375, 0.9589385986328125, 1.021636962890625, 1.0843353271484375, 1.14703369140625, 1.2097320556640625, 1.272430419921875, 1.3351287841796875, 1.3978271484375, 1.4605255126953125, 1.523223876953125, 1.5859222412109375, 1.64862060546875, 1.7113189697265625, 1.774017333984375, 1.8367156982421875, 1.8994140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 20.0, 24.0, 42.0, 47.0, 63.0, 121.0, 145.0, 238.0, 337.0, 516.0, 768.0, 1332.0, 2067.0, 3346.0, 5718.0, 10038.0, 17773.0, 31894.0, 56072.0, 93595.0, 140919.0, 176733.0, 171636.0, 132193.0, 85378.0, 50266.0, 28599.0, 16047.0, 9050.0, 5158.0, 3048.0, 1917.0, 1223.0, 755.0, 493.0, 315.0, 208.0, 148.0, 87.0, 69.0, 38.0, 32.0, 28.0, 17.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.720703125, -2.629730224609375, -2.53875732421875, -2.447784423828125, -2.3568115234375, -2.265838623046875, -2.17486572265625, -2.083892822265625, -1.992919921875, -1.901947021484375, -1.81097412109375, -1.720001220703125, -1.6290283203125, -1.538055419921875, -1.44708251953125, -1.356109619140625, -1.26513671875, -1.174163818359375, -1.08319091796875, -0.992218017578125, -0.9012451171875, -0.810272216796875, -0.71929931640625, -0.628326416015625, -0.537353515625, -0.446380615234375, -0.35540771484375, -0.264434814453125, -0.1734619140625, -0.082489013671875, 0.00848388671875, 0.099456787109375, 0.1904296875, 0.281402587890625, 0.37237548828125, 0.463348388671875, 0.5543212890625, 0.645294189453125, 0.73626708984375, 0.827239990234375, 0.918212890625, 1.009185791015625, 1.10015869140625, 1.191131591796875, 1.2821044921875, 1.373077392578125, 1.46405029296875, 1.555023193359375, 1.64599609375, 1.736968994140625, 1.82794189453125, 1.918914794921875, 2.0098876953125, 2.100860595703125, 2.19183349609375, 2.282806396484375, 2.373779296875, 2.464752197265625, 2.55572509765625, 2.646697998046875, 2.7376708984375, 2.828643798828125, 2.91961669921875, 3.010589599609375, 3.1015625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 10.0, 12.0, 12.0, 16.0, 23.0, 17.0, 18.0, 36.0, 24.0, 29.0, 41.0, 38.0, 37.0, 44.0, 36.0, 47.0, 44.0, 44.0, 43.0, 49.0, 37.0, 34.0, 42.0, 39.0, 24.0, 29.0, 22.0, 20.0, 19.0, 27.0, 16.0, 10.0, 8.0, 13.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2480316162109375, -1.202117919921875, -1.1562042236328125, -1.11029052734375, -1.0643768310546875, -1.018463134765625, -0.9725494384765625, -0.9266357421875, -0.8807220458984375, -0.834808349609375, -0.7888946533203125, -0.74298095703125, -0.6970672607421875, -0.651153564453125, -0.6052398681640625, -0.559326171875, -0.5134124755859375, -0.467498779296875, -0.4215850830078125, -0.37567138671875, -0.3297576904296875, -0.283843994140625, -0.2379302978515625, -0.1920166015625, -0.1461029052734375, -0.100189208984375, -0.0542755126953125, -0.00836181640625, 0.0375518798828125, 0.083465576171875, 0.1293792724609375, 0.17529296875, 0.2212066650390625, 0.267120361328125, 0.3130340576171875, 0.35894775390625, 0.4048614501953125, 0.450775146484375, 0.4966888427734375, 0.5426025390625, 0.5885162353515625, 0.634429931640625, 0.6803436279296875, 0.72625732421875, 0.7721710205078125, 0.818084716796875, 0.8639984130859375, 0.909912109375, 0.9558258056640625, 1.001739501953125, 1.0476531982421875, 1.09356689453125, 1.1394805908203125, 1.185394287109375, 1.2313079833984375, 1.2772216796875, 1.3231353759765625, 1.369049072265625, 1.4149627685546875, 1.46087646484375, 1.5067901611328125, 1.552703857421875, 1.5986175537109375, 1.64453125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 6.0, 9.0, 22.0, 27.0, 41.0, 44.0, 86.0, 83.0, 160.0, 244.0, 282.0, 526.0, 796.0, 1060.0, 1803.0, 2731.0, 4513.0, 7348.0, 13007.0, 23521.0, 43775.0, 83187.0, 147416.0, 209129.0, 201800.0, 137558.0, 76417.0, 40513.0, 21775.0, 11933.0, 7084.0, 4149.0, 2584.0, 1680.0, 1117.0, 675.0, 476.0, 313.0, 198.0, 143.0, 107.0, 65.0, 45.0, 31.0, 27.0, 13.0, 17.0, 10.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7138671875, -1.6584625244140625, -1.603057861328125, -1.5476531982421875, -1.49224853515625, -1.4368438720703125, -1.381439208984375, -1.3260345458984375, -1.2706298828125, -1.2152252197265625, -1.159820556640625, -1.1044158935546875, -1.04901123046875, -0.9936065673828125, -0.938201904296875, -0.8827972412109375, -0.827392578125, -0.7719879150390625, -0.716583251953125, -0.6611785888671875, -0.60577392578125, -0.5503692626953125, -0.494964599609375, -0.4395599365234375, -0.3841552734375, -0.3287506103515625, -0.273345947265625, -0.2179412841796875, -0.16253662109375, -0.1071319580078125, -0.051727294921875, 0.0036773681640625, 0.05908203125, 0.1144866943359375, 0.169891357421875, 0.2252960205078125, 0.28070068359375, 0.3361053466796875, 0.391510009765625, 0.4469146728515625, 0.5023193359375, 0.5577239990234375, 0.613128662109375, 0.6685333251953125, 0.72393798828125, 0.7793426513671875, 0.834747314453125, 0.8901519775390625, 0.945556640625, 1.0009613037109375, 1.056365966796875, 1.1117706298828125, 1.16717529296875, 1.2225799560546875, 1.277984619140625, 1.3333892822265625, 1.3887939453125, 1.4441986083984375, 1.499603271484375, 1.5550079345703125, 1.61041259765625, 1.6658172607421875, 1.721221923828125, 1.7766265869140625, 1.83203125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 14.0, 17.0, 14.0, 19.0, 29.0, 31.0, 39.0, 40.0, 45.0, 50.0, 65.0, 61.0, 65.0, 68.0, 75.0, 65.0, 52.0, 37.0, 36.0, 33.0, 26.0, 26.0, 13.0, 15.0, 12.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00015115737915039062, -0.00014640763401985168, -0.00014165788888931274, -0.0001369081437587738, -0.00013215839862823486, -0.00012740865349769592, -0.00012265890836715698, -0.00011790916323661804, -0.0001131594181060791, -0.00010840967297554016, -0.00010365992784500122, -9.891018271446228e-05, -9.416043758392334e-05, -8.94106924533844e-05, -8.466094732284546e-05, -7.991120219230652e-05, -7.516145706176758e-05, -7.041171193122864e-05, -6.56619668006897e-05, -6.091222167015076e-05, -5.6162476539611816e-05, -5.1412731409072876e-05, -4.6662986278533936e-05, -4.1913241147994995e-05, -3.7163496017456055e-05, -3.2413750886917114e-05, -2.7664005756378174e-05, -2.2914260625839233e-05, -1.8164515495300293e-05, -1.3414770364761353e-05, -8.665025234222412e-06, -3.915280103683472e-06, 8.344650268554688e-07, 5.584210157394409e-06, 1.033395528793335e-05, 1.508370041847229e-05, 1.983344554901123e-05, 2.458319067955017e-05, 2.933293581008911e-05, 3.408268094062805e-05, 3.883242607116699e-05, 4.358217120170593e-05, 4.833191633224487e-05, 5.3081661462783813e-05, 5.7831406593322754e-05, 6.25811517238617e-05, 6.733089685440063e-05, 7.208064198493958e-05, 7.683038711547852e-05, 8.158013224601746e-05, 8.63298773765564e-05, 9.107962250709534e-05, 9.582936763763428e-05, 0.00010057911276817322, 0.00010532885789871216, 0.0001100786030292511, 0.00011482834815979004, 0.00011957809329032898, 0.00012432783842086792, 0.00012907758355140686, 0.0001338273286819458, 0.00013857707381248474, 0.00014332681894302368, 0.00014807656407356262, 0.00015282630920410156]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 10.0, 12.0, 21.0, 28.0, 64.0, 82.0, 120.0, 198.0, 337.0, 601.0, 1008.0, 1778.0, 3100.0, 5987.0, 11620.0, 22885.0, 46501.0, 92868.0, 166782.0, 229264.0, 205666.0, 127413.0, 65616.0, 32195.0, 16370.0, 8059.0, 4397.0, 2406.0, 1306.0, 771.0, 405.0, 256.0, 127.0, 92.0, 74.0, 51.0, 21.0, 25.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7138671875, -1.6581268310546875, -1.602386474609375, -1.5466461181640625, -1.49090576171875, -1.4351654052734375, -1.379425048828125, -1.3236846923828125, -1.2679443359375, -1.2122039794921875, -1.156463623046875, -1.1007232666015625, -1.04498291015625, -0.9892425537109375, -0.933502197265625, -0.8777618408203125, -0.822021484375, -0.7662811279296875, -0.710540771484375, -0.6548004150390625, -0.59906005859375, -0.5433197021484375, -0.487579345703125, -0.4318389892578125, -0.3760986328125, -0.3203582763671875, -0.264617919921875, -0.2088775634765625, -0.15313720703125, -0.0973968505859375, -0.041656494140625, 0.0140838623046875, 0.06982421875, 0.1255645751953125, 0.181304931640625, 0.2370452880859375, 0.29278564453125, 0.3485260009765625, 0.404266357421875, 0.4600067138671875, 0.5157470703125, 0.5714874267578125, 0.627227783203125, 0.6829681396484375, 0.73870849609375, 0.7944488525390625, 0.850189208984375, 0.9059295654296875, 0.961669921875, 1.0174102783203125, 1.073150634765625, 1.1288909912109375, 1.18463134765625, 1.2403717041015625, 1.296112060546875, 1.3518524169921875, 1.4075927734375, 1.4633331298828125, 1.519073486328125, 1.5748138427734375, 1.63055419921875, 1.6862945556640625, 1.742034912109375, 1.7977752685546875, 1.853515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 9.0, 10.0, 11.0, 11.0, 13.0, 12.0, 22.0, 21.0, 30.0, 39.0, 47.0, 49.0, 56.0, 80.0, 69.0, 56.0, 70.0, 54.0, 64.0, 43.0, 39.0, 36.0, 37.0, 36.0, 17.0, 13.0, 8.0, 16.0, 9.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33078765869140625, -0.3185577392578125, -0.30632781982421875, -0.294097900390625, -0.28186798095703125, -0.2696380615234375, -0.25740814208984375, -0.24517822265625, -0.23294830322265625, -0.2207183837890625, -0.20848846435546875, -0.196258544921875, -0.18402862548828125, -0.1717987060546875, -0.15956878662109375, -0.1473388671875, -0.13510894775390625, -0.1228790283203125, -0.11064910888671875, -0.098419189453125, -0.08618927001953125, -0.0739593505859375, -0.06172943115234375, -0.04949951171875, -0.03726959228515625, -0.0250396728515625, -0.01280975341796875, -0.000579833984375, 0.01165008544921875, 0.0238800048828125, 0.03610992431640625, 0.04833984375, 0.06056976318359375, 0.0727996826171875, 0.08502960205078125, 0.097259521484375, 0.10948944091796875, 0.1217193603515625, 0.13394927978515625, 0.14617919921875, 0.15840911865234375, 0.1706390380859375, 0.18286895751953125, 0.195098876953125, 0.20732879638671875, 0.2195587158203125, 0.23178863525390625, 0.2440185546875, 0.25624847412109375, 0.2684783935546875, 0.28070831298828125, 0.292938232421875, 0.30516815185546875, 0.3173980712890625, 0.32962799072265625, 0.34185791015625, 0.35408782958984375, 0.3663177490234375, 0.37854766845703125, 0.390777587890625, 0.40300750732421875, 0.4152374267578125, 0.42746734619140625, 0.439697265625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 3.0, 10.0, 13.0, 22.0, 20.0, 39.0, 43.0, 57.0, 61.0, 78.0, 93.0, 95.0, 73.0, 93.0, 58.0, 51.0, 45.0, 34.0, 28.0, 17.0, 13.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668394565582275, -6.490774154663086, -6.313153266906738, -6.135532855987549, -5.957912445068359, -5.78029203414917, -5.6026716232299805, -5.425050735473633, -5.247430324554443, -5.069809913635254, -4.892189025878906, -4.714568614959717, -4.536948204040527, -4.359327793121338, -4.181707382202148, -4.004086494445801, -3.8264660835266113, -3.648845672607422, -3.4712250232696533, -3.2936043739318848, -3.1159839630126953, -2.938363552093506, -2.7607429027557373, -2.5831222534179688, -2.4055018424987793, -2.22788143157959, -2.0502607822418213, -1.8726402521133423, -1.6950197219848633, -1.5173991918563843, -1.3397786617279053, -1.1621581315994263, -0.9845380783081055, -0.8069175481796265, -0.6292970180511475, -0.45167648792266846, -0.27405595779418945, -0.09643542766571045, 0.08118510246276855, 0.25880563259124756, 0.43642616271972656, 0.6140466928482056, 0.7916672229766846, 0.9692877531051636, 1.1469082832336426, 1.3245288133621216, 1.5021493434906006, 1.6797698736190796, 1.8573904037475586, 2.035010814666748, 2.2126314640045166, 2.390252113342285, 2.5678725242614746, 2.745492935180664, 2.9231135845184326, 3.100734233856201, 3.2783546447753906, 3.45597505569458, 3.6335957050323486, 3.811216354370117, 3.9888367652893066, 4.166457176208496, 4.344078063964844, 4.521698474884033, 4.699318885803223]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 1.0, 3.0, 6.0, 7.0, 12.0, 8.0, 13.0, 14.0, 27.0, 21.0, 14.0, 21.0, 27.0, 34.0, 19.0, 35.0, 35.0, 34.0, 35.0, 45.0, 52.0, 42.0, 44.0, 44.0, 47.0, 31.0, 32.0, 34.0, 41.0, 29.0, 21.0, 21.0, 26.0, 20.0, 13.0, 23.0, 17.0, 4.0, 13.0, 12.0, 4.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9693043231964111, -1.907718539237976, -1.8461326360702515, -1.7845468521118164, -1.7229610681533813, -1.6613751649856567, -1.5997893810272217, -1.538203477859497, -1.476617693901062, -1.415031909942627, -1.3534460067749023, -1.2918602228164673, -1.2302744388580322, -1.1686885356903076, -1.1071027517318726, -1.0455169677734375, -0.9839311242103577, -0.9223452806472778, -0.8607594966888428, -0.7991736531257629, -0.7375878095626831, -0.676002025604248, -0.6144161820411682, -0.5528303384780884, -0.49124452471733093, -0.4296587109565735, -0.36807286739349365, -0.3064870536327362, -0.24490122497081757, -0.18331539630889893, -0.12172958254814148, -0.060143738985061646, 0.0014420747756958008, 0.06302790343761444, 0.12461372464895248, 0.18619954586029053, 0.24778537452220917, 0.3093712031841278, 0.37095701694488525, 0.4325428605079651, 0.49412867426872253, 0.55571448802948, 0.6173003315925598, 0.6788861751556396, 0.7404719591140747, 0.8020578026771545, 0.8636436462402344, 0.9252294301986694, 0.9868152737617493, 1.048401117324829, 1.1099869012832642, 1.1715726852416992, 1.2331585884094238, 1.2947443723678589, 1.356330156326294, 1.4179160594940186, 1.4795018434524536, 1.5410876274108887, 1.6026735305786133, 1.6642593145370483, 1.7258450984954834, 1.787431001663208, 1.849016785621643, 1.9106025695800781, 1.9721884727478027]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 17.0, 15.0, 30.0, 53.0, 72.0, 115.0, 159.0, 260.0, 440.0, 654.0, 1032.0, 1716.0, 3034.0, 5258.0, 9629.0, 18512.0, 37235.0, 80871.0, 193478.0, 512983.0, 1207863.0, 1228824.0, 534557.0, 197648.0, 81611.0, 37276.0, 18129.0, 9622.0, 5355.0, 3054.0, 1833.0, 1113.0, 654.0, 428.0, 257.0, 184.0, 96.0, 75.0, 53.0, 28.0, 22.0, 14.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.46453857421875, -4.3157958984375, -4.16705322265625, -4.018310546875, -3.86956787109375, -3.7208251953125, -3.57208251953125, -3.42333984375, -3.27459716796875, -3.1258544921875, -2.97711181640625, -2.828369140625, -2.67962646484375, -2.5308837890625, -2.38214111328125, -2.2333984375, -2.08465576171875, -1.9359130859375, -1.78717041015625, -1.638427734375, -1.48968505859375, -1.3409423828125, -1.19219970703125, -1.04345703125, -0.89471435546875, -0.7459716796875, -0.59722900390625, -0.448486328125, -0.29974365234375, -0.1510009765625, -0.00225830078125, 0.146484375, 0.29522705078125, 0.4439697265625, 0.59271240234375, 0.741455078125, 0.89019775390625, 1.0389404296875, 1.18768310546875, 1.33642578125, 1.48516845703125, 1.6339111328125, 1.78265380859375, 1.931396484375, 2.08013916015625, 2.2288818359375, 2.37762451171875, 2.5263671875, 2.67510986328125, 2.8238525390625, 2.97259521484375, 3.121337890625, 3.27008056640625, 3.4188232421875, 3.56756591796875, 3.71630859375, 3.86505126953125, 4.0137939453125, 4.16253662109375, 4.311279296875, 4.46002197265625, 4.6087646484375, 4.75750732421875, 4.90625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 4.0, 1.0, 5.0, 5.0, 11.0, 15.0, 11.0, 17.0, 10.0, 19.0, 19.0, 25.0, 20.0, 28.0, 29.0, 36.0, 32.0, 30.0, 27.0, 36.0, 40.0, 49.0, 30.0, 46.0, 39.0, 27.0, 41.0, 34.0, 37.0, 30.0, 29.0, 28.0, 21.0, 22.0, 18.0, 12.0, 21.0, 18.0, 10.0, 10.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.521484375, -1.4746856689453125, -1.427886962890625, -1.3810882568359375, -1.33428955078125, -1.2874908447265625, -1.240692138671875, -1.1938934326171875, -1.1470947265625, -1.1002960205078125, -1.053497314453125, -1.0066986083984375, -0.95989990234375, -0.9131011962890625, -0.866302490234375, -0.8195037841796875, -0.772705078125, -0.7259063720703125, -0.679107666015625, -0.6323089599609375, -0.58551025390625, -0.5387115478515625, -0.491912841796875, -0.4451141357421875, -0.3983154296875, -0.3515167236328125, -0.304718017578125, -0.2579193115234375, -0.21112060546875, -0.1643218994140625, -0.117523193359375, -0.0707244873046875, -0.02392578125, 0.0228729248046875, 0.069671630859375, 0.1164703369140625, 0.16326904296875, 0.2100677490234375, 0.256866455078125, 0.3036651611328125, 0.3504638671875, 0.3972625732421875, 0.444061279296875, 0.4908599853515625, 0.53765869140625, 0.5844573974609375, 0.631256103515625, 0.6780548095703125, 0.724853515625, 0.7716522216796875, 0.818450927734375, 0.8652496337890625, 0.91204833984375, 0.9588470458984375, 1.005645751953125, 1.0524444580078125, 1.0992431640625, 1.1460418701171875, 1.192840576171875, 1.2396392822265625, 1.28643798828125, 1.3332366943359375, 1.380035400390625, 1.4268341064453125, 1.4736328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 18.0, 21.0, 34.0, 49.0, 85.0, 107.0, 132.0, 230.0, 328.0, 517.0, 746.0, 1216.0, 1900.0, 2960.0, 4741.0, 7636.0, 12945.0, 22377.0, 40009.0, 73152.0, 138658.0, 272854.0, 535096.0, 921368.0, 958471.0, 576936.0, 293593.0, 148977.0, 78048.0, 41927.0, 23661.0, 13667.0, 8188.0, 5038.0, 3014.0, 1946.0, 1255.0, 774.0, 538.0, 350.0, 230.0, 165.0, 98.0, 65.0, 49.0, 41.0, 14.0, 13.0, 14.0, 10.0, 4.0, 1.0, 5.0, 4.0, 1.0], "bins": [-4.10546875, -3.98126220703125, -3.8570556640625, -3.73284912109375, -3.608642578125, -3.48443603515625, -3.3602294921875, -3.23602294921875, -3.11181640625, -2.98760986328125, -2.8634033203125, -2.73919677734375, -2.614990234375, -2.49078369140625, -2.3665771484375, -2.24237060546875, -2.1181640625, -1.99395751953125, -1.8697509765625, -1.74554443359375, -1.621337890625, -1.49713134765625, -1.3729248046875, -1.24871826171875, -1.12451171875, -1.00030517578125, -0.8760986328125, -0.75189208984375, -0.627685546875, -0.50347900390625, -0.3792724609375, -0.25506591796875, -0.130859375, -0.00665283203125, 0.1175537109375, 0.24176025390625, 0.365966796875, 0.49017333984375, 0.6143798828125, 0.73858642578125, 0.86279296875, 0.98699951171875, 1.1112060546875, 1.23541259765625, 1.359619140625, 1.48382568359375, 1.6080322265625, 1.73223876953125, 1.8564453125, 1.98065185546875, 2.1048583984375, 2.22906494140625, 2.353271484375, 2.47747802734375, 2.6016845703125, 2.72589111328125, 2.85009765625, 2.97430419921875, 3.0985107421875, 3.22271728515625, 3.346923828125, 3.47113037109375, 3.5953369140625, 3.71954345703125, 3.84375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 9.0, 8.0, 6.0, 17.0, 32.0, 40.0, 34.0, 48.0, 57.0, 95.0, 94.0, 105.0, 141.0, 176.0, 209.0, 265.0, 260.0, 293.0, 294.0, 265.0, 263.0, 272.0, 205.0, 180.0, 148.0, 118.0, 98.0, 79.0, 61.0, 50.0, 43.0, 28.0, 16.0, 13.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.07647705078125, -1.0396728515625, -1.00286865234375, -0.966064453125, -0.92926025390625, -0.8924560546875, -0.85565185546875, -0.81884765625, -0.78204345703125, -0.7452392578125, -0.70843505859375, -0.671630859375, -0.63482666015625, -0.5980224609375, -0.56121826171875, -0.5244140625, -0.48760986328125, -0.4508056640625, -0.41400146484375, -0.377197265625, -0.34039306640625, -0.3035888671875, -0.26678466796875, -0.22998046875, -0.19317626953125, -0.1563720703125, -0.11956787109375, -0.082763671875, -0.04595947265625, -0.0091552734375, 0.02764892578125, 0.064453125, 0.10125732421875, 0.1380615234375, 0.17486572265625, 0.211669921875, 0.24847412109375, 0.2852783203125, 0.32208251953125, 0.35888671875, 0.39569091796875, 0.4324951171875, 0.46929931640625, 0.506103515625, 0.54290771484375, 0.5797119140625, 0.61651611328125, 0.6533203125, 0.69012451171875, 0.7269287109375, 0.76373291015625, 0.800537109375, 0.83734130859375, 0.8741455078125, 0.91094970703125, 0.94775390625, 0.98455810546875, 1.0213623046875, 1.05816650390625, 1.094970703125, 1.13177490234375, 1.1685791015625, 1.20538330078125, 1.2421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 9.0, 14.0, 16.0, 14.0, 26.0, 41.0, 51.0, 63.0, 74.0, 95.0, 79.0, 92.0, 91.0, 64.0, 57.0, 60.0, 32.0, 27.0, 24.0, 20.0, 7.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.784271717071533, -7.594692707061768, -7.405113697052002, -7.2155351638793945, -7.025956153869629, -6.836377143859863, -6.646798133850098, -6.457219123840332, -6.267640113830566, -6.078061103820801, -5.888482093811035, -5.6989030838012695, -5.509324550628662, -5.3197455406188965, -5.130166530609131, -4.940587520599365, -4.751008987426758, -4.561429977416992, -4.371850967407227, -4.182271957397461, -3.9926934242248535, -3.803114414215088, -3.6135354042053223, -3.4239563941955566, -3.23437762260437, -3.0447986125946045, -2.855219841003418, -2.6656408309936523, -2.4760618209838867, -2.2864830493927, -2.0969040393829346, -1.9073251485824585, -1.7177457809448242, -1.5281668901443481, -1.338587999343872, -1.1490089893341064, -0.9594300985336304, -0.7698512077331543, -0.5802721977233887, -0.3906933069229126, -0.20111441612243652, -0.011535495519638062, 0.1780434250831604, 0.36762237548828125, 0.5572012662887573, 0.7467801570892334, 0.936359167098999, 1.125938057899475, 1.3155169486999512, 1.5050958395004272, 1.6946747303009033, 1.884253740310669, 2.0738325119018555, 2.263411521911621, 2.4529905319213867, 2.6425695419311523, 2.832148313522339, 3.0217273235321045, 3.211306095123291, 3.4008851051330566, 3.5904641151428223, 3.780042886734009, 3.9696218967437744, 4.159200668334961, 4.348779678344727]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 7.0, 16.0, 10.0, 16.0, 22.0, 25.0, 14.0, 29.0, 20.0, 30.0, 30.0, 30.0, 42.0, 45.0, 33.0, 43.0, 42.0, 48.0, 38.0, 34.0, 36.0, 39.0, 46.0, 38.0, 34.0, 32.0, 27.0, 20.0, 22.0, 18.0, 19.0, 14.0, 11.0, 9.0, 14.0, 10.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.2169461250305176, -2.1566765308380127, -2.096407175064087, -2.036137580871582, -1.9758681058883667, -1.9155986309051514, -1.855329155921936, -1.7950596809387207, -1.7347902059555054, -1.67452073097229, -1.6142512559890747, -1.5539817810058594, -1.4937121868133545, -1.4334427118301392, -1.3731732368469238, -1.3129037618637085, -1.2526342868804932, -1.1923648118972778, -1.1320953369140625, -1.0718257427215576, -1.0115562677383423, -0.951286792755127, -0.8910173177719116, -0.8307478427886963, -0.7704782485961914, -0.7102087736129761, -0.649939239025116, -0.5896697640419006, -0.5294002890586853, -0.4691307842731476, -0.40886127948760986, -0.34859180450439453, -0.2883223295211792, -0.22805283963680267, -0.16778334975242615, -0.10751384496688843, -0.0472443550825119, 0.013025134801864624, 0.07329463958740234, 0.13356411457061768, 0.1938336193561554, 0.2541031241416931, 0.31437259912490845, 0.37464210391044617, 0.4349116086959839, 0.4951810836791992, 0.5554505586624146, 0.6157200336456299, 0.67598956823349, 0.7362590432167053, 0.7965285778045654, 0.8567980527877808, 0.9170675277709961, 0.9773370027542114, 1.0376064777374268, 1.0978760719299316, 1.158145546913147, 1.2184150218963623, 1.2786844968795776, 1.338953971862793, 1.3992235660552979, 1.4594930410385132, 1.5197625160217285, 1.5800319910049438, 1.6403014659881592]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 2.0, 8.0, 16.0, 17.0, 23.0, 39.0, 50.0, 84.0, 135.0, 251.0, 375.0, 565.0, 1053.0, 1793.0, 3324.0, 6319.0, 11909.0, 23719.0, 48421.0, 98618.0, 185751.0, 251671.0, 197455.0, 109129.0, 53839.0, 25988.0, 12835.0, 6635.0, 3733.0, 2003.0, 1131.0, 661.0, 360.0, 212.0, 154.0, 97.0, 54.0, 37.0, 27.0, 14.0, 17.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.32747650146484375, -0.3155975341796875, -0.30371856689453125, -0.291839599609375, -0.27996063232421875, -0.2680816650390625, -0.25620269775390625, -0.24432373046875, -0.23244476318359375, -0.2205657958984375, -0.20868682861328125, -0.196807861328125, -0.18492889404296875, -0.1730499267578125, -0.16117095947265625, -0.1492919921875, -0.13741302490234375, -0.1255340576171875, -0.11365509033203125, -0.101776123046875, -0.08989715576171875, -0.0780181884765625, -0.06613922119140625, -0.05426025390625, -0.04238128662109375, -0.0305023193359375, -0.01862335205078125, -0.006744384765625, 0.00513458251953125, 0.0170135498046875, 0.02889251708984375, 0.040771484375, 0.05265045166015625, 0.0645294189453125, 0.07640838623046875, 0.088287353515625, 0.10016632080078125, 0.1120452880859375, 0.12392425537109375, 0.13580322265625, 0.14768218994140625, 0.1595611572265625, 0.17144012451171875, 0.183319091796875, 0.19519805908203125, 0.2070770263671875, 0.21895599365234375, 0.2308349609375, 0.24271392822265625, 0.2545928955078125, 0.26647186279296875, 0.278350830078125, 0.29022979736328125, 0.3021087646484375, 0.31398773193359375, 0.32586669921875, 0.33774566650390625, 0.3496246337890625, 0.36150360107421875, 0.373382568359375, 0.38526153564453125, 0.3971405029296875, 0.40901947021484375, 0.4208984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 2.0, 7.0, 11.0, 7.0, 12.0, 14.0, 20.0, 20.0, 23.0, 23.0, 27.0, 33.0, 24.0, 48.0, 37.0, 36.0, 35.0, 35.0, 33.0, 45.0, 33.0, 51.0, 41.0, 41.0, 42.0, 39.0, 23.0, 35.0, 29.0, 19.0, 25.0, 22.0, 15.0, 18.0, 16.0, 13.0, 10.0, 4.0, 8.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.147979736328125, -2.07916259765625, -2.010345458984375, -1.9415283203125, -1.872711181640625, -1.80389404296875, -1.735076904296875, -1.666259765625, -1.597442626953125, -1.52862548828125, -1.459808349609375, -1.3909912109375, -1.322174072265625, -1.25335693359375, -1.184539794921875, -1.11572265625, -1.046905517578125, -0.97808837890625, -0.909271240234375, -0.8404541015625, -0.771636962890625, -0.70281982421875, -0.634002685546875, -0.565185546875, -0.496368408203125, -0.42755126953125, -0.358734130859375, -0.2899169921875, -0.221099853515625, -0.15228271484375, -0.083465576171875, -0.0146484375, 0.054168701171875, 0.12298583984375, 0.191802978515625, 0.2606201171875, 0.329437255859375, 0.39825439453125, 0.467071533203125, 0.535888671875, 0.604705810546875, 0.67352294921875, 0.742340087890625, 0.8111572265625, 0.879974365234375, 0.94879150390625, 1.017608642578125, 1.08642578125, 1.155242919921875, 1.22406005859375, 1.292877197265625, 1.3616943359375, 1.430511474609375, 1.49932861328125, 1.568145751953125, 1.636962890625, 1.705780029296875, 1.77459716796875, 1.843414306640625, 1.9122314453125, 1.981048583984375, 2.04986572265625, 2.118682861328125, 2.1875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 8.0, 3.0, 7.0, 8.0, 14.0, 15.0, 22.0, 30.0, 44.0, 66.0, 98.0, 129.0, 183.0, 286.0, 450.0, 693.0, 1152.0, 2002.0, 3984.0, 8534.0, 20126.0, 79197.0, 858546.0, 43362.0, 15206.0, 6627.0, 3194.0, 1758.0, 1019.0, 582.0, 398.0, 280.0, 143.0, 99.0, 73.0, 54.0, 42.0, 29.0, 18.0, 16.0, 15.0, 12.0, 9.0, 5.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.080078125, -1.04669189453125, -1.0133056640625, -0.97991943359375, -0.946533203125, -0.91314697265625, -0.8797607421875, -0.84637451171875, -0.81298828125, -0.77960205078125, -0.7462158203125, -0.71282958984375, -0.679443359375, -0.64605712890625, -0.6126708984375, -0.57928466796875, -0.5458984375, -0.51251220703125, -0.4791259765625, -0.44573974609375, -0.412353515625, -0.37896728515625, -0.3455810546875, -0.31219482421875, -0.27880859375, -0.24542236328125, -0.2120361328125, -0.17864990234375, -0.145263671875, -0.11187744140625, -0.0784912109375, -0.04510498046875, -0.01171875, 0.02166748046875, 0.0550537109375, 0.08843994140625, 0.121826171875, 0.15521240234375, 0.1885986328125, 0.22198486328125, 0.25537109375, 0.28875732421875, 0.3221435546875, 0.35552978515625, 0.388916015625, 0.42230224609375, 0.4556884765625, 0.48907470703125, 0.5224609375, 0.55584716796875, 0.5892333984375, 0.62261962890625, 0.656005859375, 0.68939208984375, 0.7227783203125, 0.75616455078125, 0.78955078125, 0.82293701171875, 0.8563232421875, 0.88970947265625, 0.923095703125, 0.95648193359375, 0.9898681640625, 1.02325439453125, 1.056640625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 4.0, 5.0, 9.0, 11.0, 23.0, 27.0, 16.0, 21.0, 21.0, 34.0, 36.0, 32.0, 35.0, 38.0, 34.0, 43.0, 44.0, 43.0, 37.0, 40.0, 30.0, 37.0, 35.0, 39.0, 39.0, 31.0, 25.0, 28.0, 20.0, 12.0, 14.0, 23.0, 24.0, 13.0, 9.0, 10.0, 6.0, 10.0, 6.0, 9.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.36328125, -1.320404052734375, -1.27752685546875, -1.234649658203125, -1.1917724609375, -1.148895263671875, -1.10601806640625, -1.063140869140625, -1.020263671875, -0.977386474609375, -0.93450927734375, -0.891632080078125, -0.8487548828125, -0.805877685546875, -0.76300048828125, -0.720123291015625, -0.67724609375, -0.634368896484375, -0.59149169921875, -0.548614501953125, -0.5057373046875, -0.462860107421875, -0.41998291015625, -0.377105712890625, -0.334228515625, -0.291351318359375, -0.24847412109375, -0.205596923828125, -0.1627197265625, -0.119842529296875, -0.07696533203125, -0.034088134765625, 0.0087890625, 0.051666259765625, 0.09454345703125, 0.137420654296875, 0.1802978515625, 0.223175048828125, 0.26605224609375, 0.308929443359375, 0.351806640625, 0.394683837890625, 0.43756103515625, 0.480438232421875, 0.5233154296875, 0.566192626953125, 0.60906982421875, 0.651947021484375, 0.69482421875, 0.737701416015625, 0.78057861328125, 0.823455810546875, 0.8663330078125, 0.909210205078125, 0.95208740234375, 0.994964599609375, 1.037841796875, 1.080718994140625, 1.12359619140625, 1.166473388671875, 1.2093505859375, 1.252227783203125, 1.29510498046875, 1.337982177734375, 1.380859375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 13.0, 19.0, 18.0, 37.0, 49.0, 61.0, 116.0, 173.0, 274.0, 426.0, 801.0, 1574.0, 3218.0, 7855.0, 24748.0, 888202.0, 93343.0, 16556.0, 5688.0, 2476.0, 1178.0, 661.0, 373.0, 228.0, 138.0, 100.0, 61.0, 43.0, 33.0, 24.0, 10.0, 9.0, 16.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.36058807373046875, -0.3471527099609375, -0.33371734619140625, -0.320281982421875, -0.30684661865234375, -0.2934112548828125, -0.27997589111328125, -0.26654052734375, -0.25310516357421875, -0.2396697998046875, -0.22623443603515625, -0.212799072265625, -0.19936370849609375, -0.1859283447265625, -0.17249298095703125, -0.1590576171875, -0.14562225341796875, -0.1321868896484375, -0.11875152587890625, -0.105316162109375, -0.09188079833984375, -0.0784454345703125, -0.06501007080078125, -0.05157470703125, -0.03813934326171875, -0.0247039794921875, -0.01126861572265625, 0.002166748046875, 0.01560211181640625, 0.0290374755859375, 0.04247283935546875, 0.055908203125, 0.06934356689453125, 0.0827789306640625, 0.09621429443359375, 0.109649658203125, 0.12308502197265625, 0.1365203857421875, 0.14995574951171875, 0.16339111328125, 0.17682647705078125, 0.1902618408203125, 0.20369720458984375, 0.217132568359375, 0.23056793212890625, 0.2440032958984375, 0.25743865966796875, 0.2708740234375, 0.28430938720703125, 0.2977447509765625, 0.31118011474609375, 0.324615478515625, 0.33805084228515625, 0.3514862060546875, 0.36492156982421875, 0.37835693359375, 0.39179229736328125, 0.4052276611328125, 0.41866302490234375, 0.432098388671875, 0.44553375244140625, 0.4589691162109375, 0.47240447998046875, 0.48583984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 5.0, 5.0, 4.0, 14.0, 12.0, 20.0, 17.0, 10.0, 20.0, 33.0, 23.0, 33.0, 40.0, 47.0, 52.0, 45.0, 52.0, 42.0, 56.0, 41.0, 49.0, 32.0, 43.0, 34.0, 36.0, 22.0, 28.0, 30.0, 26.0, 18.0, 21.0, 13.0, 5.0, 11.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-3.552436828613281e-05, -3.449525684118271e-05, -3.3466145396232605e-05, -3.24370339512825e-05, -3.14079225063324e-05, -3.0378811061382294e-05, -2.934969961643219e-05, -2.8320588171482086e-05, -2.7291476726531982e-05, -2.626236528158188e-05, -2.5233253836631775e-05, -2.420414239168167e-05, -2.3175030946731567e-05, -2.2145919501781464e-05, -2.111680805683136e-05, -2.0087696611881256e-05, -1.9058585166931152e-05, -1.802947372198105e-05, -1.7000362277030945e-05, -1.597125083208084e-05, -1.4942139387130737e-05, -1.3913027942180634e-05, -1.288391649723053e-05, -1.1854805052280426e-05, -1.0825693607330322e-05, -9.796582162380219e-06, -8.767470717430115e-06, -7.738359272480011e-06, -6.709247827529907e-06, -5.6801363825798035e-06, -4.6510249376297e-06, -3.621913492679596e-06, -2.592802047729492e-06, -1.5636906027793884e-06, -5.345791578292847e-07, 4.945322871208191e-07, 1.5236437320709229e-06, 2.5527551770210266e-06, 3.5818666219711304e-06, 4.610978066921234e-06, 5.640089511871338e-06, 6.669200956821442e-06, 7.698312401771545e-06, 8.72742384672165e-06, 9.756535291671753e-06, 1.0785646736621857e-05, 1.181475818157196e-05, 1.2843869626522064e-05, 1.3872981071472168e-05, 1.4902092516422272e-05, 1.5931203961372375e-05, 1.696031540632248e-05, 1.7989426851272583e-05, 1.9018538296222687e-05, 2.004764974117279e-05, 2.1076761186122894e-05, 2.2105872631072998e-05, 2.3134984076023102e-05, 2.4164095520973206e-05, 2.519320696592331e-05, 2.6222318410873413e-05, 2.7251429855823517e-05, 2.828054130077362e-05, 2.9309652745723724e-05, 3.0338764190673828e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 9.0, 10.0, 19.0, 17.0, 34.0, 40.0, 53.0, 88.0, 149.0, 160.0, 290.0, 409.0, 618.0, 961.0, 1615.0, 2530.0, 4381.0, 7540.0, 13486.0, 24816.0, 47368.0, 90314.0, 165173.0, 237697.0, 200850.0, 116604.0, 61069.0, 31787.0, 17113.0, 9409.0, 5472.0, 3112.0, 1890.0, 1208.0, 767.0, 506.0, 322.0, 198.0, 132.0, 116.0, 67.0, 37.0, 34.0, 19.0, 18.0, 12.0, 4.0, 6.0, 5.0, 9.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.082763671875, -0.08006763458251953, -0.07737159729003906, -0.0746755599975586, -0.07197952270507812, -0.06928348541259766, -0.06658744812011719, -0.06389141082763672, -0.06119537353515625, -0.05849933624267578, -0.05580329895019531, -0.053107261657714844, -0.050411224365234375, -0.047715187072753906, -0.04501914978027344, -0.04232311248779297, -0.0396270751953125, -0.03693103790283203, -0.03423500061035156, -0.031538963317871094, -0.028842926025390625, -0.026146888732910156, -0.023450851440429688, -0.02075481414794922, -0.01805877685546875, -0.015362739562988281, -0.012666702270507812, -0.009970664978027344, -0.007274627685546875, -0.004578590393066406, -0.0018825531005859375, 0.0008134841918945312, 0.003509521484375, 0.006205558776855469, 0.008901596069335938, 0.011597633361816406, 0.014293670654296875, 0.016989707946777344, 0.019685745239257812, 0.02238178253173828, 0.02507781982421875, 0.02777385711669922, 0.030469894409179688, 0.033165931701660156, 0.035861968994140625, 0.038558006286621094, 0.04125404357910156, 0.04395008087158203, 0.0466461181640625, 0.04934215545654297, 0.05203819274902344, 0.054734230041503906, 0.057430267333984375, 0.060126304626464844, 0.06282234191894531, 0.06551837921142578, 0.06821441650390625, 0.07091045379638672, 0.07360649108886719, 0.07630252838134766, 0.07899856567382812, 0.0816946029663086, 0.08439064025878906, 0.08708667755126953, 0.08978271484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 8.0, 9.0, 10.0, 17.0, 30.0, 26.0, 33.0, 39.0, 56.0, 67.0, 69.0, 88.0, 79.0, 95.0, 79.0, 70.0, 49.0, 30.0, 35.0, 16.0, 33.0, 5.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0224761962890625, -0.021753787994384766, -0.02103137969970703, -0.020308971405029297, -0.019586563110351562, -0.018864154815673828, -0.018141746520996094, -0.01741933822631836, -0.016696929931640625, -0.01597452163696289, -0.015252113342285156, -0.014529705047607422, -0.013807296752929688, -0.013084888458251953, -0.012362480163574219, -0.011640071868896484, -0.01091766357421875, -0.010195255279541016, -0.009472846984863281, -0.008750438690185547, -0.008028030395507812, -0.007305622100830078, -0.006583213806152344, -0.005860805511474609, -0.005138397216796875, -0.004415988922119141, -0.0036935806274414062, -0.002971172332763672, -0.0022487640380859375, -0.0015263557434082031, -0.0008039474487304688, -8.153915405273438e-05, 0.000640869140625, 0.0013632774353027344, 0.0020856857299804688, 0.002808094024658203, 0.0035305023193359375, 0.004252910614013672, 0.004975318908691406, 0.005697727203369141, 0.006420135498046875, 0.007142543792724609, 0.007864952087402344, 0.008587360382080078, 0.009309768676757812, 0.010032176971435547, 0.010754585266113281, 0.011476993560791016, 0.01219940185546875, 0.012921810150146484, 0.013644218444824219, 0.014366626739501953, 0.015089035034179688, 0.015811443328857422, 0.016533851623535156, 0.01725625991821289, 0.017978668212890625, 0.01870107650756836, 0.019423484802246094, 0.020145893096923828, 0.020868301391601562, 0.021590709686279297, 0.02231311798095703, 0.023035526275634766, 0.0237579345703125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 10.0, 10.0, 16.0, 19.0, 20.0, 35.0, 50.0, 63.0, 71.0, 95.0, 79.0, 86.0, 92.0, 76.0, 53.0, 60.0, 44.0, 25.0, 23.0, 20.0, 12.0, 9.0, 6.0, 7.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.76797342300415, -7.5797271728515625, -7.391481399536133, -7.203235149383545, -7.014988899230957, -6.826742649078369, -6.638496398925781, -6.450250625610352, -6.262004375457764, -6.073758125305176, -5.885512351989746, -5.697266101837158, -5.50901985168457, -5.320773601531982, -5.1325273513793945, -4.944281578063965, -4.756035327911377, -4.567789077758789, -4.379543304443359, -4.1912970542907715, -4.003050804138184, -3.8148045539855957, -3.626558542251587, -3.438312530517578, -3.2500662803649902, -3.0618200302124023, -2.8735740184783936, -2.6853280067443848, -2.497081756591797, -2.308835506439209, -2.1205894947052, -1.9323433637619019, -1.7440977096557617, -1.5558515787124634, -1.367605447769165, -1.1793593168258667, -0.9911131858825684, -0.80286705493927, -0.6146209239959717, -0.42637479305267334, -0.238128662109375, -0.04988253116607666, 0.13836359977722168, 0.32660973072052, 0.5148558616638184, 0.7031019926071167, 0.891348123550415, 1.0795942544937134, 1.2678403854370117, 1.45608651638031, 1.6443326473236084, 1.8325787782669067, 2.020824909210205, 2.209071159362793, 2.3973171710968018, 2.5855631828308105, 2.7738094329833984, 2.9620556831359863, 3.150301694869995, 3.338547706604004, 3.526793956756592, 3.7150402069091797, 3.9032862186431885, 4.091532230377197, 4.279778480529785]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 8.0, 6.0, 14.0, 12.0, 14.0, 23.0, 23.0, 18.0, 24.0, 22.0, 29.0, 32.0, 28.0, 44.0, 41.0, 36.0, 37.0, 47.0, 43.0, 40.0, 34.0, 32.0, 46.0, 43.0, 36.0, 41.0, 30.0, 28.0, 21.0, 21.0, 21.0, 13.0, 18.0, 14.0, 8.0, 13.0, 10.0, 5.0, 4.0, 8.0, 2.0, 6.0, 3.0, 0.0, 3.0, 2.0], "bins": [-2.200934886932373, -2.141292095184326, -2.0816493034362793, -2.0220065116882324, -1.962363839149475, -1.9027210474014282, -1.8430782556533813, -1.7834354639053345, -1.7237927913665771, -1.6641499996185303, -1.6045072078704834, -1.5448644161224365, -1.4852217435836792, -1.4255789518356323, -1.3659361600875854, -1.3062933683395386, -1.2466505765914917, -1.1870077848434448, -1.127364993095398, -1.0677223205566406, -1.0080795288085938, -0.9484367370605469, -0.8887939453125, -0.8291511535644531, -0.769508421421051, -0.7098656296730042, -0.650222897529602, -0.5905801057815552, -0.5309373140335083, -0.4712945818901062, -0.4116517901420593, -0.35200902819633484, -0.2923663854598999, -0.23272362351417542, -0.17308084666728973, -0.11343806982040405, -0.053795307874679565, 0.005847454071044922, 0.0654902458190918, 0.12513300776481628, 0.18477576971054077, 0.24441853165626526, 0.30406129360198975, 0.3637040853500366, 0.4233468472957611, 0.4829896092414856, 0.5426324009895325, 0.6022751331329346, 0.6619179248809814, 0.7215607166290283, 0.7812034487724304, 0.8408462405204773, 0.9004889726638794, 0.9601317644119263, 1.0197745561599731, 1.07941734790802, 1.1390600204467773, 1.1987028121948242, 1.258345603942871, 1.317988395690918, 1.3776310682296753, 1.4372738599777222, 1.496916651725769, 1.556559443473816, 1.6162022352218628]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 18.0, 22.0, 26.0, 30.0, 56.0, 108.0, 183.0, 315.0, 472.0, 717.0, 1156.0, 1993.0, 3203.0, 5447.0, 8809.0, 14767.0, 24315.0, 39148.0, 61162.0, 90567.0, 122147.0, 143693.0, 145157.0, 123860.0, 92996.0, 63414.0, 40142.0, 25287.0, 15660.0, 9342.0, 5619.0, 3415.0, 2149.0, 1272.0, 708.0, 406.0, 270.0, 182.0, 121.0, 75.0, 39.0, 21.0, 22.0, 15.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.24609375, -2.175994873046875, -2.10589599609375, -2.035797119140625, -1.9656982421875, -1.895599365234375, -1.82550048828125, -1.755401611328125, -1.685302734375, -1.615203857421875, -1.54510498046875, -1.475006103515625, -1.4049072265625, -1.334808349609375, -1.26470947265625, -1.194610595703125, -1.12451171875, -1.054412841796875, -0.98431396484375, -0.914215087890625, -0.8441162109375, -0.774017333984375, -0.70391845703125, -0.633819580078125, -0.563720703125, -0.493621826171875, -0.42352294921875, -0.353424072265625, -0.2833251953125, -0.213226318359375, -0.14312744140625, -0.073028564453125, -0.0029296875, 0.067169189453125, 0.13726806640625, 0.207366943359375, 0.2774658203125, 0.347564697265625, 0.41766357421875, 0.487762451171875, 0.557861328125, 0.627960205078125, 0.69805908203125, 0.768157958984375, 0.8382568359375, 0.908355712890625, 0.97845458984375, 1.048553466796875, 1.11865234375, 1.188751220703125, 1.25885009765625, 1.328948974609375, 1.3990478515625, 1.469146728515625, 1.53924560546875, 1.609344482421875, 1.679443359375, 1.749542236328125, 1.81964111328125, 1.889739990234375, 1.9598388671875, 2.029937744140625, 2.10003662109375, 2.170135498046875, 2.240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 11.0, 8.0, 13.0, 12.0, 11.0, 9.0, 11.0, 24.0, 17.0, 25.0, 33.0, 30.0, 42.0, 24.0, 36.0, 29.0, 40.0, 32.0, 49.0, 45.0, 39.0, 46.0, 39.0, 49.0, 42.0, 32.0, 32.0, 26.0, 24.0, 32.0, 19.0, 18.0, 17.0, 14.0, 15.0, 9.0, 9.0, 7.0, 7.0, 2.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.341796875, -2.27349853515625, -2.2052001953125, -2.13690185546875, -2.068603515625, -2.00030517578125, -1.9320068359375, -1.86370849609375, -1.79541015625, -1.72711181640625, -1.6588134765625, -1.59051513671875, -1.522216796875, -1.45391845703125, -1.3856201171875, -1.31732177734375, -1.2490234375, -1.18072509765625, -1.1124267578125, -1.04412841796875, -0.975830078125, -0.90753173828125, -0.8392333984375, -0.77093505859375, -0.70263671875, -0.63433837890625, -0.5660400390625, -0.49774169921875, -0.429443359375, -0.36114501953125, -0.2928466796875, -0.22454833984375, -0.15625, -0.08795166015625, -0.0196533203125, 0.04864501953125, 0.116943359375, 0.18524169921875, 0.2535400390625, 0.32183837890625, 0.39013671875, 0.45843505859375, 0.5267333984375, 0.59503173828125, 0.663330078125, 0.73162841796875, 0.7999267578125, 0.86822509765625, 0.9365234375, 1.00482177734375, 1.0731201171875, 1.14141845703125, 1.209716796875, 1.27801513671875, 1.3463134765625, 1.41461181640625, 1.48291015625, 1.55120849609375, 1.6195068359375, 1.68780517578125, 1.756103515625, 1.82440185546875, 1.8927001953125, 1.96099853515625, 2.029296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 11.0, 24.0, 25.0, 37.0, 66.0, 108.0, 194.0, 271.0, 498.0, 773.0, 1300.0, 2156.0, 3589.0, 5979.0, 9990.0, 17235.0, 28268.0, 45354.0, 71001.0, 104484.0, 136716.0, 152765.0, 142265.0, 113275.0, 79743.0, 52043.0, 32112.0, 19446.0, 11701.0, 6750.0, 4192.0, 2370.0, 1476.0, 914.0, 555.0, 326.0, 198.0, 105.0, 78.0, 55.0, 37.0, 24.0, 15.0, 12.0, 4.0, 1.0, 4.0, 3.0], "bins": [-2.876953125, -2.800506591796875, -2.72406005859375, -2.647613525390625, -2.5711669921875, -2.494720458984375, -2.41827392578125, -2.341827392578125, -2.265380859375, -2.188934326171875, -2.11248779296875, -2.036041259765625, -1.9595947265625, -1.883148193359375, -1.80670166015625, -1.730255126953125, -1.65380859375, -1.577362060546875, -1.50091552734375, -1.424468994140625, -1.3480224609375, -1.271575927734375, -1.19512939453125, -1.118682861328125, -1.042236328125, -0.965789794921875, -0.88934326171875, -0.812896728515625, -0.7364501953125, -0.660003662109375, -0.58355712890625, -0.507110595703125, -0.4306640625, -0.354217529296875, -0.27777099609375, -0.201324462890625, -0.1248779296875, -0.048431396484375, 0.02801513671875, 0.104461669921875, 0.180908203125, 0.257354736328125, 0.33380126953125, 0.410247802734375, 0.4866943359375, 0.563140869140625, 0.63958740234375, 0.716033935546875, 0.79248046875, 0.868927001953125, 0.94537353515625, 1.021820068359375, 1.0982666015625, 1.174713134765625, 1.25115966796875, 1.327606201171875, 1.404052734375, 1.480499267578125, 1.55694580078125, 1.633392333984375, 1.7098388671875, 1.786285400390625, 1.86273193359375, 1.939178466796875, 2.015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 8.0, 13.0, 11.0, 17.0, 21.0, 15.0, 32.0, 27.0, 24.0, 29.0, 42.0, 36.0, 43.0, 36.0, 27.0, 43.0, 54.0, 48.0, 38.0, 52.0, 42.0, 39.0, 35.0, 26.0, 34.0, 25.0, 25.0, 31.0, 27.0, 20.0, 12.0, 10.0, 10.0, 3.0, 10.0, 6.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5126953125, -1.4666748046875, -1.420654296875, -1.3746337890625, -1.32861328125, -1.2825927734375, -1.236572265625, -1.1905517578125, -1.14453125, -1.0985107421875, -1.052490234375, -1.0064697265625, -0.96044921875, -0.9144287109375, -0.868408203125, -0.8223876953125, -0.7763671875, -0.7303466796875, -0.684326171875, -0.6383056640625, -0.59228515625, -0.5462646484375, -0.500244140625, -0.4542236328125, -0.408203125, -0.3621826171875, -0.316162109375, -0.2701416015625, -0.22412109375, -0.1781005859375, -0.132080078125, -0.0860595703125, -0.0400390625, 0.0059814453125, 0.052001953125, 0.0980224609375, 0.14404296875, 0.1900634765625, 0.236083984375, 0.2821044921875, 0.328125, 0.3741455078125, 0.420166015625, 0.4661865234375, 0.51220703125, 0.5582275390625, 0.604248046875, 0.6502685546875, 0.6962890625, 0.7423095703125, 0.788330078125, 0.8343505859375, 0.88037109375, 0.9263916015625, 0.972412109375, 1.0184326171875, 1.064453125, 1.1104736328125, 1.156494140625, 1.2025146484375, 1.24853515625, 1.2945556640625, 1.340576171875, 1.3865966796875, 1.4326171875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 18.0, 22.0, 19.0, 44.0, 56.0, 77.0, 137.0, 182.0, 253.0, 404.0, 559.0, 915.0, 1305.0, 2045.0, 3171.0, 5291.0, 8580.0, 14272.0, 24335.0, 42283.0, 71904.0, 116646.0, 163621.0, 181668.0, 153042.0, 103390.0, 62840.0, 37000.0, 21404.0, 12633.0, 7488.0, 4469.0, 2871.0, 1857.0, 1222.0, 862.0, 528.0, 381.0, 219.0, 188.0, 119.0, 65.0, 50.0, 37.0, 28.0, 12.0, 11.0, 7.0, 6.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4015045166015625, -1.353790283203125, -1.3060760498046875, -1.25836181640625, -1.2106475830078125, -1.162933349609375, -1.1152191162109375, -1.0675048828125, -1.0197906494140625, -0.972076416015625, -0.9243621826171875, -0.87664794921875, -0.8289337158203125, -0.781219482421875, -0.7335052490234375, -0.685791015625, -0.6380767822265625, -0.590362548828125, -0.5426483154296875, -0.49493408203125, -0.4472198486328125, -0.399505615234375, -0.3517913818359375, -0.3040771484375, -0.2563629150390625, -0.208648681640625, -0.1609344482421875, -0.11322021484375, -0.0655059814453125, -0.017791748046875, 0.0299224853515625, 0.07763671875, 0.1253509521484375, 0.173065185546875, 0.2207794189453125, 0.26849365234375, 0.3162078857421875, 0.363922119140625, 0.4116363525390625, 0.4593505859375, 0.5070648193359375, 0.554779052734375, 0.6024932861328125, 0.65020751953125, 0.6979217529296875, 0.745635986328125, 0.7933502197265625, 0.841064453125, 0.8887786865234375, 0.936492919921875, 0.9842071533203125, 1.03192138671875, 1.0796356201171875, 1.127349853515625, 1.1750640869140625, 1.2227783203125, 1.2704925537109375, 1.318206787109375, 1.3659210205078125, 1.41363525390625, 1.4613494873046875, 1.509063720703125, 1.5567779541015625, 1.6044921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 6.0, 21.0, 13.0, 25.0, 32.0, 37.0, 50.0, 50.0, 62.0, 63.0, 56.0, 79.0, 73.0, 71.0, 62.0, 42.0, 48.0, 41.0, 38.0, 24.0, 25.0, 11.0, 10.0, 7.0, 11.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015425682067871094, -0.0001490432769060135, -0.00014382973313331604, -0.0001386161893606186, -0.00013340264558792114, -0.0001281891018152237, -0.00012297555804252625, -0.0001177620142698288, -0.00011254847049713135, -0.0001073349267244339, -0.00010212138295173645, -9.6907839179039e-05, -9.169429540634155e-05, -8.64807516336441e-05, -8.126720786094666e-05, -7.60536640882492e-05, -7.084012031555176e-05, -6.562657654285431e-05, -6.041303277015686e-05, -5.519948899745941e-05, -4.998594522476196e-05, -4.4772401452064514e-05, -3.9558857679367065e-05, -3.434531390666962e-05, -2.9131770133972168e-05, -2.391822636127472e-05, -1.870468258857727e-05, -1.3491138815879822e-05, -8.277595043182373e-06, -3.0640512704849243e-06, 2.1494925022125244e-06, 7.363036274909973e-06, 1.2576580047607422e-05, 1.779012382030487e-05, 2.300366759300232e-05, 2.8217211365699768e-05, 3.343075513839722e-05, 3.8644298911094666e-05, 4.3857842683792114e-05, 4.907138645648956e-05, 5.428493022918701e-05, 5.949847400188446e-05, 6.471201777458191e-05, 6.992556154727936e-05, 7.51391053199768e-05, 8.035264909267426e-05, 8.55661928653717e-05, 9.077973663806915e-05, 9.59932804107666e-05, 0.00010120682418346405, 0.0001064203679561615, 0.00011163391172885895, 0.0001168474555015564, 0.00012206099927425385, 0.0001272745430469513, 0.00013248808681964874, 0.0001377016305923462, 0.00014291517436504364, 0.0001481287181377411, 0.00015334226191043854, 0.00015855580568313599, 0.00016376934945583344, 0.00016898289322853088, 0.00017419643700122833, 0.00017940998077392578]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 28.0, 21.0, 50.0, 65.0, 89.0, 170.0, 259.0, 365.0, 624.0, 937.0, 1558.0, 2574.0, 4229.0, 7426.0, 13417.0, 24421.0, 43942.0, 78330.0, 128056.0, 178636.0, 190180.0, 150247.0, 96743.0, 55915.0, 30554.0, 16522.0, 9376.0, 5512.0, 3145.0, 1929.0, 1162.0, 710.0, 469.0, 298.0, 205.0, 104.0, 91.0, 56.0, 34.0, 18.0, 12.0, 13.0, 10.0, 9.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4453125, -1.39898681640625, -1.3526611328125, -1.30633544921875, -1.260009765625, -1.21368408203125, -1.1673583984375, -1.12103271484375, -1.07470703125, -1.02838134765625, -0.9820556640625, -0.93572998046875, -0.889404296875, -0.84307861328125, -0.7967529296875, -0.75042724609375, -0.7041015625, -0.65777587890625, -0.6114501953125, -0.56512451171875, -0.518798828125, -0.47247314453125, -0.4261474609375, -0.37982177734375, -0.33349609375, -0.28717041015625, -0.2408447265625, -0.19451904296875, -0.148193359375, -0.10186767578125, -0.0555419921875, -0.00921630859375, 0.037109375, 0.08343505859375, 0.1297607421875, 0.17608642578125, 0.222412109375, 0.26873779296875, 0.3150634765625, 0.36138916015625, 0.40771484375, 0.45404052734375, 0.5003662109375, 0.54669189453125, 0.593017578125, 0.63934326171875, 0.6856689453125, 0.73199462890625, 0.7783203125, 0.82464599609375, 0.8709716796875, 0.91729736328125, 0.963623046875, 1.00994873046875, 1.0562744140625, 1.10260009765625, 1.14892578125, 1.19525146484375, 1.2415771484375, 1.28790283203125, 1.334228515625, 1.38055419921875, 1.4268798828125, 1.47320556640625, 1.51953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 3.0, 9.0, 10.0, 15.0, 14.0, 16.0, 15.0, 25.0, 33.0, 20.0, 45.0, 40.0, 72.0, 68.0, 52.0, 62.0, 77.0, 68.0, 55.0, 46.0, 51.0, 44.0, 31.0, 24.0, 23.0, 18.0, 7.0, 12.0, 7.0, 3.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.4009056091308594, -0.38823699951171875, -0.3755683898925781, -0.3628997802734375, -0.3502311706542969, -0.33756256103515625, -0.3248939514160156, -0.312225341796875, -0.2995567321777344, -0.28688812255859375, -0.2742195129394531, -0.2615509033203125, -0.24888229370117188, -0.23621368408203125, -0.22354507446289062, -0.21087646484375, -0.19820785522460938, -0.18553924560546875, -0.17287063598632812, -0.1602020263671875, -0.14753341674804688, -0.13486480712890625, -0.12219619750976562, -0.109527587890625, -0.09685897827148438, -0.08419036865234375, -0.07152175903320312, -0.0588531494140625, -0.046184539794921875, -0.03351593017578125, -0.020847320556640625, -0.0081787109375, 0.004489898681640625, 0.01715850830078125, 0.029827117919921875, 0.0424957275390625, 0.055164337158203125, 0.06783294677734375, 0.08050155639648438, 0.093170166015625, 0.10583877563476562, 0.11850738525390625, 0.13117599487304688, 0.1438446044921875, 0.15651321411132812, 0.16918182373046875, 0.18185043334960938, 0.19451904296875, 0.20718765258789062, 0.21985626220703125, 0.23252487182617188, 0.2451934814453125, 0.2578620910644531, 0.27053070068359375, 0.2831993103027344, 0.295867919921875, 0.3085365295410156, 0.32120513916015625, 0.3338737487792969, 0.3465423583984375, 0.3592109680175781, 0.37187957763671875, 0.3845481872558594, 0.397216796875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 8.0, 27.0, 19.0, 37.0, 32.0, 51.0, 69.0, 80.0, 92.0, 104.0, 77.0, 83.0, 72.0, 65.0, 35.0, 32.0, 28.0, 17.0, 21.0, 13.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.787813186645508, -7.59655237197876, -7.40529203414917, -7.214031219482422, -7.022770881652832, -6.831510066986084, -6.640249252319336, -6.448988914489746, -6.257728576660156, -6.066467761993408, -5.875207424163818, -5.68394660949707, -5.4926862716674805, -5.301425457000732, -5.110164642333984, -4.9189043045043945, -4.7276434898376465, -4.536382675170898, -4.345122337341309, -4.1538615226745605, -3.9626011848449707, -3.7713403701782227, -3.5800797939300537, -3.3888192176818848, -3.197558641433716, -3.006298065185547, -2.815037488937378, -2.623776912689209, -2.432516098022461, -2.241255760192871, -2.049994945526123, -1.858734369277954, -1.667473316192627, -1.476212739944458, -1.284952163696289, -1.0936914682388306, -0.9024308919906616, -0.7111703157424927, -0.5199096202850342, -0.32864904403686523, -0.1373884677886963, 0.053872138261795044, 0.24513274431228638, 0.4363933801651001, 0.627653956413269, 0.818914532661438, 1.0101752281188965, 1.2014358043670654, 1.3926963806152344, 1.5839569568634033, 1.7752175331115723, 1.9664782285690308, 2.15773868560791, 2.348999500274658, 2.540260076522827, 2.731520652770996, 2.922781229019165, 3.114041805267334, 3.305302381515503, 3.496562957763672, 3.68782377243042, 3.8790841102600098, 4.070344924926758, 4.261605262756348, 4.452866077423096]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 11.0, 10.0, 10.0, 13.0, 17.0, 17.0, 19.0, 18.0, 21.0, 33.0, 34.0, 29.0, 30.0, 37.0, 25.0, 37.0, 36.0, 42.0, 46.0, 46.0, 35.0, 39.0, 33.0, 33.0, 34.0, 22.0, 33.0, 16.0, 28.0, 27.0, 18.0, 23.0, 14.0, 16.0, 9.0, 19.0, 10.0, 17.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-2.103912353515625, -2.04496431350708, -1.9860161542892456, -1.9270681142807007, -1.8681199550628662, -1.8091719150543213, -1.7502238750457764, -1.6912758350372314, -1.632327675819397, -1.573379635810852, -1.5144314765930176, -1.4554834365844727, -1.3965353965759277, -1.3375872373580933, -1.2786391973495483, -1.2196910381317139, -1.160742998123169, -1.101794958114624, -1.0428467988967896, -0.9838987588882446, -0.9249506592750549, -0.8660025596618652, -0.8070545196533203, -0.7481064200401306, -0.6891583204269409, -0.6302102208137512, -0.5712621212005615, -0.5123140811920166, -0.4533659815788269, -0.3944178819656372, -0.3354698121547699, -0.2765217423439026, -0.21757376194000244, -0.15862567722797394, -0.09967759251594543, -0.04072950780391693, 0.018218576908111572, 0.07716667652130127, 0.13611474633216858, 0.1950628161430359, 0.2540109157562256, 0.3129590153694153, 0.3719070851802826, 0.4308551549911499, 0.4898032546043396, 0.5487513542175293, 0.6076993942260742, 0.6666474938392639, 0.7255955934524536, 0.7845436930656433, 0.843491792678833, 0.9024398326873779, 0.9613879323005676, 1.0203360319137573, 1.0792840719223022, 1.1382322311401367, 1.1971802711486816, 1.2561283111572266, 1.315076470375061, 1.374024510383606, 1.4329726696014404, 1.4919207096099854, 1.5508687496185303, 1.6098167896270752, 1.6687649488449097]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 10.0, 22.0, 25.0, 44.0, 76.0, 117.0, 191.0, 276.0, 462.0, 806.0, 1383.0, 2191.0, 3634.0, 6327.0, 11467.0, 20756.0, 39748.0, 81050.0, 178953.0, 436498.0, 997004.0, 1223554.0, 672831.0, 278304.0, 120663.0, 57059.0, 28288.0, 14712.0, 7811.0, 4306.0, 2382.0, 1377.0, 806.0, 441.0, 278.0, 170.0, 98.0, 50.0, 36.0, 25.0, 23.0, 5.0, 5.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.26519775390625, -4.1241455078125, -3.98309326171875, -3.842041015625, -3.70098876953125, -3.5599365234375, -3.41888427734375, -3.27783203125, -3.13677978515625, -2.9957275390625, -2.85467529296875, -2.713623046875, -2.57257080078125, -2.4315185546875, -2.29046630859375, -2.1494140625, -2.00836181640625, -1.8673095703125, -1.72625732421875, -1.585205078125, -1.44415283203125, -1.3031005859375, -1.16204833984375, -1.02099609375, -0.87994384765625, -0.7388916015625, -0.59783935546875, -0.456787109375, -0.31573486328125, -0.1746826171875, -0.03363037109375, 0.107421875, 0.24847412109375, 0.3895263671875, 0.53057861328125, 0.671630859375, 0.81268310546875, 0.9537353515625, 1.09478759765625, 1.23583984375, 1.37689208984375, 1.5179443359375, 1.65899658203125, 1.800048828125, 1.94110107421875, 2.0821533203125, 2.22320556640625, 2.3642578125, 2.50531005859375, 2.6463623046875, 2.78741455078125, 2.928466796875, 3.06951904296875, 3.2105712890625, 3.35162353515625, 3.49267578125, 3.63372802734375, 3.7747802734375, 3.91583251953125, 4.056884765625, 4.19793701171875, 4.3389892578125, 4.48004150390625, 4.62109375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 4.0, 5.0, 6.0, 22.0, 12.0, 19.0, 27.0, 25.0, 29.0, 26.0, 39.0, 38.0, 36.0, 43.0, 31.0, 44.0, 35.0, 36.0, 54.0, 35.0, 52.0, 49.0, 40.0, 23.0, 38.0, 37.0, 30.0, 21.0, 21.0, 35.0, 15.0, 9.0, 10.0, 6.0, 12.0, 6.0, 6.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.078125, -2.019866943359375, -1.96160888671875, -1.903350830078125, -1.8450927734375, -1.786834716796875, -1.72857666015625, -1.670318603515625, -1.612060546875, -1.553802490234375, -1.49554443359375, -1.437286376953125, -1.3790283203125, -1.320770263671875, -1.26251220703125, -1.204254150390625, -1.14599609375, -1.087738037109375, -1.02947998046875, -0.971221923828125, -0.9129638671875, -0.854705810546875, -0.79644775390625, -0.738189697265625, -0.679931640625, -0.621673583984375, -0.56341552734375, -0.505157470703125, -0.4468994140625, -0.388641357421875, -0.33038330078125, -0.272125244140625, -0.2138671875, -0.155609130859375, -0.09735107421875, -0.039093017578125, 0.0191650390625, 0.077423095703125, 0.13568115234375, 0.193939208984375, 0.252197265625, 0.310455322265625, 0.36871337890625, 0.426971435546875, 0.4852294921875, 0.543487548828125, 0.60174560546875, 0.660003662109375, 0.71826171875, 0.776519775390625, 0.83477783203125, 0.893035888671875, 0.9512939453125, 1.009552001953125, 1.06781005859375, 1.126068115234375, 1.184326171875, 1.242584228515625, 1.30084228515625, 1.359100341796875, 1.4173583984375, 1.475616455078125, 1.53387451171875, 1.592132568359375, 1.650390625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 11.0, 14.0, 27.0, 40.0, 45.0, 85.0, 134.0, 227.0, 335.0, 582.0, 967.0, 1473.0, 2510.0, 4315.0, 7428.0, 13143.0, 24089.0, 44776.0, 86996.0, 171692.0, 352864.0, 693910.0, 1039472.0, 840922.0, 451720.0, 221802.0, 110664.0, 56175.0, 29964.0, 16329.0, 9061.0, 4959.0, 3030.0, 1818.0, 1090.0, 646.0, 337.0, 231.0, 144.0, 103.0, 64.0, 32.0, 28.0, 10.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.16015625, -4.0245361328125, -3.888916015625, -3.7532958984375, -3.61767578125, -3.4820556640625, -3.346435546875, -3.2108154296875, -3.0751953125, -2.9395751953125, -2.803955078125, -2.6683349609375, -2.53271484375, -2.3970947265625, -2.261474609375, -2.1258544921875, -1.990234375, -1.8546142578125, -1.718994140625, -1.5833740234375, -1.44775390625, -1.3121337890625, -1.176513671875, -1.0408935546875, -0.9052734375, -0.7696533203125, -0.634033203125, -0.4984130859375, -0.36279296875, -0.2271728515625, -0.091552734375, 0.0440673828125, 0.1796875, 0.3153076171875, 0.450927734375, 0.5865478515625, 0.72216796875, 0.8577880859375, 0.993408203125, 1.1290283203125, 1.2646484375, 1.4002685546875, 1.535888671875, 1.6715087890625, 1.80712890625, 1.9427490234375, 2.078369140625, 2.2139892578125, 2.349609375, 2.4852294921875, 2.620849609375, 2.7564697265625, 2.89208984375, 3.0277099609375, 3.163330078125, 3.2989501953125, 3.4345703125, 3.5701904296875, 3.705810546875, 3.8414306640625, 3.97705078125, 4.1126708984375, 4.248291015625, 4.3839111328125, 4.51953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 11.0, 11.0, 14.0, 20.0, 32.0, 33.0, 47.0, 68.0, 81.0, 97.0, 99.0, 135.0, 137.0, 181.0, 201.0, 219.0, 245.0, 230.0, 285.0, 258.0, 215.0, 241.0, 199.0, 165.0, 136.0, 137.0, 100.0, 87.0, 84.0, 71.0, 52.0, 40.0, 23.0, 15.0, 23.0, 17.0, 6.0, 9.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.99072265625, -0.9569778442382812, -0.9232330322265625, -0.8894882202148438, -0.855743408203125, -0.8219985961914062, -0.7882537841796875, -0.7545089721679688, -0.72076416015625, -0.6870193481445312, -0.6532745361328125, -0.6195297241210938, -0.585784912109375, -0.5520401000976562, -0.5182952880859375, -0.48455047607421875, -0.4508056640625, -0.41706085205078125, -0.3833160400390625, -0.34957122802734375, -0.315826416015625, -0.28208160400390625, -0.2483367919921875, -0.21459197998046875, -0.18084716796875, -0.14710235595703125, -0.1133575439453125, -0.07961273193359375, -0.045867919921875, -0.01212310791015625, 0.0216217041015625, 0.05536651611328125, 0.089111328125, 0.12285614013671875, 0.1566009521484375, 0.19034576416015625, 0.224090576171875, 0.25783538818359375, 0.2915802001953125, 0.32532501220703125, 0.35906982421875, 0.39281463623046875, 0.4265594482421875, 0.46030426025390625, 0.494049072265625, 0.5277938842773438, 0.5615386962890625, 0.5952835083007812, 0.6290283203125, 0.6627731323242188, 0.6965179443359375, 0.7302627563476562, 0.764007568359375, 0.7977523803710938, 0.8314971923828125, 0.8652420043945312, 0.89898681640625, 0.9327316284179688, 0.9664764404296875, 1.0002212524414062, 1.033966064453125, 1.0677108764648438, 1.1014556884765625, 1.1352005004882812, 1.1689453125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 14.0, 12.0, 16.0, 16.0, 25.0, 49.0, 47.0, 55.0, 70.0, 64.0, 74.0, 84.0, 74.0, 80.0, 68.0, 57.0, 26.0, 30.0, 21.0, 25.0, 19.0, 8.0, 13.0, 14.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.886803150177002, -6.720529079437256, -6.554255485534668, -6.387981414794922, -6.221707344055176, -6.05543327331543, -5.889159202575684, -5.722885608673096, -5.55661153793335, -5.3903374671936035, -5.224063873291016, -5.0577898025512695, -4.891515731811523, -4.725241661071777, -4.558967590332031, -4.392693996429443, -4.226419925689697, -4.060145854949951, -3.893872022628784, -3.727598190307617, -3.561324119567871, -3.395050048828125, -3.228776216506958, -3.062502384185791, -2.896228313446045, -2.729954242706299, -2.563680410385132, -2.397406578063965, -2.2311325073242188, -2.0648584365844727, -1.8985846042633057, -1.7323106527328491, -1.5660364627838135, -1.399762511253357, -1.2334885597229004, -1.0672146081924438, -0.9009406566619873, -0.7346667051315308, -0.5683927536010742, -0.4021188020706177, -0.23584485054016113, -0.06957089900970459, 0.09670305252075195, 0.2629770040512085, 0.42925095558166504, 0.5955249071121216, 0.7617988586425781, 0.9280728101730347, 1.0943467617034912, 1.2606207132339478, 1.4268946647644043, 1.5931686162948608, 1.7594425678253174, 1.925716519355774, 2.0919904708862305, 2.2582645416259766, 2.4245383739471436, 2.5908122062683105, 2.7570862770080566, 2.9233603477478027, 3.0896341800689697, 3.2559080123901367, 3.422182083129883, 3.588456153869629, 3.754729986190796]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 5.0, 8.0, 4.0, 12.0, 20.0, 12.0, 25.0, 15.0, 20.0, 19.0, 26.0, 31.0, 31.0, 35.0, 33.0, 38.0, 50.0, 40.0, 32.0, 44.0, 44.0, 31.0, 42.0, 34.0, 29.0, 29.0, 20.0, 32.0, 25.0, 20.0, 19.0, 26.0, 20.0, 17.0, 14.0, 18.0, 11.0, 11.0, 8.0, 5.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8708324432373047, -1.8121438026428223, -1.7534551620483398, -1.6947665214538574, -1.636077880859375, -1.5773892402648926, -1.5187007188796997, -1.4600120782852173, -1.4013234376907349, -1.3426347970962524, -1.28394615650177, -1.2252575159072876, -1.1665689945220947, -1.1078803539276123, -1.0491917133331299, -0.9905030727386475, -0.931814432144165, -0.8731257915496826, -0.8144371509552002, -0.7557485699653625, -0.6970599293708801, -0.6383712887763977, -0.5796827077865601, -0.5209940671920776, -0.4623054265975952, -0.4036167860031128, -0.34492817521095276, -0.2862395644187927, -0.2275509238243103, -0.16886228322982788, -0.11017367243766785, -0.05148506164550781, 0.00720369815826416, 0.06589232385158539, 0.12458094954490662, 0.18326957523822784, 0.24195820093154907, 0.3006468415260315, 0.35933545231819153, 0.41802406311035156, 0.476712703704834, 0.5354013442993164, 0.5940899848937988, 0.6527785658836365, 0.7114672064781189, 0.7701558470726013, 0.828844428062439, 0.8875330686569214, 0.9462217092514038, 1.0049103498458862, 1.0635989904403687, 1.122287631034851, 1.180976152420044, 1.2396647930145264, 1.2983534336090088, 1.3570420742034912, 1.4157307147979736, 1.474419355392456, 1.5331079959869385, 1.591796636581421, 1.6504852771759033, 1.7091739177703857, 1.7678624391555786, 1.826551079750061, 1.8852397203445435]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 15.0, 22.0, 37.0, 46.0, 98.0, 126.0, 216.0, 317.0, 495.0, 790.0, 1301.0, 2005.0, 3435.0, 5767.0, 10168.0, 18038.0, 32493.0, 58886.0, 105221.0, 169738.0, 210826.0, 175578.0, 111063.0, 62661.0, 34362.0, 19025.0, 10695.0, 5939.0, 3474.0, 2229.0, 1299.0, 751.0, 529.0, 307.0, 216.0, 148.0, 79.0, 44.0, 35.0, 17.0, 16.0, 12.0, 14.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.328125, -0.31862640380859375, -0.3091278076171875, -0.29962921142578125, -0.290130615234375, -0.28063201904296875, -0.2711334228515625, -0.26163482666015625, -0.25213623046875, -0.24263763427734375, -0.2331390380859375, -0.22364044189453125, -0.214141845703125, -0.20464324951171875, -0.1951446533203125, -0.18564605712890625, -0.1761474609375, -0.16664886474609375, -0.1571502685546875, -0.14765167236328125, -0.138153076171875, -0.12865447998046875, -0.1191558837890625, -0.10965728759765625, -0.10015869140625, -0.09066009521484375, -0.0811614990234375, -0.07166290283203125, -0.062164306640625, -0.05266571044921875, -0.0431671142578125, -0.03366851806640625, -0.024169921875, -0.01467132568359375, -0.0051727294921875, 0.00432586669921875, 0.013824462890625, 0.02332305908203125, 0.0328216552734375, 0.04232025146484375, 0.05181884765625, 0.06131744384765625, 0.0708160400390625, 0.08031463623046875, 0.089813232421875, 0.09931182861328125, 0.1088104248046875, 0.11830902099609375, 0.1278076171875, 0.13730621337890625, 0.1468048095703125, 0.15630340576171875, 0.165802001953125, 0.17530059814453125, 0.1847991943359375, 0.19429779052734375, 0.20379638671875, 0.21329498291015625, 0.2227935791015625, 0.23229217529296875, 0.241790771484375, 0.25128936767578125, 0.2607879638671875, 0.27028656005859375, 0.27978515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 7.0, 4.0, 9.0, 10.0, 6.0, 14.0, 8.0, 16.0, 17.0, 18.0, 21.0, 26.0, 26.0, 31.0, 30.0, 46.0, 27.0, 45.0, 34.0, 48.0, 27.0, 43.0, 38.0, 37.0, 30.0, 39.0, 32.0, 36.0, 30.0, 31.0, 24.0, 19.0, 13.0, 19.0, 22.0, 21.0, 12.0, 11.0, 15.0, 12.0, 6.0, 8.0, 6.0, 6.0, 7.0, 6.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.296875, -2.228546142578125, -2.16021728515625, -2.091888427734375, -2.0235595703125, -1.955230712890625, -1.88690185546875, -1.818572998046875, -1.750244140625, -1.681915283203125, -1.61358642578125, -1.545257568359375, -1.4769287109375, -1.408599853515625, -1.34027099609375, -1.271942138671875, -1.20361328125, -1.135284423828125, -1.06695556640625, -0.998626708984375, -0.9302978515625, -0.861968994140625, -0.79364013671875, -0.725311279296875, -0.656982421875, -0.588653564453125, -0.52032470703125, -0.451995849609375, -0.3836669921875, -0.315338134765625, -0.24700927734375, -0.178680419921875, -0.1103515625, -0.042022705078125, 0.02630615234375, 0.094635009765625, 0.1629638671875, 0.231292724609375, 0.29962158203125, 0.367950439453125, 0.436279296875, 0.504608154296875, 0.57293701171875, 0.641265869140625, 0.7095947265625, 0.777923583984375, 0.84625244140625, 0.914581298828125, 0.98291015625, 1.051239013671875, 1.11956787109375, 1.187896728515625, 1.2562255859375, 1.324554443359375, 1.39288330078125, 1.461212158203125, 1.529541015625, 1.597869873046875, 1.66619873046875, 1.734527587890625, 1.8028564453125, 1.871185302734375, 1.93951416015625, 2.007843017578125, 2.076171875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 5.0, 9.0, 11.0, 27.0, 29.0, 48.0, 71.0, 70.0, 132.0, 185.0, 259.0, 443.0, 791.0, 1316.0, 2533.0, 5318.0, 12331.0, 33200.0, 741366.0, 206411.0, 24797.0, 9747.0, 4332.0, 2118.0, 1162.0, 620.0, 423.0, 244.0, 185.0, 110.0, 73.0, 44.0, 39.0, 25.0, 23.0, 14.0, 9.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.060546875, -1.0272674560546875, -0.993988037109375, -0.9607086181640625, -0.92742919921875, -0.8941497802734375, -0.860870361328125, -0.8275909423828125, -0.7943115234375, -0.7610321044921875, -0.727752685546875, -0.6944732666015625, -0.66119384765625, -0.6279144287109375, -0.594635009765625, -0.5613555908203125, -0.528076171875, -0.4947967529296875, -0.461517333984375, -0.4282379150390625, -0.39495849609375, -0.3616790771484375, -0.328399658203125, -0.2951202392578125, -0.2618408203125, -0.2285614013671875, -0.195281982421875, -0.1620025634765625, -0.12872314453125, -0.0954437255859375, -0.062164306640625, -0.0288848876953125, 0.00439453125, 0.0376739501953125, 0.070953369140625, 0.1042327880859375, 0.13751220703125, 0.1707916259765625, 0.204071044921875, 0.2373504638671875, 0.2706298828125, 0.3039093017578125, 0.337188720703125, 0.3704681396484375, 0.40374755859375, 0.4370269775390625, 0.470306396484375, 0.5035858154296875, 0.536865234375, 0.5701446533203125, 0.603424072265625, 0.6367034912109375, 0.66998291015625, 0.7032623291015625, 0.736541748046875, 0.7698211669921875, 0.8031005859375, 0.8363800048828125, 0.869659423828125, 0.9029388427734375, 0.93621826171875, 0.9694976806640625, 1.002777099609375, 1.0360565185546875, 1.0693359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 9.0, 10.0, 22.0, 21.0, 20.0, 27.0, 28.0, 25.0, 27.0, 26.0, 33.0, 33.0, 46.0, 38.0, 47.0, 46.0, 45.0, 35.0, 45.0, 43.0, 42.0, 55.0, 46.0, 29.0, 18.0, 30.0, 12.0, 24.0, 21.0, 16.0, 17.0, 9.0, 11.0, 7.0, 2.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8232421875, -1.772857666015625, -1.72247314453125, -1.672088623046875, -1.6217041015625, -1.571319580078125, -1.52093505859375, -1.470550537109375, -1.420166015625, -1.369781494140625, -1.31939697265625, -1.269012451171875, -1.2186279296875, -1.168243408203125, -1.11785888671875, -1.067474365234375, -1.01708984375, -0.966705322265625, -0.91632080078125, -0.865936279296875, -0.8155517578125, -0.765167236328125, -0.71478271484375, -0.664398193359375, -0.614013671875, -0.563629150390625, -0.51324462890625, -0.462860107421875, -0.4124755859375, -0.362091064453125, -0.31170654296875, -0.261322021484375, -0.2109375, -0.160552978515625, -0.11016845703125, -0.059783935546875, -0.0093994140625, 0.040985107421875, 0.09136962890625, 0.141754150390625, 0.192138671875, 0.242523193359375, 0.29290771484375, 0.343292236328125, 0.3936767578125, 0.444061279296875, 0.49444580078125, 0.544830322265625, 0.59521484375, 0.645599365234375, 0.69598388671875, 0.746368408203125, 0.7967529296875, 0.847137451171875, 0.89752197265625, 0.947906494140625, 0.998291015625, 1.048675537109375, 1.09906005859375, 1.149444580078125, 1.1998291015625, 1.250213623046875, 1.30059814453125, 1.350982666015625, 1.4013671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 14.0, 18.0, 27.0, 28.0, 28.0, 43.0, 54.0, 91.0, 151.0, 257.0, 448.0, 792.0, 1420.0, 2747.0, 5786.0, 13103.0, 36279.0, 903133.0, 53276.0, 16635.0, 6940.0, 3262.0, 1708.0, 913.0, 529.0, 292.0, 185.0, 119.0, 75.0, 51.0, 32.0, 31.0, 20.0, 15.0, 5.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0], "bins": [-0.338623046875, -0.3296241760253906, -0.32062530517578125, -0.3116264343261719, -0.3026275634765625, -0.2936286926269531, -0.28462982177734375, -0.2756309509277344, -0.266632080078125, -0.2576332092285156, -0.24863433837890625, -0.23963546752929688, -0.2306365966796875, -0.22163772583007812, -0.21263885498046875, -0.20363998413085938, -0.19464111328125, -0.18564224243164062, -0.17664337158203125, -0.16764450073242188, -0.1586456298828125, -0.14964675903320312, -0.14064788818359375, -0.13164901733398438, -0.122650146484375, -0.11365127563476562, -0.10465240478515625, -0.09565353393554688, -0.0866546630859375, -0.07765579223632812, -0.06865692138671875, -0.059658050537109375, -0.0506591796875, -0.041660308837890625, -0.03266143798828125, -0.023662567138671875, -0.0146636962890625, -0.005664825439453125, 0.00333404541015625, 0.012332916259765625, 0.021331787109375, 0.030330657958984375, 0.03932952880859375, 0.048328399658203125, 0.0573272705078125, 0.06632614135742188, 0.07532501220703125, 0.08432388305664062, 0.09332275390625, 0.10232162475585938, 0.11132049560546875, 0.12031936645507812, 0.1293182373046875, 0.13831710815429688, 0.14731597900390625, 0.15631484985351562, 0.165313720703125, 0.17431259155273438, 0.18331146240234375, 0.19231033325195312, 0.2013092041015625, 0.21030807495117188, 0.21930694580078125, 0.22830581665039062, 0.2373046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 4.0, 5.0, 10.0, 8.0, 17.0, 21.0, 18.0, 26.0, 20.0, 30.0, 40.0, 43.0, 37.0, 48.0, 47.0, 37.0, 56.0, 58.0, 51.0, 53.0, 54.0, 42.0, 45.0, 35.0, 30.0, 23.0, 18.0, 22.0, 9.0, 18.0, 14.0, 13.0, 7.0, 8.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.719329833984375e-05, -3.612879663705826e-05, -3.5064294934272766e-05, -3.3999793231487274e-05, -3.293529152870178e-05, -3.187078982591629e-05, -3.08062881231308e-05, -2.9741786420345306e-05, -2.8677284717559814e-05, -2.7612783014774323e-05, -2.654828131198883e-05, -2.548377960920334e-05, -2.4419277906417847e-05, -2.3354776203632355e-05, -2.2290274500846863e-05, -2.122577279806137e-05, -2.016127109527588e-05, -1.9096769392490387e-05, -1.8032267689704895e-05, -1.6967765986919403e-05, -1.590326428413391e-05, -1.483876258134842e-05, -1.3774260878562927e-05, -1.2709759175777435e-05, -1.1645257472991943e-05, -1.0580755770206451e-05, -9.51625406742096e-06, -8.451752364635468e-06, -7.387250661849976e-06, -6.322748959064484e-06, -5.258247256278992e-06, -4.1937455534935e-06, -3.129243850708008e-06, -2.064742147922516e-06, -1.000240445137024e-06, 6.426125764846802e-08, 1.12876296043396e-06, 2.193264663219452e-06, 3.257766366004944e-06, 4.322268068790436e-06, 5.386769771575928e-06, 6.45127147436142e-06, 7.515773177146912e-06, 8.580274879932404e-06, 9.644776582717896e-06, 1.0709278285503387e-05, 1.177377998828888e-05, 1.2838281691074371e-05, 1.3902783393859863e-05, 1.4967285096645355e-05, 1.6031786799430847e-05, 1.709628850221634e-05, 1.816079020500183e-05, 1.9225291907787323e-05, 2.0289793610572815e-05, 2.1354295313358307e-05, 2.24187970161438e-05, 2.348329871892929e-05, 2.4547800421714783e-05, 2.5612302124500275e-05, 2.6676803827285767e-05, 2.774130553007126e-05, 2.880580723285675e-05, 2.9870308935642242e-05, 3.0934810638427734e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 12.0, 13.0, 26.0, 37.0, 44.0, 55.0, 83.0, 94.0, 138.0, 230.0, 340.0, 451.0, 632.0, 1040.0, 1523.0, 2276.0, 3626.0, 5991.0, 9577.0, 16396.0, 28144.0, 49759.0, 89647.0, 150337.0, 208660.0, 189692.0, 123210.0, 70081.0, 39741.0, 22222.0, 12958.0, 7688.0, 4773.0, 2958.0, 1933.0, 1293.0, 934.0, 623.0, 409.0, 259.0, 188.0, 161.0, 86.0, 63.0, 48.0, 28.0, 21.0, 19.0, 9.0, 10.0, 9.0, 2.0, 2.0, 2.0], "bins": [-0.07452392578125, -0.07238197326660156, -0.07024002075195312, -0.06809806823730469, -0.06595611572265625, -0.06381416320800781, -0.061672210693359375, -0.05953025817871094, -0.0573883056640625, -0.05524635314941406, -0.053104400634765625, -0.05096244812011719, -0.04882049560546875, -0.04667854309082031, -0.044536590576171875, -0.04239463806152344, -0.040252685546875, -0.03811073303222656, -0.035968780517578125, -0.03382682800292969, -0.03168487548828125, -0.029542922973632812, -0.027400970458984375, -0.025259017944335938, -0.0231170654296875, -0.020975112915039062, -0.018833160400390625, -0.016691207885742188, -0.01454925537109375, -0.012407302856445312, -0.010265350341796875, -0.008123397827148438, -0.0059814453125, -0.0038394927978515625, -0.001697540283203125, 0.0004444122314453125, 0.00258636474609375, 0.0047283172607421875, 0.006870269775390625, 0.009012222290039062, 0.0111541748046875, 0.013296127319335938, 0.015438079833984375, 0.017580032348632812, 0.01972198486328125, 0.021863937377929688, 0.024005889892578125, 0.026147842407226562, 0.028289794921875, 0.030431747436523438, 0.032573699951171875, 0.03471565246582031, 0.03685760498046875, 0.03899955749511719, 0.041141510009765625, 0.04328346252441406, 0.0454254150390625, 0.04756736755371094, 0.049709320068359375, 0.05185127258300781, 0.05399322509765625, 0.05613517761230469, 0.058277130126953125, 0.06041908264160156, 0.06256103515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 12.0, 21.0, 22.0, 21.0, 32.0, 56.0, 74.0, 79.0, 79.0, 70.0, 78.0, 76.0, 73.0, 60.0, 57.0, 35.0, 32.0, 23.0, 20.0, 14.0, 12.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020233154296875, -0.01952052116394043, -0.01880788803100586, -0.01809525489807129, -0.01738262176513672, -0.01666998863220215, -0.015957355499267578, -0.015244722366333008, -0.014532089233398438, -0.013819456100463867, -0.013106822967529297, -0.012394189834594727, -0.011681556701660156, -0.010968923568725586, -0.010256290435791016, -0.009543657302856445, -0.008831024169921875, -0.008118391036987305, -0.007405757904052734, -0.006693124771118164, -0.005980491638183594, -0.0052678585052490234, -0.004555225372314453, -0.003842592239379883, -0.0031299591064453125, -0.002417325973510742, -0.0017046928405761719, -0.0009920597076416016, -0.00027942657470703125, 0.00043320655822753906, 0.0011458396911621094, 0.0018584728240966797, 0.00257110595703125, 0.0032837390899658203, 0.003996372222900391, 0.004709005355834961, 0.005421638488769531, 0.0061342716217041016, 0.006846904754638672, 0.007559537887573242, 0.008272171020507812, 0.008984804153442383, 0.009697437286376953, 0.010410070419311523, 0.011122703552246094, 0.011835336685180664, 0.012547969818115234, 0.013260602951049805, 0.013973236083984375, 0.014685869216918945, 0.015398502349853516, 0.016111135482788086, 0.016823768615722656, 0.017536401748657227, 0.018249034881591797, 0.018961668014526367, 0.019674301147460938, 0.020386934280395508, 0.021099567413330078, 0.02181220054626465, 0.02252483367919922, 0.02323746681213379, 0.02395009994506836, 0.02466273307800293, 0.0253753662109375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 11.0, 16.0, 8.0, 19.0, 16.0, 27.0, 45.0, 48.0, 55.0, 71.0, 65.0, 71.0, 84.0, 83.0, 81.0, 66.0, 47.0, 29.0, 31.0, 23.0, 19.0, 22.0, 12.0, 9.0, 14.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.85531759262085, -6.689630031585693, -6.523942470550537, -6.358254432678223, -6.192566871643066, -6.02687931060791, -5.861191749572754, -5.695504188537598, -5.529816627502441, -5.364129066467285, -5.198441505432129, -5.0327534675598145, -4.867065906524658, -4.701378345489502, -4.535690784454346, -4.3700032234191895, -4.204315185546875, -4.038627624511719, -3.8729398250579834, -3.707252264022827, -3.541564464569092, -3.3758769035339355, -3.2101893424987793, -3.044501781463623, -2.8788139820098877, -2.7131264209747314, -2.547438621520996, -2.38175106048584, -2.2160634994506836, -2.0503756999969482, -1.884688138961792, -1.7190004587173462, -1.5533127784729004, -1.3876250982284546, -1.2219374179840088, -1.0562498569488525, -0.8905621767044067, -0.7248744964599609, -0.5591868758201599, -0.3934992551803589, -0.22781157493591309, -0.06212392449378967, 0.10356372594833374, 0.26925137639045715, 0.43493902683258057, 0.6006267070770264, 0.7663143277168274, 0.9320019483566284, 1.0976896286010742, 1.26337730884552, 1.4290649890899658, 1.594752550125122, 1.7604402303695679, 1.9261279106140137, 2.09181547164917, 2.257503032684326, 2.4231908321380615, 2.5888783931732178, 2.754566192626953, 2.9202537536621094, 3.0859413146972656, 3.251629114151001, 3.4173166751861572, 3.5830044746398926, 3.748692035675049]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 9.0, 6.0, 10.0, 16.0, 16.0, 20.0, 18.0, 18.0, 18.0, 27.0, 26.0, 36.0, 33.0, 35.0, 39.0, 46.0, 45.0, 29.0, 42.0, 45.0, 35.0, 40.0, 36.0, 28.0, 32.0, 22.0, 30.0, 22.0, 22.0, 22.0, 26.0, 21.0, 14.0, 15.0, 18.0, 10.0, 13.0, 6.0, 7.0, 5.0, 8.0, 2.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8758937120437622, -1.8173400163650513, -1.7587863206863403, -1.7002326250076294, -1.6416789293289185, -1.5831252336502075, -1.524571418762207, -1.466017723083496, -1.4074640274047852, -1.3489103317260742, -1.2903566360473633, -1.2318029403686523, -1.1732492446899414, -1.1146955490112305, -1.0561418533325195, -0.9975880980491638, -0.9390344619750977, -0.8804807662963867, -0.8219270706176758, -0.7633733749389648, -0.7048196792602539, -0.646265983581543, -0.5877122282981873, -0.5291585326194763, -0.4706048369407654, -0.41205114126205444, -0.3534974455833435, -0.2949437201023102, -0.23639002442359924, -0.1778363287448883, -0.11928260326385498, -0.06072890758514404, -0.0021750926971435547, 0.05637861043214798, 0.11493231356143951, 0.17348602414131165, 0.23203971982002258, 0.2905934154987335, 0.34914714097976685, 0.4077008366584778, 0.4662545323371887, 0.5248082280158997, 0.5833619236946106, 0.6419156789779663, 0.7004693746566772, 0.7590230703353882, 0.8175767660140991, 0.8761304616928101, 0.934684157371521, 0.9932378530502319, 1.0517915487289429, 1.1103452444076538, 1.1688989400863647, 1.2274526357650757, 1.2860064506530762, 1.344560146331787, 1.403113842010498, 1.461667537689209, 1.52022123336792, 1.5787749290466309, 1.6373286247253418, 1.6958823204040527, 1.7544360160827637, 1.8129897117614746, 1.8715434074401855]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 16.0, 23.0, 29.0, 52.0, 57.0, 75.0, 154.0, 233.0, 299.0, 463.0, 734.0, 1185.0, 1680.0, 2687.0, 4302.0, 6911.0, 10312.0, 16105.0, 24830.0, 37831.0, 55167.0, 77715.0, 102431.0, 123341.0, 131028.0, 120995.0, 99998.0, 75064.0, 52509.0, 35529.0, 23661.0, 15383.0, 9850.0, 6387.0, 4089.0, 2581.0, 1668.0, 1122.0, 721.0, 458.0, 312.0, 194.0, 120.0, 84.0, 55.0, 41.0, 26.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-2.22265625, -2.15618896484375, -2.0897216796875, -2.02325439453125, -1.956787109375, -1.89031982421875, -1.8238525390625, -1.75738525390625, -1.69091796875, -1.62445068359375, -1.5579833984375, -1.49151611328125, -1.425048828125, -1.35858154296875, -1.2921142578125, -1.22564697265625, -1.1591796875, -1.09271240234375, -1.0262451171875, -0.95977783203125, -0.893310546875, -0.82684326171875, -0.7603759765625, -0.69390869140625, -0.62744140625, -0.56097412109375, -0.4945068359375, -0.42803955078125, -0.361572265625, -0.29510498046875, -0.2286376953125, -0.16217041015625, -0.095703125, -0.02923583984375, 0.0372314453125, 0.10369873046875, 0.170166015625, 0.23663330078125, 0.3031005859375, 0.36956787109375, 0.43603515625, 0.50250244140625, 0.5689697265625, 0.63543701171875, 0.701904296875, 0.76837158203125, 0.8348388671875, 0.90130615234375, 0.9677734375, 1.03424072265625, 1.1007080078125, 1.16717529296875, 1.233642578125, 1.30010986328125, 1.3665771484375, 1.43304443359375, 1.49951171875, 1.56597900390625, 1.6324462890625, 1.69891357421875, 1.765380859375, 1.83184814453125, 1.8983154296875, 1.96478271484375, 2.03125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 6.0, 11.0, 20.0, 19.0, 21.0, 29.0, 31.0, 33.0, 31.0, 41.0, 42.0, 47.0, 39.0, 46.0, 38.0, 48.0, 53.0, 33.0, 44.0, 39.0, 34.0, 37.0, 30.0, 29.0, 22.0, 24.0, 20.0, 27.0, 10.0, 8.0, 13.0, 10.0, 10.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.3851318359375, -2.307373046875, -2.2296142578125, -2.15185546875, -2.0740966796875, -1.996337890625, -1.9185791015625, -1.8408203125, -1.7630615234375, -1.685302734375, -1.6075439453125, -1.52978515625, -1.4520263671875, -1.374267578125, -1.2965087890625, -1.21875, -1.1409912109375, -1.063232421875, -0.9854736328125, -0.90771484375, -0.8299560546875, -0.752197265625, -0.6744384765625, -0.5966796875, -0.5189208984375, -0.441162109375, -0.3634033203125, -0.28564453125, -0.2078857421875, -0.130126953125, -0.0523681640625, 0.025390625, 0.1031494140625, 0.180908203125, 0.2586669921875, 0.33642578125, 0.4141845703125, 0.491943359375, 0.5697021484375, 0.6474609375, 0.7252197265625, 0.802978515625, 0.8807373046875, 0.95849609375, 1.0362548828125, 1.114013671875, 1.1917724609375, 1.26953125, 1.3472900390625, 1.425048828125, 1.5028076171875, 1.58056640625, 1.6583251953125, 1.736083984375, 1.8138427734375, 1.8916015625, 1.9693603515625, 2.047119140625, 2.1248779296875, 2.20263671875, 2.2803955078125, 2.358154296875, 2.4359130859375, 2.513671875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 9.0, 11.0, 16.0, 22.0, 26.0, 56.0, 73.0, 121.0, 157.0, 250.0, 365.0, 621.0, 908.0, 1485.0, 2326.0, 3771.0, 6130.0, 10011.0, 16425.0, 26272.0, 42704.0, 65500.0, 95190.0, 125552.0, 144413.0, 141825.0, 118613.0, 87730.0, 58910.0, 37881.0, 23420.0, 14468.0, 8731.0, 5496.0, 3274.0, 2123.0, 1328.0, 848.0, 496.0, 368.0, 226.0, 143.0, 85.0, 66.0, 34.0, 27.0, 21.0, 13.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.4375, -2.358551025390625, -2.27960205078125, -2.200653076171875, -2.1217041015625, -2.042755126953125, -1.96380615234375, -1.884857177734375, -1.805908203125, -1.726959228515625, -1.64801025390625, -1.569061279296875, -1.4901123046875, -1.411163330078125, -1.33221435546875, -1.253265380859375, -1.17431640625, -1.095367431640625, -1.01641845703125, -0.937469482421875, -0.8585205078125, -0.779571533203125, -0.70062255859375, -0.621673583984375, -0.542724609375, -0.463775634765625, -0.38482666015625, -0.305877685546875, -0.2269287109375, -0.147979736328125, -0.06903076171875, 0.009918212890625, 0.0888671875, 0.167816162109375, 0.24676513671875, 0.325714111328125, 0.4046630859375, 0.483612060546875, 0.56256103515625, 0.641510009765625, 0.720458984375, 0.799407958984375, 0.87835693359375, 0.957305908203125, 1.0362548828125, 1.115203857421875, 1.19415283203125, 1.273101806640625, 1.35205078125, 1.430999755859375, 1.50994873046875, 1.588897705078125, 1.6678466796875, 1.746795654296875, 1.82574462890625, 1.904693603515625, 1.983642578125, 2.062591552734375, 2.14154052734375, 2.220489501953125, 2.2994384765625, 2.378387451171875, 2.45733642578125, 2.536285400390625, 2.615234375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 11.0, 10.0, 5.0, 7.0, 13.0, 12.0, 15.0, 22.0, 17.0, 20.0, 30.0, 25.0, 23.0, 37.0, 40.0, 32.0, 37.0, 28.0, 38.0, 35.0, 30.0, 39.0, 39.0, 36.0, 36.0, 31.0, 31.0, 23.0, 16.0, 34.0, 25.0, 20.0, 22.0, 14.0, 18.0, 16.0, 12.0, 11.0, 15.0, 7.0, 8.0, 6.0, 4.0, 9.0, 6.0, 0.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-1.3134765625, -1.274261474609375, -1.23504638671875, -1.195831298828125, -1.1566162109375, -1.117401123046875, -1.07818603515625, -1.038970947265625, -0.999755859375, -0.960540771484375, -0.92132568359375, -0.882110595703125, -0.8428955078125, -0.803680419921875, -0.76446533203125, -0.725250244140625, -0.68603515625, -0.646820068359375, -0.60760498046875, -0.568389892578125, -0.5291748046875, -0.489959716796875, -0.45074462890625, -0.411529541015625, -0.372314453125, -0.333099365234375, -0.29388427734375, -0.254669189453125, -0.2154541015625, -0.176239013671875, -0.13702392578125, -0.097808837890625, -0.05859375, -0.019378662109375, 0.01983642578125, 0.059051513671875, 0.0982666015625, 0.137481689453125, 0.17669677734375, 0.215911865234375, 0.255126953125, 0.294342041015625, 0.33355712890625, 0.372772216796875, 0.4119873046875, 0.451202392578125, 0.49041748046875, 0.529632568359375, 0.56884765625, 0.608062744140625, 0.64727783203125, 0.686492919921875, 0.7257080078125, 0.764923095703125, 0.80413818359375, 0.843353271484375, 0.882568359375, 0.921783447265625, 0.96099853515625, 1.000213623046875, 1.0394287109375, 1.078643798828125, 1.11785888671875, 1.157073974609375, 1.1962890625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 15.0, 29.0, 29.0, 40.0, 68.0, 96.0, 153.0, 235.0, 319.0, 577.0, 766.0, 1248.0, 1835.0, 2983.0, 4741.0, 7500.0, 12007.0, 19857.0, 33435.0, 55280.0, 89246.0, 133294.0, 168881.0, 167382.0, 128911.0, 85325.0, 52502.0, 31508.0, 18947.0, 11711.0, 7032.0, 4514.0, 2878.0, 1771.0, 1191.0, 783.0, 499.0, 297.0, 216.0, 148.0, 93.0, 69.0, 52.0, 25.0, 13.0, 13.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.3737030029296875, -1.324554443359375, -1.2754058837890625, -1.22625732421875, -1.1771087646484375, -1.127960205078125, -1.0788116455078125, -1.0296630859375, -0.9805145263671875, -0.931365966796875, -0.8822174072265625, -0.83306884765625, -0.7839202880859375, -0.734771728515625, -0.6856231689453125, -0.636474609375, -0.5873260498046875, -0.538177490234375, -0.4890289306640625, -0.43988037109375, -0.3907318115234375, -0.341583251953125, -0.2924346923828125, -0.2432861328125, -0.1941375732421875, -0.144989013671875, -0.0958404541015625, -0.04669189453125, 0.0024566650390625, 0.051605224609375, 0.1007537841796875, 0.14990234375, 0.1990509033203125, 0.248199462890625, 0.2973480224609375, 0.34649658203125, 0.3956451416015625, 0.444793701171875, 0.4939422607421875, 0.5430908203125, 0.5922393798828125, 0.641387939453125, 0.6905364990234375, 0.73968505859375, 0.7888336181640625, 0.837982177734375, 0.8871307373046875, 0.936279296875, 0.9854278564453125, 1.034576416015625, 1.0837249755859375, 1.13287353515625, 1.1820220947265625, 1.231170654296875, 1.2803192138671875, 1.3294677734375, 1.3786163330078125, 1.427764892578125, 1.4769134521484375, 1.52606201171875, 1.5752105712890625, 1.624359130859375, 1.6735076904296875, 1.72265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 6.0, 14.0, 11.0, 9.0, 20.0, 27.0, 26.0, 31.0, 42.0, 63.0, 50.0, 52.0, 61.0, 77.0, 64.0, 56.0, 52.0, 56.0, 42.0, 43.0, 39.0, 24.0, 20.0, 16.0, 20.0, 15.0, 11.0, 11.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019168853759765625, -0.0001863911747932434, -0.00018109381198883057, -0.00017579644918441772, -0.00017049908638000488, -0.00016520172357559204, -0.0001599043607711792, -0.00015460699796676636, -0.00014930963516235352, -0.00014401227235794067, -0.00013871490955352783, -0.000133417546749115, -0.00012812018394470215, -0.0001228228211402893, -0.00011752545833587646, -0.00011222809553146362, -0.00010693073272705078, -0.00010163336992263794, -9.63360071182251e-05, -9.103864431381226e-05, -8.574128150939941e-05, -8.044391870498657e-05, -7.514655590057373e-05, -6.984919309616089e-05, -6.455183029174805e-05, -5.9254467487335205e-05, -5.395710468292236e-05, -4.865974187850952e-05, -4.336237907409668e-05, -3.806501626968384e-05, -3.2767653465270996e-05, -2.7470290660858154e-05, -2.2172927856445312e-05, -1.687556505203247e-05, -1.1578202247619629e-05, -6.280839443206787e-06, -9.834766387939453e-07, 4.3138861656188965e-06, 9.611248970031738e-06, 1.490861177444458e-05, 2.0205974578857422e-05, 2.5503337383270264e-05, 3.0800700187683105e-05, 3.609806299209595e-05, 4.139542579650879e-05, 4.669278860092163e-05, 5.199015140533447e-05, 5.7287514209747314e-05, 6.258487701416016e-05, 6.7882239818573e-05, 7.317960262298584e-05, 7.847696542739868e-05, 8.377432823181152e-05, 8.907169103622437e-05, 9.436905384063721e-05, 9.966641664505005e-05, 0.00010496377944946289, 0.00011026114225387573, 0.00011555850505828857, 0.00012085586786270142, 0.00012615323066711426, 0.0001314505934715271, 0.00013674795627593994, 0.00014204531908035278, 0.00014734268188476562]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 3.0, 8.0, 9.0, 14.0, 34.0, 32.0, 45.0, 69.0, 93.0, 172.0, 243.0, 457.0, 735.0, 1195.0, 2130.0, 3774.0, 6844.0, 12355.0, 22021.0, 39530.0, 68820.0, 112243.0, 162020.0, 184841.0, 161134.0, 112501.0, 68200.0, 39165.0, 21908.0, 12127.0, 6843.0, 3727.0, 2162.0, 1235.0, 689.0, 452.0, 278.0, 164.0, 108.0, 53.0, 30.0, 35.0, 18.0, 16.0, 11.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.609375, -1.5613250732421875, -1.513275146484375, -1.4652252197265625, -1.41717529296875, -1.3691253662109375, -1.321075439453125, -1.2730255126953125, -1.2249755859375, -1.1769256591796875, -1.128875732421875, -1.0808258056640625, -1.03277587890625, -0.9847259521484375, -0.936676025390625, -0.8886260986328125, -0.840576171875, -0.7925262451171875, -0.744476318359375, -0.6964263916015625, -0.64837646484375, -0.6003265380859375, -0.552276611328125, -0.5042266845703125, -0.4561767578125, -0.4081268310546875, -0.360076904296875, -0.3120269775390625, -0.26397705078125, -0.2159271240234375, -0.167877197265625, -0.1198272705078125, -0.07177734375, -0.0237274169921875, 0.024322509765625, 0.0723724365234375, 0.12042236328125, 0.1684722900390625, 0.216522216796875, 0.2645721435546875, 0.3126220703125, 0.3606719970703125, 0.408721923828125, 0.4567718505859375, 0.50482177734375, 0.5528717041015625, 0.600921630859375, 0.6489715576171875, 0.697021484375, 0.7450714111328125, 0.793121337890625, 0.8411712646484375, 0.88922119140625, 0.9372711181640625, 0.985321044921875, 1.0333709716796875, 1.0814208984375, 1.1294708251953125, 1.177520751953125, 1.2255706787109375, 1.27362060546875, 1.3216705322265625, 1.369720458984375, 1.4177703857421875, 1.4658203125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 12.0, 15.0, 21.0, 28.0, 23.0, 30.0, 50.0, 50.0, 72.0, 59.0, 71.0, 71.0, 74.0, 59.0, 55.0, 45.0, 64.0, 46.0, 42.0, 31.0, 24.0, 18.0, 10.0, 3.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5576171875, -0.5405807495117188, -0.5235443115234375, -0.5065078735351562, -0.489471435546875, -0.47243499755859375, -0.4553985595703125, -0.43836212158203125, -0.42132568359375, -0.40428924560546875, -0.3872528076171875, -0.37021636962890625, -0.353179931640625, -0.33614349365234375, -0.3191070556640625, -0.30207061767578125, -0.2850341796875, -0.26799774169921875, -0.2509613037109375, -0.23392486572265625, -0.216888427734375, -0.19985198974609375, -0.1828155517578125, -0.16577911376953125, -0.14874267578125, -0.13170623779296875, -0.1146697998046875, -0.09763336181640625, -0.080596923828125, -0.06356048583984375, -0.0465240478515625, -0.02948760986328125, -0.012451171875, 0.00458526611328125, 0.0216217041015625, 0.03865814208984375, 0.055694580078125, 0.07273101806640625, 0.0897674560546875, 0.10680389404296875, 0.12384033203125, 0.14087677001953125, 0.1579132080078125, 0.17494964599609375, 0.191986083984375, 0.20902252197265625, 0.2260589599609375, 0.24309539794921875, 0.2601318359375, 0.27716827392578125, 0.2942047119140625, 0.31124114990234375, 0.328277587890625, 0.34531402587890625, 0.3623504638671875, 0.37938690185546875, 0.39642333984375, 0.41345977783203125, 0.4304962158203125, 0.44753265380859375, 0.464569091796875, 0.48160552978515625, 0.4986419677734375, 0.5156784057617188, 0.53271484375]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 13.0, 11.0, 11.0, 18.0, 21.0, 24.0, 26.0, 41.0, 40.0, 61.0, 62.0, 75.0, 79.0, 75.0, 82.0, 49.0, 76.0, 41.0, 48.0, 19.0, 24.0, 20.0, 22.0, 14.0, 16.0, 14.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.6054840087890625, -6.44195032119751, -6.278416633605957, -6.1148834228515625, -5.95134973526001, -5.787816047668457, -5.624282360076904, -5.460748672485352, -5.297215461730957, -5.133681774139404, -4.970148086547852, -4.806614875793457, -4.643081188201904, -4.479547500610352, -4.316013813018799, -4.152480125427246, -3.9889466762542725, -3.8254129886627197, -3.661879539489746, -3.4983458518981934, -3.3348124027252197, -3.171278715133667, -3.0077452659606934, -2.8442115783691406, -2.680677890777588, -2.517144203186035, -2.3536107540130615, -2.190077066421509, -2.026543617248535, -1.8630099296569824, -1.6994763612747192, -1.535942792892456, -1.3724095821380615, -1.2088760137557983, -1.0453424453735352, -0.8818088173866272, -0.718275249004364, -0.5547416806221008, -0.39120805263519287, -0.2276744842529297, -0.0641409158706665, 0.09939266741275787, 0.26292625069618225, 0.4264598488807678, 0.589993417263031, 0.7535269856452942, 0.9170606136322021, 1.0805941820144653, 1.2441277503967285, 1.4076613187789917, 1.5711948871612549, 1.7347285747528076, 1.8982620239257812, 2.061795711517334, 2.2253293991088867, 2.3888628482818604, 2.552396297454834, 2.7159299850463867, 2.8794634342193604, 3.042997121810913, 3.2065305709838867, 3.3700642585754395, 3.533597946166992, 3.697131395339966, 3.8606650829315186]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 2.0, 7.0, 12.0, 16.0, 11.0, 17.0, 17.0, 16.0, 26.0, 24.0, 19.0, 20.0, 30.0, 33.0, 19.0, 29.0, 35.0, 33.0, 32.0, 49.0, 39.0, 36.0, 35.0, 35.0, 39.0, 27.0, 34.0, 24.0, 17.0, 32.0, 21.0, 25.0, 21.0, 23.0, 13.0, 19.0, 14.0, 18.0, 14.0, 5.0, 10.0, 7.0, 10.0, 6.0, 2.0, 8.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.917460560798645, -1.8577678203582764, -1.7980751991271973, -1.7383824586868286, -1.67868971824646, -1.6189970970153809, -1.5593043565750122, -1.4996116161346436, -1.4399189949035645, -1.3802262544631958, -1.3205336332321167, -1.260840892791748, -1.2011481523513794, -1.1414554119110107, -1.0817627906799316, -1.022070050239563, -0.9623773097991943, -0.9026846289634705, -0.8429918885231018, -0.7832992076873779, -0.7236064672470093, -0.6639137864112854, -0.6042211055755615, -0.5445283651351929, -0.484835684299469, -0.42514297366142273, -0.36545026302337646, -0.3057575821876526, -0.24606487154960632, -0.18637216091156006, -0.12667948007583618, -0.06698676943778992, -0.007294178009033203, 0.052398525178432465, 0.11209122836589813, 0.1717839241027832, 0.23147663474082947, 0.29116934537887573, 0.3508620262145996, 0.4105547368526459, 0.47024744749069214, 0.529940128326416, 0.5896328687667847, 0.6493255496025085, 0.7090182304382324, 0.7687109708786011, 0.828403651714325, 0.8880963325500488, 0.9477890729904175, 1.0074818134307861, 1.0671744346618652, 1.1268671751022339, 1.1865599155426025, 1.2462525367736816, 1.3059452772140503, 1.365638017654419, 1.425330638885498, 1.4850233793258667, 1.5447160005569458, 1.6044087409973145, 1.664101481437683, 1.7237942218780518, 1.7834868431091309, 1.8431795835494995, 1.9028723239898682]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 8.0, 15.0, 26.0, 44.0, 60.0, 100.0, 166.0, 224.0, 320.0, 479.0, 768.0, 1343.0, 2017.0, 3275.0, 5534.0, 9909.0, 17397.0, 32985.0, 65687.0, 141046.0, 332614.0, 793353.0, 1249471.0, 856099.0, 369269.0, 158618.0, 73510.0, 36634.0, 19020.0, 10270.0, 5696.0, 3384.0, 1934.0, 1102.0, 692.0, 422.0, 281.0, 169.0, 113.0, 72.0, 44.0, 21.0, 27.0, 10.0, 12.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.41015625, -4.26092529296875, -4.1116943359375, -3.96246337890625, -3.813232421875, -3.66400146484375, -3.5147705078125, -3.36553955078125, -3.21630859375, -3.06707763671875, -2.9178466796875, -2.76861572265625, -2.619384765625, -2.47015380859375, -2.3209228515625, -2.17169189453125, -2.0224609375, -1.87322998046875, -1.7239990234375, -1.57476806640625, -1.425537109375, -1.27630615234375, -1.1270751953125, -0.97784423828125, -0.82861328125, -0.67938232421875, -0.5301513671875, -0.38092041015625, -0.231689453125, -0.08245849609375, 0.0667724609375, 0.21600341796875, 0.365234375, 0.51446533203125, 0.6636962890625, 0.81292724609375, 0.962158203125, 1.11138916015625, 1.2606201171875, 1.40985107421875, 1.55908203125, 1.70831298828125, 1.8575439453125, 2.00677490234375, 2.156005859375, 2.30523681640625, 2.4544677734375, 2.60369873046875, 2.7529296875, 2.90216064453125, 3.0513916015625, 3.20062255859375, 3.349853515625, 3.49908447265625, 3.6483154296875, 3.79754638671875, 3.94677734375, 4.09600830078125, 4.2452392578125, 4.39447021484375, 4.543701171875, 4.69293212890625, 4.8421630859375, 4.99139404296875, 5.140625]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 7.0, 18.0, 20.0, 22.0, 21.0, 18.0, 25.0, 18.0, 24.0, 28.0, 44.0, 31.0, 35.0, 38.0, 37.0, 26.0, 36.0, 35.0, 42.0, 32.0, 36.0, 33.0, 37.0, 28.0, 24.0, 37.0, 29.0, 15.0, 28.0, 27.0, 15.0, 14.0, 18.0, 14.0, 9.0, 4.0, 15.0, 6.0, 8.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7802734375, -1.7282562255859375, -1.676239013671875, -1.6242218017578125, -1.57220458984375, -1.5201873779296875, -1.468170166015625, -1.4161529541015625, -1.3641357421875, -1.3121185302734375, -1.260101318359375, -1.2080841064453125, -1.15606689453125, -1.1040496826171875, -1.052032470703125, -1.0000152587890625, -0.947998046875, -0.8959808349609375, -0.843963623046875, -0.7919464111328125, -0.73992919921875, -0.6879119873046875, -0.635894775390625, -0.5838775634765625, -0.5318603515625, -0.4798431396484375, -0.427825927734375, -0.3758087158203125, -0.32379150390625, -0.2717742919921875, -0.219757080078125, -0.1677398681640625, -0.11572265625, -0.0637054443359375, -0.011688232421875, 0.0403289794921875, 0.09234619140625, 0.1443634033203125, 0.196380615234375, 0.2483978271484375, 0.3004150390625, 0.3524322509765625, 0.404449462890625, 0.4564666748046875, 0.50848388671875, 0.5605010986328125, 0.612518310546875, 0.6645355224609375, 0.716552734375, 0.7685699462890625, 0.820587158203125, 0.8726043701171875, 0.92462158203125, 0.9766387939453125, 1.028656005859375, 1.0806732177734375, 1.1326904296875, 1.1847076416015625, 1.236724853515625, 1.2887420654296875, 1.34075927734375, 1.3927764892578125, 1.444793701171875, 1.4968109130859375, 1.548828125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 3.0, 11.0, 19.0, 26.0, 35.0, 63.0, 93.0, 155.0, 196.0, 322.0, 534.0, 826.0, 1419.0, 2301.0, 4004.0, 6839.0, 12235.0, 22022.0, 40720.0, 78965.0, 152623.0, 302319.0, 587283.0, 952865.0, 915299.0, 540664.0, 275901.0, 138908.0, 72020.0, 37760.0, 20745.0, 11339.0, 6498.0, 3679.0, 2098.0, 1331.0, 795.0, 512.0, 324.0, 207.0, 118.0, 69.0, 50.0, 34.0, 16.0, 16.0, 8.0, 8.0, 1.0, 2.0, 3.0], "bins": [-5.29296875, -5.149658203125, -5.00634765625, -4.863037109375, -4.7197265625, -4.576416015625, -4.43310546875, -4.289794921875, -4.146484375, -4.003173828125, -3.85986328125, -3.716552734375, -3.5732421875, -3.429931640625, -3.28662109375, -3.143310546875, -3.0, -2.856689453125, -2.71337890625, -2.570068359375, -2.4267578125, -2.283447265625, -2.14013671875, -1.996826171875, -1.853515625, -1.710205078125, -1.56689453125, -1.423583984375, -1.2802734375, -1.136962890625, -0.99365234375, -0.850341796875, -0.70703125, -0.563720703125, -0.42041015625, -0.277099609375, -0.1337890625, 0.009521484375, 0.15283203125, 0.296142578125, 0.439453125, 0.582763671875, 0.72607421875, 0.869384765625, 1.0126953125, 1.156005859375, 1.29931640625, 1.442626953125, 1.5859375, 1.729248046875, 1.87255859375, 2.015869140625, 2.1591796875, 2.302490234375, 2.44580078125, 2.589111328125, 2.732421875, 2.875732421875, 3.01904296875, 3.162353515625, 3.3056640625, 3.448974609375, 3.59228515625, 3.735595703125, 3.87890625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 12.0, 14.0, 20.0, 27.0, 35.0, 52.0, 52.0, 70.0, 92.0, 112.0, 122.0, 153.0, 190.0, 215.0, 242.0, 252.0, 278.0, 304.0, 265.0, 256.0, 234.0, 176.0, 178.0, 144.0, 101.0, 98.0, 87.0, 66.0, 40.0, 48.0, 40.0, 20.0, 15.0, 16.0, 7.0, 6.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.86334228515625, -0.8243408203125, -0.78533935546875, -0.746337890625, -0.70733642578125, -0.6683349609375, -0.62933349609375, -0.59033203125, -0.55133056640625, -0.5123291015625, -0.47332763671875, -0.434326171875, -0.39532470703125, -0.3563232421875, -0.31732177734375, -0.2783203125, -0.23931884765625, -0.2003173828125, -0.16131591796875, -0.122314453125, -0.08331298828125, -0.0443115234375, -0.00531005859375, 0.03369140625, 0.07269287109375, 0.1116943359375, 0.15069580078125, 0.189697265625, 0.22869873046875, 0.2677001953125, 0.30670166015625, 0.345703125, 0.38470458984375, 0.4237060546875, 0.46270751953125, 0.501708984375, 0.54071044921875, 0.5797119140625, 0.61871337890625, 0.65771484375, 0.69671630859375, 0.7357177734375, 0.77471923828125, 0.813720703125, 0.85272216796875, 0.8917236328125, 0.93072509765625, 0.9697265625, 1.00872802734375, 1.0477294921875, 1.08673095703125, 1.125732421875, 1.16473388671875, 1.2037353515625, 1.24273681640625, 1.28173828125, 1.32073974609375, 1.3597412109375, 1.39874267578125, 1.437744140625, 1.47674560546875, 1.5157470703125, 1.55474853515625, 1.59375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 17.0, 12.0, 19.0, 21.0, 23.0, 23.0, 33.0, 40.0, 46.0, 36.0, 49.0, 55.0, 60.0, 72.0, 52.0, 68.0, 42.0, 55.0, 42.0, 28.0, 33.0, 26.0, 22.0, 15.0, 21.0, 15.0, 10.0, 7.0, 11.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.709427356719971, -4.573078155517578, -4.4367289543151855, -4.300380229949951, -4.164031028747559, -4.027681827545166, -3.8913326263427734, -3.75498366355896, -3.6186347007751465, -3.482285499572754, -3.3459365367889404, -3.209587335586548, -3.0732383728027344, -2.936889171600342, -2.800539970397949, -2.6641910076141357, -2.527841806411743, -2.3914926052093506, -2.255143642425537, -2.1187944412231445, -1.982445478439331, -1.8460962772369385, -1.7097471952438354, -1.5733981132507324, -1.4370490312576294, -1.3006999492645264, -1.1643508672714233, -1.0280017852783203, -0.8916526436805725, -0.7553035616874695, -0.6189544200897217, -0.48260533809661865, -0.3462562561035156, -0.2099071592092514, -0.07355806231498718, 0.06279104948043823, 0.19914013147354126, 0.3354892134666443, 0.4718383550643921, 0.6081874370574951, 0.7445365190505981, 0.8808856010437012, 1.0172346830368042, 1.1535837650299072, 1.2899329662322998, 1.4262819290161133, 1.5626311302185059, 1.6989802122116089, 1.835329294204712, 1.971678376197815, 2.108027458190918, 2.2443766593933105, 2.380725622177124, 2.5170748233795166, 2.65342378616333, 2.7897729873657227, 2.9261221885681152, 3.062471389770508, 3.1988203525543213, 3.335169553756714, 3.4715185165405273, 3.60786771774292, 3.7442169189453125, 3.880565881729126, 4.0169148445129395]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 4.0, 10.0, 16.0, 20.0, 12.0, 18.0, 14.0, 22.0, 26.0, 18.0, 27.0, 35.0, 30.0, 45.0, 36.0, 41.0, 48.0, 44.0, 41.0, 48.0, 28.0, 39.0, 35.0, 27.0, 31.0, 27.0, 30.0, 29.0, 28.0, 31.0, 16.0, 19.0, 13.0, 10.0, 10.0, 17.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.2914984226226807, -2.2230279445648193, -2.154557704925537, -2.086087226867676, -2.0176169872283936, -1.9491465091705322, -1.8806761503219604, -1.8122057914733887, -1.7437353134155273, -1.6752649545669556, -1.6067945957183838, -1.5383241176605225, -1.4698537588119507, -1.401383399963379, -1.3329130411148071, -1.2644426822662354, -1.1959723234176636, -1.1275019645690918, -1.05903160572052, -0.9905611872673035, -0.9220907688140869, -0.8536204099655151, -0.7851500511169434, -0.7166796922683716, -0.648209273815155, -0.5797389149665833, -0.5112684965133667, -0.4427981376647949, -0.37432774901390076, -0.3058573603630066, -0.23738700151443481, -0.16891661286354065, -0.10044622421264648, -0.031975843012332916, 0.03649453818798065, 0.10496491193771362, 0.1734353005886078, 0.24190568923950195, 0.31037604808807373, 0.3788464367389679, 0.44731682538986206, 0.5157871842384338, 0.5842576026916504, 0.6527279615402222, 0.721198320388794, 0.7896687388420105, 0.8581390976905823, 0.9266095161437988, 0.9950798749923706, 1.0635502338409424, 1.1320205926895142, 1.200490951538086, 1.2689614295959473, 1.337431788444519, 1.4059021472930908, 1.4743725061416626, 1.5428428649902344, 1.6113132238388062, 1.679783582687378, 1.7482540607452393, 1.816724419593811, 1.8851947784423828, 1.9536651372909546, 2.0221354961395264, 2.0906059741973877]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 14.0, 8.0, 9.0, 19.0, 22.0, 41.0, 89.0, 108.0, 185.0, 356.0, 575.0, 941.0, 1618.0, 2973.0, 5166.0, 9340.0, 17459.0, 31990.0, 59581.0, 108846.0, 174694.0, 213955.0, 176805.0, 110523.0, 61422.0, 32451.0, 17742.0, 9366.0, 5227.0, 2963.0, 1671.0, 995.0, 552.0, 340.0, 205.0, 111.0, 74.0, 40.0, 32.0, 16.0, 11.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.3935546875, -0.38306427001953125, -0.3725738525390625, -0.36208343505859375, -0.351593017578125, -0.34110260009765625, -0.3306121826171875, -0.32012176513671875, -0.30963134765625, -0.29914093017578125, -0.2886505126953125, -0.27816009521484375, -0.267669677734375, -0.25717926025390625, -0.2466888427734375, -0.23619842529296875, -0.2257080078125, -0.21521759033203125, -0.2047271728515625, -0.19423675537109375, -0.183746337890625, -0.17325592041015625, -0.1627655029296875, -0.15227508544921875, -0.14178466796875, -0.13129425048828125, -0.1208038330078125, -0.11031341552734375, -0.099822998046875, -0.08933258056640625, -0.0788421630859375, -0.06835174560546875, -0.057861328125, -0.04737091064453125, -0.0368804931640625, -0.02639007568359375, -0.015899658203125, -0.00540924072265625, 0.0050811767578125, 0.01557159423828125, 0.02606201171875, 0.03655242919921875, 0.0470428466796875, 0.05753326416015625, 0.068023681640625, 0.07851409912109375, 0.0890045166015625, 0.09949493408203125, 0.1099853515625, 0.12047576904296875, 0.1309661865234375, 0.14145660400390625, 0.151947021484375, 0.16243743896484375, 0.1729278564453125, 0.18341827392578125, 0.19390869140625, 0.20439910888671875, 0.2148895263671875, 0.22537994384765625, 0.235870361328125, 0.24636077880859375, 0.2568511962890625, 0.26734161376953125, 0.27783203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 5.0, 7.0, 6.0, 13.0, 12.0, 11.0, 13.0, 19.0, 12.0, 25.0, 16.0, 22.0, 34.0, 34.0, 41.0, 45.0, 50.0, 29.0, 46.0, 34.0, 36.0, 29.0, 39.0, 32.0, 28.0, 30.0, 26.0, 33.0, 29.0, 26.0, 28.0, 39.0, 27.0, 20.0, 16.0, 19.0, 10.0, 9.0, 8.0, 9.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-2.609375, -2.532440185546875, -2.45550537109375, -2.378570556640625, -2.3016357421875, -2.224700927734375, -2.14776611328125, -2.070831298828125, -1.993896484375, -1.916961669921875, -1.84002685546875, -1.763092041015625, -1.6861572265625, -1.609222412109375, -1.53228759765625, -1.455352783203125, -1.37841796875, -1.301483154296875, -1.22454833984375, -1.147613525390625, -1.0706787109375, -0.993743896484375, -0.91680908203125, -0.839874267578125, -0.762939453125, -0.686004638671875, -0.60906982421875, -0.532135009765625, -0.4552001953125, -0.378265380859375, -0.30133056640625, -0.224395751953125, -0.1474609375, -0.070526123046875, 0.00640869140625, 0.083343505859375, 0.1602783203125, 0.237213134765625, 0.31414794921875, 0.391082763671875, 0.468017578125, 0.544952392578125, 0.62188720703125, 0.698822021484375, 0.7757568359375, 0.852691650390625, 0.92962646484375, 1.006561279296875, 1.08349609375, 1.160430908203125, 1.23736572265625, 1.314300537109375, 1.3912353515625, 1.468170166015625, 1.54510498046875, 1.622039794921875, 1.698974609375, 1.775909423828125, 1.85284423828125, 1.929779052734375, 2.0067138671875, 2.083648681640625, 2.16058349609375, 2.237518310546875, 2.314453125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 4.0, 11.0, 28.0, 13.0, 31.0, 39.0, 80.0, 98.0, 145.0, 261.0, 375.0, 625.0, 1033.0, 1892.0, 3760.0, 8173.0, 20007.0, 75853.0, 859439.0, 46672.0, 15879.0, 6871.0, 3249.0, 1599.0, 880.0, 563.0, 323.0, 209.0, 119.0, 90.0, 69.0, 41.0, 39.0, 31.0, 16.0, 9.0, 5.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2973480224609375, -1.261688232421875, -1.2260284423828125, -1.19036865234375, -1.1547088623046875, -1.119049072265625, -1.0833892822265625, -1.0477294921875, -1.0120697021484375, -0.976409912109375, -0.9407501220703125, -0.90509033203125, -0.8694305419921875, -0.833770751953125, -0.7981109619140625, -0.762451171875, -0.7267913818359375, -0.691131591796875, -0.6554718017578125, -0.61981201171875, -0.5841522216796875, -0.548492431640625, -0.5128326416015625, -0.4771728515625, -0.4415130615234375, -0.405853271484375, -0.3701934814453125, -0.33453369140625, -0.2988739013671875, -0.263214111328125, -0.2275543212890625, -0.19189453125, -0.1562347412109375, -0.120574951171875, -0.0849151611328125, -0.04925537109375, -0.0135955810546875, 0.022064208984375, 0.0577239990234375, 0.0933837890625, 0.1290435791015625, 0.164703369140625, 0.2003631591796875, 0.23602294921875, 0.2716827392578125, 0.307342529296875, 0.3430023193359375, 0.378662109375, 0.4143218994140625, 0.449981689453125, 0.4856414794921875, 0.52130126953125, 0.5569610595703125, 0.592620849609375, 0.6282806396484375, 0.6639404296875, 0.6996002197265625, 0.735260009765625, 0.7709197998046875, 0.80657958984375, 0.8422393798828125, 0.877899169921875, 0.9135589599609375, 0.94921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 8.0, 13.0, 12.0, 14.0, 17.0, 20.0, 20.0, 26.0, 25.0, 29.0, 30.0, 32.0, 30.0, 39.0, 31.0, 31.0, 38.0, 43.0, 33.0, 49.0, 38.0, 31.0, 28.0, 43.0, 26.0, 35.0, 35.0, 24.0, 36.0, 20.0, 19.0, 26.0, 18.0, 5.0, 10.0, 9.0, 14.0, 12.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6064453125, -1.558135986328125, -1.50982666015625, -1.461517333984375, -1.4132080078125, -1.364898681640625, -1.31658935546875, -1.268280029296875, -1.219970703125, -1.171661376953125, -1.12335205078125, -1.075042724609375, -1.0267333984375, -0.978424072265625, -0.93011474609375, -0.881805419921875, -0.83349609375, -0.785186767578125, -0.73687744140625, -0.688568115234375, -0.6402587890625, -0.591949462890625, -0.54364013671875, -0.495330810546875, -0.447021484375, -0.398712158203125, -0.35040283203125, -0.302093505859375, -0.2537841796875, -0.205474853515625, -0.15716552734375, -0.108856201171875, -0.060546875, -0.012237548828125, 0.03607177734375, 0.084381103515625, 0.1326904296875, 0.180999755859375, 0.22930908203125, 0.277618408203125, 0.325927734375, 0.374237060546875, 0.42254638671875, 0.470855712890625, 0.5191650390625, 0.567474365234375, 0.61578369140625, 0.664093017578125, 0.71240234375, 0.760711669921875, 0.80902099609375, 0.857330322265625, 0.9056396484375, 0.953948974609375, 1.00225830078125, 1.050567626953125, 1.098876953125, 1.147186279296875, 1.19549560546875, 1.243804931640625, 1.2921142578125, 1.340423583984375, 1.38873291015625, 1.437042236328125, 1.4853515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 9.0, 18.0, 14.0, 23.0, 39.0, 51.0, 76.0, 83.0, 137.0, 165.0, 300.0, 489.0, 799.0, 1275.0, 2336.0, 4387.0, 8698.0, 18496.0, 54712.0, 886998.0, 38410.0, 15121.0, 7190.0, 3663.0, 1967.0, 1105.0, 685.0, 432.0, 266.0, 179.0, 123.0, 70.0, 49.0, 40.0, 23.0, 20.0, 21.0, 13.0, 10.0, 8.0, 7.0, 8.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.275146484375, -0.2669029235839844, -0.25865936279296875, -0.2504158020019531, -0.2421722412109375, -0.23392868041992188, -0.22568511962890625, -0.21744155883789062, -0.209197998046875, -0.20095443725585938, -0.19271087646484375, -0.18446731567382812, -0.1762237548828125, -0.16798019409179688, -0.15973663330078125, -0.15149307250976562, -0.14324951171875, -0.13500595092773438, -0.12676239013671875, -0.11851882934570312, -0.1102752685546875, -0.10203170776367188, -0.09378814697265625, -0.08554458618164062, -0.077301025390625, -0.06905746459960938, -0.06081390380859375, -0.052570343017578125, -0.0443267822265625, -0.036083221435546875, -0.02783966064453125, -0.019596099853515625, -0.0113525390625, -0.003108978271484375, 0.00513458251953125, 0.013378143310546875, 0.0216217041015625, 0.029865264892578125, 0.03810882568359375, 0.046352386474609375, 0.054595947265625, 0.06283950805664062, 0.07108306884765625, 0.07932662963867188, 0.0875701904296875, 0.09581375122070312, 0.10405731201171875, 0.11230087280273438, 0.12054443359375, 0.12878799438476562, 0.13703155517578125, 0.14527511596679688, 0.1535186767578125, 0.16176223754882812, 0.17000579833984375, 0.17824935913085938, 0.186492919921875, 0.19473648071289062, 0.20298004150390625, 0.21122360229492188, 0.2194671630859375, 0.22771072387695312, 0.23595428466796875, 0.24419784545898438, 0.25244140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 8.0, 9.0, 10.0, 19.0, 21.0, 21.0, 34.0, 30.0, 41.0, 33.0, 52.0, 39.0, 53.0, 51.0, 63.0, 64.0, 57.0, 57.0, 38.0, 52.0, 36.0, 34.0, 29.0, 27.0, 24.0, 12.0, 18.0, 11.0, 10.0, 9.0, 10.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1961669921875e-05, -4.06922772526741e-05, -3.9422884583473206e-05, -3.815349191427231e-05, -3.688409924507141e-05, -3.5614706575870514e-05, -3.434531390666962e-05, -3.307592123746872e-05, -3.180652856826782e-05, -3.0537135899066925e-05, -2.9267743229866028e-05, -2.799835056066513e-05, -2.6728957891464233e-05, -2.5459565222263336e-05, -2.419017255306244e-05, -2.2920779883861542e-05, -2.1651387214660645e-05, -2.0381994545459747e-05, -1.911260187625885e-05, -1.7843209207057953e-05, -1.6573816537857056e-05, -1.530442386865616e-05, -1.4035031199455261e-05, -1.2765638530254364e-05, -1.1496245861053467e-05, -1.022685319185257e-05, -8.957460522651672e-06, -7.688067853450775e-06, -6.418675184249878e-06, -5.149282515048981e-06, -3.8798898458480835e-06, -2.6104971766471863e-06, -1.341104507446289e-06, -7.171183824539185e-08, 1.1976808309555054e-06, 2.4670735001564026e-06, 3.7364661693573e-06, 5.005858838558197e-06, 6.275251507759094e-06, 7.5446441769599915e-06, 8.814036846160889e-06, 1.0083429515361786e-05, 1.1352822184562683e-05, 1.262221485376358e-05, 1.3891607522964478e-05, 1.5161000192165375e-05, 1.6430392861366272e-05, 1.769978553056717e-05, 1.8969178199768066e-05, 2.0238570868968964e-05, 2.150796353816986e-05, 2.2777356207370758e-05, 2.4046748876571655e-05, 2.5316141545772552e-05, 2.658553421497345e-05, 2.7854926884174347e-05, 2.9124319553375244e-05, 3.039371222257614e-05, 3.166310489177704e-05, 3.2932497560977936e-05, 3.420189023017883e-05, 3.547128289937973e-05, 3.674067556858063e-05, 3.8010068237781525e-05, 3.927946090698242e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 6.0, 13.0, 13.0, 21.0, 22.0, 28.0, 41.0, 50.0, 69.0, 78.0, 142.0, 211.0, 273.0, 384.0, 579.0, 862.0, 1117.0, 1807.0, 2723.0, 4531.0, 7361.0, 12519.0, 22290.0, 39328.0, 70702.0, 123129.0, 189927.0, 208815.0, 151944.0, 90199.0, 50321.0, 28339.0, 15918.0, 9122.0, 5512.0, 3421.0, 2218.0, 1374.0, 921.0, 594.0, 413.0, 362.0, 223.0, 163.0, 139.0, 86.0, 77.0, 56.0, 32.0, 20.0, 19.0, 17.0, 12.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07623291015625, -0.0737905502319336, -0.07134819030761719, -0.06890583038330078, -0.06646347045898438, -0.06402111053466797, -0.06157875061035156, -0.059136390686035156, -0.05669403076171875, -0.054251670837402344, -0.05180931091308594, -0.04936695098876953, -0.046924591064453125, -0.04448223114013672, -0.04203987121582031, -0.039597511291503906, -0.0371551513671875, -0.034712791442871094, -0.03227043151855469, -0.02982807159423828, -0.027385711669921875, -0.02494335174560547, -0.022500991821289062, -0.020058631896972656, -0.01761627197265625, -0.015173912048339844, -0.012731552124023438, -0.010289192199707031, -0.007846832275390625, -0.005404472351074219, -0.0029621124267578125, -0.0005197525024414062, 0.001922607421875, 0.004364967346191406, 0.0068073272705078125, 0.009249687194824219, 0.011692047119140625, 0.014134407043457031, 0.016576766967773438, 0.019019126892089844, 0.02146148681640625, 0.023903846740722656, 0.026346206665039062, 0.02878856658935547, 0.031230926513671875, 0.03367328643798828, 0.03611564636230469, 0.038558006286621094, 0.0410003662109375, 0.043442726135253906, 0.04588508605957031, 0.04832744598388672, 0.050769805908203125, 0.05321216583251953, 0.05565452575683594, 0.058096885681152344, 0.06053924560546875, 0.06298160552978516, 0.06542396545410156, 0.06786632537841797, 0.07030868530273438, 0.07275104522705078, 0.07519340515136719, 0.0776357650756836, 0.080078125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 7.0, 6.0, 15.0, 15.0, 16.0, 26.0, 19.0, 32.0, 27.0, 48.0, 50.0, 50.0, 66.0, 68.0, 52.0, 75.0, 74.0, 57.0, 59.0, 47.0, 44.0, 29.0, 28.0, 21.0, 13.0, 16.0, 9.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0164947509765625, -0.015921354293823242, -0.015347957611083984, -0.014774560928344727, -0.014201164245605469, -0.013627767562866211, -0.013054370880126953, -0.012480974197387695, -0.011907577514648438, -0.01133418083190918, -0.010760784149169922, -0.010187387466430664, -0.009613990783691406, -0.009040594100952148, -0.00846719741821289, -0.007893800735473633, -0.007320404052734375, -0.006747007369995117, -0.006173610687255859, -0.0056002140045166016, -0.005026817321777344, -0.004453420639038086, -0.003880023956298828, -0.0033066272735595703, -0.0027332305908203125, -0.0021598339080810547, -0.0015864372253417969, -0.001013040542602539, -0.00043964385986328125, 0.00013375282287597656, 0.0007071495056152344, 0.0012805461883544922, 0.00185394287109375, 0.002427339553833008, 0.0030007362365722656, 0.0035741329193115234, 0.004147529602050781, 0.004720926284790039, 0.005294322967529297, 0.005867719650268555, 0.0064411163330078125, 0.00701451301574707, 0.007587909698486328, 0.008161306381225586, 0.008734703063964844, 0.009308099746704102, 0.00988149642944336, 0.010454893112182617, 0.011028289794921875, 0.011601686477661133, 0.01217508316040039, 0.012748479843139648, 0.013321876525878906, 0.013895273208618164, 0.014468669891357422, 0.01504206657409668, 0.015615463256835938, 0.016188859939575195, 0.016762256622314453, 0.01733565330505371, 0.01790904998779297, 0.018482446670532227, 0.019055843353271484, 0.019629240036010742, 0.02020263671875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 17.0, 11.0, 17.0, 23.0, 26.0, 23.0, 29.0, 37.0, 50.0, 36.0, 47.0, 51.0, 62.0, 77.0, 56.0, 62.0, 42.0, 47.0, 51.0, 29.0, 33.0, 24.0, 21.0, 19.0, 18.0, 16.0, 11.0, 5.0, 14.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.703352451324463, -4.567334175109863, -4.431316375732422, -4.295298099517822, -4.159279823303223, -4.023262023925781, -3.8872437477111816, -3.751225709915161, -3.6152076721191406, -3.47918963432312, -3.3431715965270996, -3.2071533203125, -3.0711352825164795, -2.935117244720459, -2.7990989685058594, -2.663080930709839, -2.5270628929138184, -2.391044855117798, -2.2550268173217773, -2.1190085411071777, -1.9829905033111572, -1.8469724655151367, -1.7109543085098267, -1.5749361515045166, -1.438918113708496, -1.3029000759124756, -1.1668819189071655, -1.0308637619018555, -0.894845724105835, -0.7588276267051697, -0.6228095293045044, -0.4867914319038391, -0.35077333450317383, -0.21475523710250854, -0.07873713970184326, 0.05728095769882202, 0.1932990550994873, 0.3293171525001526, 0.46533524990081787, 0.6013533473014832, 0.7373714447021484, 0.8733895421028137, 1.009407639503479, 1.145425796508789, 1.2814438343048096, 1.41746187210083, 1.5534800291061401, 1.6894981861114502, 1.8255162239074707, 1.9615342617034912, 2.0975522994995117, 2.2335705757141113, 2.369588613510132, 2.5056066513061523, 2.641624927520752, 2.7776429653167725, 2.913661003112793, 3.0496790409088135, 3.185697078704834, 3.3217153549194336, 3.457733392715454, 3.5937514305114746, 3.729769706726074, 3.8657877445220947, 4.001805782318115]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 1.0, 1.0, 10.0, 10.0, 2.0, 6.0, 21.0, 17.0, 14.0, 14.0, 19.0, 21.0, 24.0, 22.0, 23.0, 38.0, 30.0, 47.0, 35.0, 34.0, 49.0, 51.0, 42.0, 41.0, 31.0, 41.0, 34.0, 26.0, 31.0, 29.0, 31.0, 29.0, 27.0, 30.0, 18.0, 15.0, 15.0, 11.0, 8.0, 18.0, 13.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3029496669769287, -2.2345986366271973, -2.1662473678588867, -2.0978963375091553, -2.0295450687408447, -1.9611940383911133, -1.8928428888320923, -1.8244917392730713, -1.7561405897140503, -1.6877894401550293, -1.6194382905960083, -1.5510871410369873, -1.4827361106872559, -1.4143848419189453, -1.3460338115692139, -1.2776826620101929, -1.2093315124511719, -1.1409803628921509, -1.0726292133331299, -1.0042780637741089, -0.9359269738197327, -0.8675758242607117, -0.7992247343063354, -0.7308735847473145, -0.6625224351882935, -0.5941712856292725, -0.5258201360702515, -0.45746904611587524, -0.38911789655685425, -0.32076674699783325, -0.25241562724113464, -0.18406450748443604, -0.11571335792541504, -0.04736222326755524, 0.020988911390304565, 0.08934004604816437, 0.15769118070602417, 0.22604233026504517, 0.2943934500217438, 0.3627445697784424, 0.4310957193374634, 0.4994468688964844, 0.5677980184555054, 0.6361491084098816, 0.7045002579689026, 0.7728514075279236, 0.8412024974822998, 0.9095536470413208, 0.9779047966003418, 1.0462559461593628, 1.1146070957183838, 1.1829582452774048, 1.2513093948364258, 1.3196604251861572, 1.3880115747451782, 1.4563627243041992, 1.5247138738632202, 1.5930650234222412, 1.6614161729812622, 1.7297673225402832, 1.7981183528900146, 1.8664696216583252, 1.9348206520080566, 2.003171920776367, 2.0715229511260986]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 16.0, 20.0, 33.0, 52.0, 104.0, 145.0, 233.0, 400.0, 685.0, 1169.0, 1926.0, 3260.0, 5428.0, 9318.0, 15524.0, 25828.0, 42270.0, 65918.0, 95814.0, 126941.0, 145913.0, 143131.0, 120443.0, 88683.0, 59615.0, 38254.0, 23097.0, 14061.0, 8248.0, 4847.0, 2863.0, 1707.0, 1088.0, 605.0, 349.0, 234.0, 107.0, 83.0, 60.0, 28.0, 19.0, 10.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.77349853515625, -2.6837158203125, -2.59393310546875, -2.504150390625, -2.41436767578125, -2.3245849609375, -2.23480224609375, -2.14501953125, -2.05523681640625, -1.9654541015625, -1.87567138671875, -1.785888671875, -1.69610595703125, -1.6063232421875, -1.51654052734375, -1.4267578125, -1.33697509765625, -1.2471923828125, -1.15740966796875, -1.067626953125, -0.97784423828125, -0.8880615234375, -0.79827880859375, -0.70849609375, -0.61871337890625, -0.5289306640625, -0.43914794921875, -0.349365234375, -0.25958251953125, -0.1697998046875, -0.08001708984375, 0.009765625, 0.09954833984375, 0.1893310546875, 0.27911376953125, 0.368896484375, 0.45867919921875, 0.5484619140625, 0.63824462890625, 0.72802734375, 0.81781005859375, 0.9075927734375, 0.99737548828125, 1.087158203125, 1.17694091796875, 1.2667236328125, 1.35650634765625, 1.4462890625, 1.53607177734375, 1.6258544921875, 1.71563720703125, 1.805419921875, 1.89520263671875, 1.9849853515625, 2.07476806640625, 2.16455078125, 2.25433349609375, 2.3441162109375, 2.43389892578125, 2.523681640625, 2.61346435546875, 2.7032470703125, 2.79302978515625, 2.8828125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 2.0, 6.0, 8.0, 11.0, 13.0, 7.0, 9.0, 12.0, 21.0, 17.0, 24.0, 30.0, 30.0, 28.0, 35.0, 30.0, 40.0, 54.0, 51.0, 47.0, 39.0, 52.0, 52.0, 32.0, 41.0, 43.0, 32.0, 36.0, 33.0, 24.0, 22.0, 16.0, 27.0, 17.0, 11.0, 12.0, 7.0, 7.0, 8.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.783203125, -2.69830322265625, -2.6134033203125, -2.52850341796875, -2.443603515625, -2.35870361328125, -2.2738037109375, -2.18890380859375, -2.10400390625, -2.01910400390625, -1.9342041015625, -1.84930419921875, -1.764404296875, -1.67950439453125, -1.5946044921875, -1.50970458984375, -1.4248046875, -1.33990478515625, -1.2550048828125, -1.17010498046875, -1.085205078125, -1.00030517578125, -0.9154052734375, -0.83050537109375, -0.74560546875, -0.66070556640625, -0.5758056640625, -0.49090576171875, -0.406005859375, -0.32110595703125, -0.2362060546875, -0.15130615234375, -0.06640625, 0.01849365234375, 0.1033935546875, 0.18829345703125, 0.273193359375, 0.35809326171875, 0.4429931640625, 0.52789306640625, 0.61279296875, 0.69769287109375, 0.7825927734375, 0.86749267578125, 0.952392578125, 1.03729248046875, 1.1221923828125, 1.20709228515625, 1.2919921875, 1.37689208984375, 1.4617919921875, 1.54669189453125, 1.631591796875, 1.71649169921875, 1.8013916015625, 1.88629150390625, 1.97119140625, 2.05609130859375, 2.1409912109375, 2.22589111328125, 2.310791015625, 2.39569091796875, 2.4805908203125, 2.56549072265625, 2.650390625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [7.0, 4.0, 10.0, 7.0, 9.0, 17.0, 24.0, 31.0, 47.0, 73.0, 103.0, 185.0, 257.0, 328.0, 540.0, 869.0, 1343.0, 1948.0, 3217.0, 4800.0, 7691.0, 11740.0, 18029.0, 26917.0, 39656.0, 56290.0, 76811.0, 98115.0, 115070.0, 121740.0, 115073.0, 98111.0, 76621.0, 56326.0, 39183.0, 26356.0, 17872.0, 11873.0, 7636.0, 4804.0, 3134.0, 1936.0, 1287.0, 846.0, 551.0, 377.0, 236.0, 157.0, 111.0, 56.0, 53.0, 30.0, 19.0, 13.0, 7.0, 7.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.353515625, -2.273712158203125, -2.19390869140625, -2.114105224609375, -2.0343017578125, -1.954498291015625, -1.87469482421875, -1.794891357421875, -1.715087890625, -1.635284423828125, -1.55548095703125, -1.475677490234375, -1.3958740234375, -1.316070556640625, -1.23626708984375, -1.156463623046875, -1.07666015625, -0.996856689453125, -0.91705322265625, -0.837249755859375, -0.7574462890625, -0.677642822265625, -0.59783935546875, -0.518035888671875, -0.438232421875, -0.358428955078125, -0.27862548828125, -0.198822021484375, -0.1190185546875, -0.039215087890625, 0.04058837890625, 0.120391845703125, 0.2001953125, 0.279998779296875, 0.35980224609375, 0.439605712890625, 0.5194091796875, 0.599212646484375, 0.67901611328125, 0.758819580078125, 0.838623046875, 0.918426513671875, 0.99822998046875, 1.078033447265625, 1.1578369140625, 1.237640380859375, 1.31744384765625, 1.397247314453125, 1.47705078125, 1.556854248046875, 1.63665771484375, 1.716461181640625, 1.7962646484375, 1.876068115234375, 1.95587158203125, 2.035675048828125, 2.115478515625, 2.195281982421875, 2.27508544921875, 2.354888916015625, 2.4346923828125, 2.514495849609375, 2.59429931640625, 2.674102783203125, 2.75390625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 8.0, 11.0, 12.0, 12.0, 27.0, 18.0, 25.0, 27.0, 25.0, 23.0, 32.0, 38.0, 41.0, 45.0, 49.0, 57.0, 38.0, 38.0, 42.0, 47.0, 33.0, 43.0, 30.0, 30.0, 32.0, 40.0, 23.0, 29.0, 14.0, 14.0, 9.0, 16.0, 14.0, 15.0, 12.0, 8.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341796875, -1.4817047119140625, -1.429229736328125, -1.3767547607421875, -1.32427978515625, -1.2718048095703125, -1.219329833984375, -1.1668548583984375, -1.1143798828125, -1.0619049072265625, -1.009429931640625, -0.9569549560546875, -0.90447998046875, -0.8520050048828125, -0.799530029296875, -0.7470550537109375, -0.694580078125, -0.6421051025390625, -0.589630126953125, -0.5371551513671875, -0.48468017578125, -0.4322052001953125, -0.379730224609375, -0.3272552490234375, -0.2747802734375, -0.2223052978515625, -0.169830322265625, -0.1173553466796875, -0.06488037109375, -0.0124053955078125, 0.040069580078125, 0.0925445556640625, 0.14501953125, 0.1974945068359375, 0.249969482421875, 0.3024444580078125, 0.35491943359375, 0.4073944091796875, 0.459869384765625, 0.5123443603515625, 0.5648193359375, 0.6172943115234375, 0.669769287109375, 0.7222442626953125, 0.77471923828125, 0.8271942138671875, 0.879669189453125, 0.9321441650390625, 0.984619140625, 1.0370941162109375, 1.089569091796875, 1.1420440673828125, 1.19451904296875, 1.2469940185546875, 1.299468994140625, 1.3519439697265625, 1.4044189453125, 1.4568939208984375, 1.509368896484375, 1.5618438720703125, 1.61431884765625, 1.6667938232421875, 1.719268798828125, 1.7717437744140625, 1.82421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 12.0, 13.0, 19.0, 19.0, 38.0, 58.0, 101.0, 138.0, 169.0, 271.0, 376.0, 576.0, 891.0, 1442.0, 2243.0, 3948.0, 7350.0, 14212.0, 29975.0, 67393.0, 149151.0, 262970.0, 252250.0, 136940.0, 60883.0, 27424.0, 13226.0, 6649.0, 3808.0, 2159.0, 1301.0, 831.0, 587.0, 356.0, 223.0, 182.0, 117.0, 91.0, 45.0, 40.0, 24.0, 21.0, 9.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.65234375, -3.5343017578125, -3.416259765625, -3.2982177734375, -3.18017578125, -3.0621337890625, -2.944091796875, -2.8260498046875, -2.7080078125, -2.5899658203125, -2.471923828125, -2.3538818359375, -2.23583984375, -2.1177978515625, -1.999755859375, -1.8817138671875, -1.763671875, -1.6456298828125, -1.527587890625, -1.4095458984375, -1.29150390625, -1.1734619140625, -1.055419921875, -0.9373779296875, -0.8193359375, -0.7012939453125, -0.583251953125, -0.4652099609375, -0.34716796875, -0.2291259765625, -0.111083984375, 0.0069580078125, 0.125, 0.2430419921875, 0.361083984375, 0.4791259765625, 0.59716796875, 0.7152099609375, 0.833251953125, 0.9512939453125, 1.0693359375, 1.1873779296875, 1.305419921875, 1.4234619140625, 1.54150390625, 1.6595458984375, 1.777587890625, 1.8956298828125, 2.013671875, 2.1317138671875, 2.249755859375, 2.3677978515625, 2.48583984375, 2.6038818359375, 2.721923828125, 2.8399658203125, 2.9580078125, 3.0760498046875, 3.194091796875, 3.3121337890625, 3.43017578125, 3.5482177734375, 3.666259765625, 3.7843017578125, 3.90234375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 6.0, 12.0, 12.0, 19.0, 41.0, 75.0, 86.0, 126.0, 133.0, 142.0, 125.0, 68.0, 43.0, 32.0, 15.0, 13.0, 14.0, 8.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006952285766601562, -0.0006757825613021851, -0.0006563365459442139, -0.0006368905305862427, -0.0006174445152282715, -0.0005979984998703003, -0.0005785524845123291, -0.0005591064691543579, -0.0005396604537963867, -0.0005202144384384155, -0.0005007684230804443, -0.00048132240772247314, -0.00046187639236450195, -0.00044243037700653076, -0.00042298436164855957, -0.0004035383462905884, -0.0003840923309326172, -0.000364646315574646, -0.0003452003002166748, -0.0003257542848587036, -0.0003063082695007324, -0.00028686225414276123, -0.00026741623878479004, -0.00024797022342681885, -0.00022852420806884766, -0.00020907819271087646, -0.00018963217735290527, -0.00017018616199493408, -0.0001507401466369629, -0.0001312941312789917, -0.00011184811592102051, -9.240210056304932e-05, -7.295608520507812e-05, -5.3510069847106934e-05, -3.406405448913574e-05, -1.461803913116455e-05, 4.827976226806641e-06, 2.4273991584777832e-05, 4.3720006942749023e-05, 6.316602230072021e-05, 8.26120376586914e-05, 0.0001020580530166626, 0.00012150406837463379, 0.00014095008373260498, 0.00016039609909057617, 0.00017984211444854736, 0.00019928812980651855, 0.00021873414516448975, 0.00023818016052246094, 0.00025762617588043213, 0.0002770721912384033, 0.0002965182065963745, 0.0003159642219543457, 0.0003354102373123169, 0.0003548562526702881, 0.0003743022680282593, 0.00039374828338623047, 0.00041319429874420166, 0.00043264031410217285, 0.00045208632946014404, 0.00047153234481811523, 0.0004909783601760864, 0.0005104243755340576, 0.0005298703908920288, 0.00054931640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 7.0, 4.0, 9.0, 9.0, 13.0, 18.0, 28.0, 51.0, 43.0, 68.0, 108.0, 156.0, 252.0, 335.0, 451.0, 677.0, 1043.0, 1639.0, 2499.0, 4097.0, 6827.0, 11936.0, 21632.0, 39723.0, 73011.0, 129017.0, 193036.0, 207174.0, 152723.0, 89910.0, 49047.0, 26647.0, 14712.0, 8121.0, 4901.0, 3002.0, 1853.0, 1173.0, 828.0, 538.0, 386.0, 267.0, 170.0, 127.0, 87.0, 62.0, 50.0, 22.0, 31.0, 11.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.431640625, -2.3536376953125, -2.275634765625, -2.1976318359375, -2.11962890625, -2.0416259765625, -1.963623046875, -1.8856201171875, -1.8076171875, -1.7296142578125, -1.651611328125, -1.5736083984375, -1.49560546875, -1.4176025390625, -1.339599609375, -1.2615966796875, -1.18359375, -1.1055908203125, -1.027587890625, -0.9495849609375, -0.87158203125, -0.7935791015625, -0.715576171875, -0.6375732421875, -0.5595703125, -0.4815673828125, -0.403564453125, -0.3255615234375, -0.24755859375, -0.1695556640625, -0.091552734375, -0.0135498046875, 0.064453125, 0.1424560546875, 0.220458984375, 0.2984619140625, 0.37646484375, 0.4544677734375, 0.532470703125, 0.6104736328125, 0.6884765625, 0.7664794921875, 0.844482421875, 0.9224853515625, 1.00048828125, 1.0784912109375, 1.156494140625, 1.2344970703125, 1.3125, 1.3905029296875, 1.468505859375, 1.5465087890625, 1.62451171875, 1.7025146484375, 1.780517578125, 1.8585205078125, 1.9365234375, 2.0145263671875, 2.092529296875, 2.1705322265625, 2.24853515625, 2.3265380859375, 2.404541015625, 2.4825439453125, 2.560546875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 0.0, 8.0, 10.0, 11.0, 17.0, 16.0, 27.0, 33.0, 38.0, 49.0, 44.0, 54.0, 58.0, 60.0, 79.0, 72.0, 66.0, 59.0, 55.0, 52.0, 23.0, 28.0, 23.0, 16.0, 14.0, 11.0, 11.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.71875, -0.696044921875, -0.67333984375, -0.650634765625, -0.6279296875, -0.605224609375, -0.58251953125, -0.559814453125, -0.537109375, -0.514404296875, -0.49169921875, -0.468994140625, -0.4462890625, -0.423583984375, -0.40087890625, -0.378173828125, -0.35546875, -0.332763671875, -0.31005859375, -0.287353515625, -0.2646484375, -0.241943359375, -0.21923828125, -0.196533203125, -0.173828125, -0.151123046875, -0.12841796875, -0.105712890625, -0.0830078125, -0.060302734375, -0.03759765625, -0.014892578125, 0.0078125, 0.030517578125, 0.05322265625, 0.075927734375, 0.0986328125, 0.121337890625, 0.14404296875, 0.166748046875, 0.189453125, 0.212158203125, 0.23486328125, 0.257568359375, 0.2802734375, 0.302978515625, 0.32568359375, 0.348388671875, 0.37109375, 0.393798828125, 0.41650390625, 0.439208984375, 0.4619140625, 0.484619140625, 0.50732421875, 0.530029296875, 0.552734375, 0.575439453125, 0.59814453125, 0.620849609375, 0.6435546875, 0.666259765625, 0.68896484375, 0.711669921875, 0.734375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 10.0, 13.0, 14.0, 16.0, 12.0, 29.0, 17.0, 30.0, 33.0, 34.0, 48.0, 37.0, 61.0, 58.0, 61.0, 57.0, 66.0, 66.0, 46.0, 49.0, 38.0, 35.0, 27.0, 19.0, 22.0, 23.0, 7.0, 7.0, 13.0, 4.0, 11.0, 11.0, 7.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.617569446563721, -4.47745418548584, -4.337339401245117, -4.197224140167236, -4.0571088790893555, -3.9169936180114746, -3.776878595352173, -3.636763572692871, -3.4966483116149902, -3.3565330505371094, -3.2164180278778076, -3.076303005218506, -2.936187744140625, -2.796072483062744, -2.6559574604034424, -2.5158424377441406, -2.3757271766662598, -2.235611915588379, -2.095496892929077, -1.9553817510604858, -1.8152666091918945, -1.6751514673233032, -1.535036325454712, -1.3949211835861206, -1.2548060417175293, -1.114690899848938, -0.9745757579803467, -0.8344606161117554, -0.6943454742431641, -0.5542303323745728, -0.41411519050598145, -0.27400004863739014, -0.13388490676879883, 0.0062302350997924805, 0.1463453769683838, 0.2864605188369751, 0.4265756607055664, 0.5666908025741577, 0.706805944442749, 0.8469210863113403, 0.9870362281799316, 1.127151370048523, 1.2672665119171143, 1.4073816537857056, 1.5474967956542969, 1.6876119375228882, 1.8277270793914795, 1.9678422212600708, 2.107957363128662, 2.248072624206543, 2.3881876468658447, 2.5283026695251465, 2.6684179306030273, 2.808533191680908, 2.94864821434021, 3.0887632369995117, 3.2288784980773926, 3.3689937591552734, 3.509108781814575, 3.649223804473877, 3.789339065551758, 3.9294543266296387, 4.0695695877075195, 4.209684371948242, 4.349799633026123]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 9.0, 9.0, 10.0, 13.0, 17.0, 10.0, 18.0, 21.0, 33.0, 14.0, 33.0, 31.0, 38.0, 31.0, 33.0, 33.0, 43.0, 30.0, 39.0, 41.0, 38.0, 34.0, 34.0, 30.0, 40.0, 28.0, 33.0, 28.0, 31.0, 39.0, 14.0, 20.0, 15.0, 24.0, 6.0, 19.0, 11.0, 8.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-2.5560855865478516, -2.4842679500579834, -2.412450075149536, -2.340632438659668, -2.2688148021698, -2.1969971656799316, -2.1251792907714844, -2.053361654281616, -1.9815438985824585, -1.9097261428833008, -1.8379085063934326, -1.766090750694275, -1.6942729949951172, -1.622455358505249, -1.5506376028060913, -1.4788198471069336, -1.4070022106170654, -1.3351844549179077, -1.2633668184280396, -1.1915490627288818, -1.1197314262390137, -1.047913670539856, -0.9760959148406982, -0.9042782187461853, -0.8324605226516724, -0.7606428265571594, -0.6888251304626465, -0.6170073747634888, -0.5451896786689758, -0.4733719825744629, -0.40155425667762756, -0.32973653078079224, -0.2579185962677002, -0.18610088527202606, -0.11428317427635193, -0.042465463280677795, 0.029352247714996338, 0.10116994380950928, 0.1729876697063446, 0.24480539560317993, 0.31662309169769287, 0.3884407877922058, 0.46025851368904114, 0.5320762395858765, 0.6038939356803894, 0.6757116317749023, 0.7475293874740601, 0.819347083568573, 0.8911647796630859, 0.9629824757575989, 1.0348001718521118, 1.1066179275512695, 1.1784355640411377, 1.2502533197402954, 1.3220710754394531, 1.3938887119293213, 1.465706467628479, 1.5375242233276367, 1.6093418598175049, 1.6811596155166626, 1.7529773712158203, 1.8247950077056885, 1.8966127634048462, 1.968430519104004, 2.040248155593872]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 17.0, 17.0, 30.0, 26.0, 41.0, 84.0, 134.0, 181.0, 324.0, 457.0, 765.0, 1264.0, 2062.0, 3540.0, 6323.0, 11072.0, 20599.0, 39078.0, 77915.0, 164238.0, 369744.0, 805057.0, 1157518.0, 819576.0, 379241.0, 168429.0, 79440.0, 39743.0, 21030.0, 11352.0, 6233.0, 3606.0, 2044.0, 1215.0, 753.0, 441.0, 255.0, 153.0, 98.0, 72.0, 41.0, 29.0, 17.0, 7.0, 6.0, 9.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.9453125, -4.793212890625, -4.64111328125, -4.489013671875, -4.3369140625, -4.184814453125, -4.03271484375, -3.880615234375, -3.728515625, -3.576416015625, -3.42431640625, -3.272216796875, -3.1201171875, -2.968017578125, -2.81591796875, -2.663818359375, -2.51171875, -2.359619140625, -2.20751953125, -2.055419921875, -1.9033203125, -1.751220703125, -1.59912109375, -1.447021484375, -1.294921875, -1.142822265625, -0.99072265625, -0.838623046875, -0.6865234375, -0.534423828125, -0.38232421875, -0.230224609375, -0.078125, 0.073974609375, 0.22607421875, 0.378173828125, 0.5302734375, 0.682373046875, 0.83447265625, 0.986572265625, 1.138671875, 1.290771484375, 1.44287109375, 1.594970703125, 1.7470703125, 1.899169921875, 2.05126953125, 2.203369140625, 2.35546875, 2.507568359375, 2.65966796875, 2.811767578125, 2.9638671875, 3.115966796875, 3.26806640625, 3.420166015625, 3.572265625, 3.724365234375, 3.87646484375, 4.028564453125, 4.1806640625, 4.332763671875, 4.48486328125, 4.636962890625, 4.7890625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 5.0, 9.0, 16.0, 17.0, 14.0, 20.0, 23.0, 29.0, 24.0, 32.0, 35.0, 42.0, 45.0, 33.0, 35.0, 42.0, 50.0, 35.0, 45.0, 49.0, 44.0, 35.0, 31.0, 29.0, 24.0, 33.0, 22.0, 26.0, 24.0, 24.0, 15.0, 12.0, 18.0, 9.0, 7.0, 6.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.353515625, -2.2865753173828125, -2.219635009765625, -2.1526947021484375, -2.08575439453125, -2.0188140869140625, -1.951873779296875, -1.8849334716796875, -1.8179931640625, -1.7510528564453125, -1.684112548828125, -1.6171722412109375, -1.55023193359375, -1.4832916259765625, -1.416351318359375, -1.3494110107421875, -1.282470703125, -1.2155303955078125, -1.148590087890625, -1.0816497802734375, -1.01470947265625, -0.9477691650390625, -0.880828857421875, -0.8138885498046875, -0.7469482421875, -0.6800079345703125, -0.613067626953125, -0.5461273193359375, -0.47918701171875, -0.4122467041015625, -0.345306396484375, -0.2783660888671875, -0.21142578125, -0.1444854736328125, -0.077545166015625, -0.0106048583984375, 0.05633544921875, 0.1232757568359375, 0.190216064453125, 0.2571563720703125, 0.3240966796875, 0.3910369873046875, 0.457977294921875, 0.5249176025390625, 0.59185791015625, 0.6587982177734375, 0.725738525390625, 0.7926788330078125, 0.859619140625, 0.9265594482421875, 0.993499755859375, 1.0604400634765625, 1.12738037109375, 1.1943206787109375, 1.261260986328125, 1.3282012939453125, 1.3951416015625, 1.4620819091796875, 1.529022216796875, 1.5959625244140625, 1.66290283203125, 1.7298431396484375, 1.796783447265625, 1.8637237548828125, 1.9306640625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 15.0, 18.0, 15.0, 34.0, 57.0, 99.0, 138.0, 227.0, 335.0, 570.0, 937.0, 1575.0, 2800.0, 4571.0, 8458.0, 15048.0, 27894.0, 52572.0, 102349.0, 205976.0, 416428.0, 775062.0, 1021311.0, 750665.0, 398872.0, 198723.0, 98801.0, 50510.0, 26396.0, 14582.0, 7974.0, 4599.0, 2648.0, 1580.0, 907.0, 577.0, 345.0, 212.0, 132.0, 91.0, 61.0, 44.0, 21.0, 18.0, 12.0, 7.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.3359375, -5.176513671875, -5.01708984375, -4.857666015625, -4.6982421875, -4.538818359375, -4.37939453125, -4.219970703125, -4.060546875, -3.901123046875, -3.74169921875, -3.582275390625, -3.4228515625, -3.263427734375, -3.10400390625, -2.944580078125, -2.78515625, -2.625732421875, -2.46630859375, -2.306884765625, -2.1474609375, -1.988037109375, -1.82861328125, -1.669189453125, -1.509765625, -1.350341796875, -1.19091796875, -1.031494140625, -0.8720703125, -0.712646484375, -0.55322265625, -0.393798828125, -0.234375, -0.074951171875, 0.08447265625, 0.243896484375, 0.4033203125, 0.562744140625, 0.72216796875, 0.881591796875, 1.041015625, 1.200439453125, 1.35986328125, 1.519287109375, 1.6787109375, 1.838134765625, 1.99755859375, 2.156982421875, 2.31640625, 2.475830078125, 2.63525390625, 2.794677734375, 2.9541015625, 3.113525390625, 3.27294921875, 3.432373046875, 3.591796875, 3.751220703125, 3.91064453125, 4.070068359375, 4.2294921875, 4.388916015625, 4.54833984375, 4.707763671875, 4.8671875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 6.0, 6.0, 15.0, 19.0, 24.0, 30.0, 40.0, 55.0, 57.0, 52.0, 81.0, 81.0, 110.0, 121.0, 165.0, 164.0, 185.0, 219.0, 219.0, 253.0, 261.0, 255.0, 232.0, 201.0, 179.0, 186.0, 147.0, 119.0, 103.0, 81.0, 66.0, 67.0, 61.0, 39.0, 33.0, 34.0, 19.0, 16.0, 10.0, 10.0, 10.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 3.0], "bins": [-1.19921875, -1.161041259765625, -1.12286376953125, -1.084686279296875, -1.0465087890625, -1.008331298828125, -0.97015380859375, -0.931976318359375, -0.893798828125, -0.855621337890625, -0.81744384765625, -0.779266357421875, -0.7410888671875, -0.702911376953125, -0.66473388671875, -0.626556396484375, -0.58837890625, -0.550201416015625, -0.51202392578125, -0.473846435546875, -0.4356689453125, -0.397491455078125, -0.35931396484375, -0.321136474609375, -0.282958984375, -0.244781494140625, -0.20660400390625, -0.168426513671875, -0.1302490234375, -0.092071533203125, -0.05389404296875, -0.015716552734375, 0.0224609375, 0.060638427734375, 0.09881591796875, 0.136993408203125, 0.1751708984375, 0.213348388671875, 0.25152587890625, 0.289703369140625, 0.327880859375, 0.366058349609375, 0.40423583984375, 0.442413330078125, 0.4805908203125, 0.518768310546875, 0.55694580078125, 0.595123291015625, 0.63330078125, 0.671478271484375, 0.70965576171875, 0.747833251953125, 0.7860107421875, 0.824188232421875, 0.86236572265625, 0.900543212890625, 0.938720703125, 0.976898193359375, 1.01507568359375, 1.053253173828125, 1.0914306640625, 1.129608154296875, 1.16778564453125, 1.205963134765625, 1.244140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 9.0, 9.0, 8.0, 8.0, 12.0, 10.0, 16.0, 23.0, 17.0, 28.0, 34.0, 34.0, 38.0, 49.0, 52.0, 56.0, 39.0, 49.0, 56.0, 46.0, 49.0, 48.0, 45.0, 46.0, 35.0, 37.0, 29.0, 15.0, 14.0, 16.0, 13.0, 15.0, 11.0, 8.0, 6.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-4.763072967529297, -4.624141216278076, -4.485208988189697, -4.346277236938477, -4.207345008850098, -4.068413257598877, -3.9294815063476562, -3.7905495166778564, -3.6516175270080566, -3.512685537338257, -3.373753547668457, -3.2348217964172363, -3.0958898067474365, -2.9569578170776367, -2.818026065826416, -2.679094076156616, -2.5401620864868164, -2.4012300968170166, -2.262298107147217, -2.123366355895996, -1.9844343662261963, -1.8455023765563965, -1.7065705060958862, -1.567638635635376, -1.4287066459655762, -1.2897746562957764, -1.1508427858352661, -1.0119109153747559, -0.872978925704956, -0.734046995639801, -0.595115065574646, -0.45618313550949097, -0.31725120544433594, -0.1783192753791809, -0.03938734531402588, 0.09954458475112915, 0.23847651481628418, 0.3774084448814392, 0.5163403749465942, 0.6552723050117493, 0.7942042350769043, 0.9331361651420593, 1.0720680952072144, 1.2109999656677246, 1.3499319553375244, 1.4888639450073242, 1.6277958154678345, 1.7667276859283447, 1.9056596755981445, 2.0445916652679443, 2.183523654937744, 2.322455406188965, 2.4613873958587646, 2.6003193855285645, 2.739251136779785, 2.878183126449585, 3.0171151161193848, 3.1560471057891846, 3.2949790954589844, 3.433910846710205, 3.572842836380005, 3.7117748260498047, 3.8507065773010254, 3.989638566970825, 4.128570556640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 11.0, 10.0, 15.0, 12.0, 9.0, 12.0, 13.0, 28.0, 28.0, 29.0, 30.0, 38.0, 38.0, 35.0, 28.0, 44.0, 49.0, 32.0, 39.0, 37.0, 32.0, 35.0, 41.0, 48.0, 37.0, 30.0, 28.0, 24.0, 20.0, 21.0, 21.0, 20.0, 15.0, 11.0, 21.0, 11.0, 9.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4725818634033203, -2.394728183746338, -2.3168742656707764, -2.239020586013794, -2.1611669063568115, -2.08331298828125, -2.0054593086242676, -1.9276056289672852, -1.8497518301010132, -1.7718980312347412, -1.6940443515777588, -1.6161905527114868, -1.5383367538452148, -1.4604830741882324, -1.3826292753219604, -1.3047754764556885, -1.226921796798706, -1.149067997932434, -1.0712143182754517, -0.9933605194091797, -0.9155067801475525, -0.8376530408859253, -0.7597992420196533, -0.6819455027580261, -0.6040917634963989, -0.5262380242347717, -0.44838425517082214, -0.37053048610687256, -0.29267674684524536, -0.21482300758361816, -0.13696923851966858, -0.059115469455718994, 0.0187380313873291, 0.09659178555011749, 0.17444553971290588, 0.25229930877685547, 0.33015304803848267, 0.40800678730010986, 0.48586055636405945, 0.563714325428009, 0.6415680646896362, 0.7194218039512634, 0.7972755432128906, 0.8751293420791626, 0.9529830813407898, 1.030836820602417, 1.108690619468689, 1.186544418334961, 1.2643980979919434, 1.3422518968582153, 1.4201055765151978, 1.4979593753814697, 1.5758130550384521, 1.6536668539047241, 1.731520652770996, 1.8093743324279785, 1.8872281312942505, 1.9650819301605225, 2.042935609817505, 2.1207892894744873, 2.198643207550049, 2.2764968872070312, 2.3543505668640137, 2.432204484939575, 2.5100581645965576]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 13.0, 14.0, 24.0, 43.0, 54.0, 93.0, 148.0, 222.0, 315.0, 506.0, 850.0, 1292.0, 1911.0, 3270.0, 4887.0, 8554.0, 14897.0, 27116.0, 50646.0, 97522.0, 178512.0, 246931.0, 186547.0, 103047.0, 53550.0, 28704.0, 15543.0, 9175.0, 5243.0, 3185.0, 2096.0, 1256.0, 808.0, 536.0, 365.0, 234.0, 146.0, 103.0, 65.0, 53.0, 24.0, 23.0, 12.0, 9.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.65673828125, -0.637725830078125, -0.61871337890625, -0.599700927734375, -0.5806884765625, -0.561676025390625, -0.54266357421875, -0.523651123046875, -0.504638671875, -0.485626220703125, -0.46661376953125, -0.447601318359375, -0.4285888671875, -0.409576416015625, -0.39056396484375, -0.371551513671875, -0.3525390625, -0.333526611328125, -0.31451416015625, -0.295501708984375, -0.2764892578125, -0.257476806640625, -0.23846435546875, -0.219451904296875, -0.200439453125, -0.181427001953125, -0.16241455078125, -0.143402099609375, -0.1243896484375, -0.105377197265625, -0.08636474609375, -0.067352294921875, -0.04833984375, -0.029327392578125, -0.01031494140625, 0.008697509765625, 0.0277099609375, 0.046722412109375, 0.06573486328125, 0.084747314453125, 0.103759765625, 0.122772216796875, 0.14178466796875, 0.160797119140625, 0.1798095703125, 0.198822021484375, 0.21783447265625, 0.236846923828125, 0.255859375, 0.274871826171875, 0.29388427734375, 0.312896728515625, 0.3319091796875, 0.350921630859375, 0.36993408203125, 0.388946533203125, 0.407958984375, 0.426971435546875, 0.44598388671875, 0.464996337890625, 0.4840087890625, 0.503021240234375, 0.52203369140625, 0.541046142578125, 0.56005859375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 12.0, 11.0, 10.0, 17.0, 17.0, 26.0, 26.0, 32.0, 43.0, 36.0, 41.0, 39.0, 50.0, 50.0, 46.0, 41.0, 43.0, 38.0, 46.0, 44.0, 36.0, 33.0, 27.0, 23.0, 32.0, 25.0, 21.0, 24.0, 14.0, 11.0, 13.0, 15.0, 6.0, 9.0, 8.0, 5.0, 7.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.34375, -3.24462890625, -3.1455078125, -3.04638671875, -2.947265625, -2.84814453125, -2.7490234375, -2.64990234375, -2.55078125, -2.45166015625, -2.3525390625, -2.25341796875, -2.154296875, -2.05517578125, -1.9560546875, -1.85693359375, -1.7578125, -1.65869140625, -1.5595703125, -1.46044921875, -1.361328125, -1.26220703125, -1.1630859375, -1.06396484375, -0.96484375, -0.86572265625, -0.7666015625, -0.66748046875, -0.568359375, -0.46923828125, -0.3701171875, -0.27099609375, -0.171875, -0.07275390625, 0.0263671875, 0.12548828125, 0.224609375, 0.32373046875, 0.4228515625, 0.52197265625, 0.62109375, 0.72021484375, 0.8193359375, 0.91845703125, 1.017578125, 1.11669921875, 1.2158203125, 1.31494140625, 1.4140625, 1.51318359375, 1.6123046875, 1.71142578125, 1.810546875, 1.90966796875, 2.0087890625, 2.10791015625, 2.20703125, 2.30615234375, 2.4052734375, 2.50439453125, 2.603515625, 2.70263671875, 2.8017578125, 2.90087890625, 3.0]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 9.0, 7.0, 9.0, 13.0, 23.0, 24.0, 20.0, 39.0, 53.0, 93.0, 101.0, 183.0, 288.0, 442.0, 749.0, 1208.0, 2079.0, 4072.0, 8481.0, 20916.0, 143793.0, 813254.0, 30291.0, 10956.0, 5045.0, 2600.0, 1400.0, 872.0, 521.0, 329.0, 214.0, 143.0, 89.0, 66.0, 54.0, 24.0, 35.0, 23.0, 14.0, 9.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.068389892578125, -2.00201416015625, -1.935638427734375, -1.8692626953125, -1.802886962890625, -1.73651123046875, -1.670135498046875, -1.603759765625, -1.537384033203125, -1.47100830078125, -1.404632568359375, -1.3382568359375, -1.271881103515625, -1.20550537109375, -1.139129638671875, -1.07275390625, -1.006378173828125, -0.94000244140625, -0.873626708984375, -0.8072509765625, -0.740875244140625, -0.67449951171875, -0.608123779296875, -0.541748046875, -0.475372314453125, -0.40899658203125, -0.342620849609375, -0.2762451171875, -0.209869384765625, -0.14349365234375, -0.077117919921875, -0.0107421875, 0.055633544921875, 0.12200927734375, 0.188385009765625, 0.2547607421875, 0.321136474609375, 0.38751220703125, 0.453887939453125, 0.520263671875, 0.586639404296875, 0.65301513671875, 0.719390869140625, 0.7857666015625, 0.852142333984375, 0.91851806640625, 0.984893798828125, 1.05126953125, 1.117645263671875, 1.18402099609375, 1.250396728515625, 1.3167724609375, 1.383148193359375, 1.44952392578125, 1.515899658203125, 1.582275390625, 1.648651123046875, 1.71502685546875, 1.781402587890625, 1.8477783203125, 1.914154052734375, 1.98052978515625, 2.046905517578125, 2.11328125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 7.0, 10.0, 9.0, 16.0, 20.0, 19.0, 22.0, 25.0, 24.0, 21.0, 29.0, 37.0, 42.0, 52.0, 53.0, 43.0, 43.0, 51.0, 47.0, 52.0, 33.0, 39.0, 38.0, 42.0, 34.0, 27.0, 20.0, 25.0, 20.0, 18.0, 15.0, 9.0, 13.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.97149658203125, -1.9019775390625, -1.83245849609375, -1.762939453125, -1.69342041015625, -1.6239013671875, -1.55438232421875, -1.48486328125, -1.41534423828125, -1.3458251953125, -1.27630615234375, -1.206787109375, -1.13726806640625, -1.0677490234375, -0.99822998046875, -0.9287109375, -0.85919189453125, -0.7896728515625, -0.72015380859375, -0.650634765625, -0.58111572265625, -0.5115966796875, -0.44207763671875, -0.37255859375, -0.30303955078125, -0.2335205078125, -0.16400146484375, -0.094482421875, -0.02496337890625, 0.0445556640625, 0.11407470703125, 0.18359375, 0.25311279296875, 0.3226318359375, 0.39215087890625, 0.461669921875, 0.53118896484375, 0.6007080078125, 0.67022705078125, 0.73974609375, 0.80926513671875, 0.8787841796875, 0.94830322265625, 1.017822265625, 1.08734130859375, 1.1568603515625, 1.22637939453125, 1.2958984375, 1.36541748046875, 1.4349365234375, 1.50445556640625, 1.573974609375, 1.64349365234375, 1.7130126953125, 1.78253173828125, 1.85205078125, 1.92156982421875, 1.9910888671875, 2.06060791015625, 2.130126953125, 2.19964599609375, 2.2691650390625, 2.33868408203125, 2.408203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 6.0, 9.0, 13.0, 4.0, 16.0, 10.0, 27.0, 43.0, 48.0, 79.0, 86.0, 157.0, 225.0, 315.0, 475.0, 725.0, 1092.0, 1873.0, 3142.0, 6158.0, 14804.0, 57839.0, 905037.0, 32810.0, 11298.0, 5070.0, 2660.0, 1561.0, 936.0, 647.0, 417.0, 301.0, 206.0, 128.0, 97.0, 58.0, 46.0, 37.0, 27.0, 18.0, 13.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6018905639648438, -0.5826873779296875, -0.5634841918945312, -0.544281005859375, -0.5250778198242188, -0.5058746337890625, -0.48667144775390625, -0.46746826171875, -0.44826507568359375, -0.4290618896484375, -0.40985870361328125, -0.390655517578125, -0.37145233154296875, -0.3522491455078125, -0.33304595947265625, -0.3138427734375, -0.29463958740234375, -0.2754364013671875, -0.25623321533203125, -0.237030029296875, -0.21782684326171875, -0.1986236572265625, -0.17942047119140625, -0.16021728515625, -0.14101409912109375, -0.1218109130859375, -0.10260772705078125, -0.083404541015625, -0.06420135498046875, -0.0449981689453125, -0.02579498291015625, -0.006591796875, 0.01261138916015625, 0.0318145751953125, 0.05101776123046875, 0.070220947265625, 0.08942413330078125, 0.1086273193359375, 0.12783050537109375, 0.14703369140625, 0.16623687744140625, 0.1854400634765625, 0.20464324951171875, 0.223846435546875, 0.24304962158203125, 0.2622528076171875, 0.28145599365234375, 0.3006591796875, 0.31986236572265625, 0.3390655517578125, 0.35826873779296875, 0.377471923828125, 0.39667510986328125, 0.4158782958984375, 0.43508148193359375, 0.45428466796875, 0.47348785400390625, 0.4926910400390625, 0.5118942260742188, 0.531097412109375, 0.5503005981445312, 0.5695037841796875, 0.5887069702148438, 0.60791015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 7.0, 2.0, 9.0, 11.0, 15.0, 18.0, 23.0, 22.0, 21.0, 20.0, 40.0, 40.0, 68.0, 75.0, 65.0, 74.0, 61.0, 53.0, 61.0, 50.0, 56.0, 33.0, 39.0, 21.0, 21.0, 14.0, 14.0, 11.0, 7.0, 6.0, 4.0, 8.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6684017181396484e-05, -5.498994141817093e-05, -5.3295865654945374e-05, -5.160178989171982e-05, -4.990771412849426e-05, -4.821363836526871e-05, -4.651956260204315e-05, -4.4825486838817596e-05, -4.313141107559204e-05, -4.1437335312366486e-05, -3.974325954914093e-05, -3.8049183785915375e-05, -3.635510802268982e-05, -3.4661032259464264e-05, -3.296695649623871e-05, -3.127288073301315e-05, -2.9578804969787598e-05, -2.7884729206562042e-05, -2.6190653443336487e-05, -2.449657768011093e-05, -2.2802501916885376e-05, -2.110842615365982e-05, -1.9414350390434265e-05, -1.772027462720871e-05, -1.6026198863983154e-05, -1.4332123100757599e-05, -1.2638047337532043e-05, -1.0943971574306488e-05, -9.249895811080933e-06, -7.555820047855377e-06, -5.861744284629822e-06, -4.167668521404266e-06, -2.473592758178711e-06, -7.795169949531555e-07, 9.145587682723999e-07, 2.6086345314979553e-06, 4.302710294723511e-06, 5.996786057949066e-06, 7.690861821174622e-06, 9.384937584400177e-06, 1.1079013347625732e-05, 1.2773089110851288e-05, 1.4467164874076843e-05, 1.61612406373024e-05, 1.7855316400527954e-05, 1.954939216375351e-05, 2.1243467926979065e-05, 2.293754369020462e-05, 2.4631619453430176e-05, 2.632569521665573e-05, 2.8019770979881287e-05, 2.9713846743106842e-05, 3.14079225063324e-05, 3.310199826955795e-05, 3.479607403278351e-05, 3.6490149796009064e-05, 3.818422555923462e-05, 3.9878301322460175e-05, 4.157237708568573e-05, 4.3266452848911285e-05, 4.496052861213684e-05, 4.6654604375362396e-05, 4.834868013858795e-05, 5.004275590181351e-05, 5.173683166503906e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 5.0, 5.0, 11.0, 15.0, 25.0, 45.0, 68.0, 96.0, 152.0, 199.0, 300.0, 536.0, 798.0, 1264.0, 1904.0, 3070.0, 4864.0, 7931.0, 13622.0, 23944.0, 47753.0, 118924.0, 319582.0, 297300.0, 106111.0, 44387.0, 22404.0, 12769.0, 7663.0, 4668.0, 2899.0, 1861.0, 1164.0, 788.0, 486.0, 276.0, 217.0, 136.0, 83.0, 77.0, 52.0, 31.0, 19.0, 12.0, 9.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.242431640625, -0.23433685302734375, -0.2262420654296875, -0.21814727783203125, -0.210052490234375, -0.20195770263671875, -0.1938629150390625, -0.18576812744140625, -0.17767333984375, -0.16957855224609375, -0.1614837646484375, -0.15338897705078125, -0.145294189453125, -0.13719940185546875, -0.1291046142578125, -0.12100982666015625, -0.1129150390625, -0.10482025146484375, -0.0967254638671875, -0.08863067626953125, -0.080535888671875, -0.07244110107421875, -0.0643463134765625, -0.05625152587890625, -0.04815673828125, -0.04006195068359375, -0.0319671630859375, -0.02387237548828125, -0.015777587890625, -0.00768280029296875, 0.0004119873046875, 0.00850677490234375, 0.0166015625, 0.02469635009765625, 0.0327911376953125, 0.04088592529296875, 0.048980712890625, 0.05707550048828125, 0.0651702880859375, 0.07326507568359375, 0.08135986328125, 0.08945465087890625, 0.0975494384765625, 0.10564422607421875, 0.113739013671875, 0.12183380126953125, 0.1299285888671875, 0.13802337646484375, 0.1461181640625, 0.15421295166015625, 0.1623077392578125, 0.17040252685546875, 0.178497314453125, 0.18659210205078125, 0.1946868896484375, 0.20278167724609375, 0.21087646484375, 0.21897125244140625, 0.2270660400390625, 0.23516082763671875, 0.243255615234375, 0.25135040283203125, 0.2594451904296875, 0.26753997802734375, 0.275634765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 9.0, 6.0, 7.0, 12.0, 8.0, 18.0, 18.0, 21.0, 22.0, 30.0, 35.0, 55.0, 85.0, 61.0, 89.0, 102.0, 81.0, 84.0, 48.0, 36.0, 24.0, 21.0, 24.0, 15.0, 9.0, 13.0, 8.0, 5.0, 4.0, 8.0, 8.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05096435546875, -0.04932594299316406, -0.047687530517578125, -0.04604911804199219, -0.04441070556640625, -0.04277229309082031, -0.041133880615234375, -0.03949546813964844, -0.0378570556640625, -0.03621864318847656, -0.034580230712890625, -0.03294181823730469, -0.03130340576171875, -0.029664993286132812, -0.028026580810546875, -0.026388168334960938, -0.024749755859375, -0.023111343383789062, -0.021472930908203125, -0.019834518432617188, -0.01819610595703125, -0.016557693481445312, -0.014919281005859375, -0.013280868530273438, -0.0116424560546875, -0.010004043579101562, -0.008365631103515625, -0.0067272186279296875, -0.00508880615234375, -0.0034503936767578125, -0.001811981201171875, -0.0001735687255859375, 0.00146484375, 0.0031032562255859375, 0.004741668701171875, 0.0063800811767578125, 0.00801849365234375, 0.009656906127929688, 0.011295318603515625, 0.012933731079101562, 0.0145721435546875, 0.016210556030273438, 0.017848968505859375, 0.019487380981445312, 0.02112579345703125, 0.022764205932617188, 0.024402618408203125, 0.026041030883789062, 0.027679443359375, 0.029317855834960938, 0.030956268310546875, 0.03259468078613281, 0.03423309326171875, 0.03587150573730469, 0.037509918212890625, 0.03914833068847656, 0.0407867431640625, 0.04242515563964844, 0.044063568115234375, 0.04570198059082031, 0.04734039306640625, 0.04897880554199219, 0.050617218017578125, 0.05225563049316406, 0.05389404296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 9.0, 6.0, 11.0, 9.0, 10.0, 17.0, 21.0, 15.0, 22.0, 41.0, 31.0, 37.0, 39.0, 56.0, 54.0, 42.0, 43.0, 52.0, 54.0, 41.0, 47.0, 50.0, 40.0, 39.0, 40.0, 33.0, 25.0, 11.0, 11.0, 14.0, 16.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.538368225097656, -4.402956008911133, -4.267544269561768, -4.132132053375244, -3.996720314025879, -3.8613083362579346, -3.7258963584899902, -3.590484142303467, -3.4550724029541016, -3.3196604251861572, -3.184248447418213, -3.0488364696502686, -2.913424491882324, -2.77801251411438, -2.6426005363464355, -2.507188320159912, -2.3717763423919678, -2.2363643646240234, -2.100952386856079, -1.9655404090881348, -1.8301284313201904, -1.694716453552246, -1.5593043565750122, -1.4238923788070679, -1.2884804010391235, -1.1530684232711792, -1.0176564455032349, -0.8822444081306458, -0.7468324303627014, -0.6114204525947571, -0.47600841522216797, -0.34059643745422363, -0.2051844596862793, -0.06977246701717377, 0.06563952565193176, 0.2010515332221985, 0.3364635109901428, 0.47187548875808716, 0.6072875261306763, 0.7426995038986206, 0.8781114816665649, 1.0135234594345093, 1.1489354372024536, 1.2843475341796875, 1.4197595119476318, 1.5551714897155762, 1.6905834674835205, 1.8259954452514648, 1.9614074230194092, 2.0968194007873535, 2.232231378555298, 2.367643356323242, 2.5030553340911865, 2.638467311859131, 2.7738795280456543, 2.9092912673950195, 3.044703483581543, 3.1801154613494873, 3.3155274391174316, 3.450939416885376, 3.5863513946533203, 3.7217633724212646, 3.857175350189209, 3.9925875663757324, 4.127999305725098]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 12.0, 11.0, 10.0, 15.0, 9.0, 15.0, 7.0, 19.0, 33.0, 25.0, 30.0, 27.0, 40.0, 34.0, 35.0, 31.0, 40.0, 48.0, 41.0, 33.0, 35.0, 35.0, 31.0, 40.0, 50.0, 37.0, 27.0, 27.0, 26.0, 18.0, 23.0, 20.0, 17.0, 14.0, 14.0, 19.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.394810438156128, -2.318641185760498, -2.2424721717834473, -2.1663029193878174, -2.0901339054107666, -2.0139646530151367, -1.9377955198287964, -1.861626386642456, -1.7854571342468262, -1.7092880010604858, -1.6331188678741455, -1.5569496154785156, -1.4807804822921753, -1.404611349105835, -1.3284422159194946, -1.2522730827331543, -1.176103949546814, -1.0999348163604736, -1.0237656831741333, -0.9475964903831482, -0.8714272975921631, -0.7952581644058228, -0.7190890312194824, -0.6429198384284973, -0.566750705242157, -0.49058154225349426, -0.41441237926483154, -0.3382432460784912, -0.2620740830898285, -0.18590492010116577, -0.10973578691482544, -0.03356659412384033, 0.0426025390625, 0.11877169460058212, 0.19494085013866425, 0.27110999822616577, 0.3472791612148285, 0.4234483242034912, 0.49961745738983154, 0.5757866501808167, 0.651955783367157, 0.7281249165534973, 0.8042941093444824, 0.8804632425308228, 0.9566323757171631, 1.032801628112793, 1.1089706420898438, 1.1851398944854736, 1.261309027671814, 1.3374781608581543, 1.4136472940444946, 1.489816427230835, 1.5659856796264648, 1.6421548128128052, 1.7183239459991455, 1.7944931983947754, 1.8706622123718262, 1.9468313455581665, 2.023000478744507, 2.0991697311401367, 2.1753387451171875, 2.2515079975128174, 2.3276772499084473, 2.403846263885498, 2.480015516281128]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 25.0, 30.0, 48.0, 78.0, 86.0, 121.0, 205.0, 309.0, 524.0, 939.0, 1610.0, 2642.0, 4895.0, 8901.0, 16857.0, 31385.0, 58225.0, 100608.0, 154838.0, 189809.0, 176991.0, 127582.0, 77803.0, 43249.0, 22905.0, 12488.0, 6612.0, 3661.0, 2078.0, 1170.0, 689.0, 421.0, 255.0, 169.0, 91.0, 71.0, 59.0, 35.0, 18.0, 11.0, 9.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.265625, -4.13128662109375, -3.9969482421875, -3.86260986328125, -3.728271484375, -3.59393310546875, -3.4595947265625, -3.32525634765625, -3.19091796875, -3.05657958984375, -2.9222412109375, -2.78790283203125, -2.653564453125, -2.51922607421875, -2.3848876953125, -2.25054931640625, -2.1162109375, -1.98187255859375, -1.8475341796875, -1.71319580078125, -1.578857421875, -1.44451904296875, -1.3101806640625, -1.17584228515625, -1.04150390625, -0.90716552734375, -0.7728271484375, -0.63848876953125, -0.504150390625, -0.36981201171875, -0.2354736328125, -0.10113525390625, 0.033203125, 0.16754150390625, 0.3018798828125, 0.43621826171875, 0.570556640625, 0.70489501953125, 0.8392333984375, 0.97357177734375, 1.10791015625, 1.24224853515625, 1.3765869140625, 1.51092529296875, 1.645263671875, 1.77960205078125, 1.9139404296875, 2.04827880859375, 2.1826171875, 2.31695556640625, 2.4512939453125, 2.58563232421875, 2.719970703125, 2.85430908203125, 2.9886474609375, 3.12298583984375, 3.25732421875, 3.39166259765625, 3.5260009765625, 3.66033935546875, 3.794677734375, 3.92901611328125, 4.0633544921875, 4.19769287109375, 4.33203125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 7.0, 9.0, 13.0, 12.0, 13.0, 19.0, 23.0, 27.0, 40.0, 31.0, 42.0, 39.0, 45.0, 49.0, 44.0, 44.0, 41.0, 35.0, 38.0, 40.0, 37.0, 41.0, 42.0, 30.0, 29.0, 40.0, 22.0, 25.0, 20.0, 10.0, 16.0, 12.0, 12.0, 11.0, 8.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.19921875, -3.10540771484375, -3.0115966796875, -2.91778564453125, -2.823974609375, -2.73016357421875, -2.6363525390625, -2.54254150390625, -2.44873046875, -2.35491943359375, -2.2611083984375, -2.16729736328125, -2.073486328125, -1.97967529296875, -1.8858642578125, -1.79205322265625, -1.6982421875, -1.60443115234375, -1.5106201171875, -1.41680908203125, -1.322998046875, -1.22918701171875, -1.1353759765625, -1.04156494140625, -0.94775390625, -0.85394287109375, -0.7601318359375, -0.66632080078125, -0.572509765625, -0.47869873046875, -0.3848876953125, -0.29107666015625, -0.197265625, -0.10345458984375, -0.0096435546875, 0.08416748046875, 0.177978515625, 0.27178955078125, 0.3656005859375, 0.45941162109375, 0.55322265625, 0.64703369140625, 0.7408447265625, 0.83465576171875, 0.928466796875, 1.02227783203125, 1.1160888671875, 1.20989990234375, 1.3037109375, 1.39752197265625, 1.4913330078125, 1.58514404296875, 1.678955078125, 1.77276611328125, 1.8665771484375, 1.96038818359375, 2.05419921875, 2.14801025390625, 2.2418212890625, 2.33563232421875, 2.429443359375, 2.52325439453125, 2.6170654296875, 2.71087646484375, 2.8046875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 17.0, 16.0, 22.0, 29.0, 54.0, 79.0, 142.0, 169.0, 318.0, 479.0, 813.0, 1300.0, 2166.0, 3702.0, 6402.0, 11074.0, 18402.0, 31268.0, 51294.0, 80654.0, 116918.0, 148935.0, 157984.0, 138826.0, 102753.0, 68981.0, 42734.0, 25952.0, 15233.0, 8960.0, 5053.0, 3093.0, 1814.0, 1077.0, 697.0, 417.0, 247.0, 150.0, 116.0, 60.0, 44.0, 31.0, 22.0, 16.0, 10.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.71484375, -3.599884033203125, -3.48492431640625, -3.369964599609375, -3.2550048828125, -3.140045166015625, -3.02508544921875, -2.910125732421875, -2.795166015625, -2.680206298828125, -2.56524658203125, -2.450286865234375, -2.3353271484375, -2.220367431640625, -2.10540771484375, -1.990447998046875, -1.87548828125, -1.760528564453125, -1.64556884765625, -1.530609130859375, -1.4156494140625, -1.300689697265625, -1.18572998046875, -1.070770263671875, -0.955810546875, -0.840850830078125, -0.72589111328125, -0.610931396484375, -0.4959716796875, -0.381011962890625, -0.26605224609375, -0.151092529296875, -0.0361328125, 0.078826904296875, 0.19378662109375, 0.308746337890625, 0.4237060546875, 0.538665771484375, 0.65362548828125, 0.768585205078125, 0.883544921875, 0.998504638671875, 1.11346435546875, 1.228424072265625, 1.3433837890625, 1.458343505859375, 1.57330322265625, 1.688262939453125, 1.80322265625, 1.918182373046875, 2.03314208984375, 2.148101806640625, 2.2630615234375, 2.378021240234375, 2.49298095703125, 2.607940673828125, 2.722900390625, 2.837860107421875, 2.95281982421875, 3.067779541015625, 3.1827392578125, 3.297698974609375, 3.41265869140625, 3.527618408203125, 3.642578125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 11.0, 12.0, 10.0, 13.0, 11.0, 13.0, 15.0, 23.0, 26.0, 26.0, 28.0, 26.0, 35.0, 33.0, 39.0, 34.0, 48.0, 36.0, 43.0, 32.0, 35.0, 31.0, 32.0, 25.0, 33.0, 27.0, 34.0, 27.0, 27.0, 20.0, 23.0, 16.0, 23.0, 14.0, 9.0, 18.0, 14.0, 3.0, 12.0, 2.0, 11.0, 8.0, 1.0, 5.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0], "bins": [-1.66796875, -1.618438720703125, -1.56890869140625, -1.519378662109375, -1.4698486328125, -1.420318603515625, -1.37078857421875, -1.321258544921875, -1.271728515625, -1.222198486328125, -1.17266845703125, -1.123138427734375, -1.0736083984375, -1.024078369140625, -0.97454833984375, -0.925018310546875, -0.87548828125, -0.825958251953125, -0.77642822265625, -0.726898193359375, -0.6773681640625, -0.627838134765625, -0.57830810546875, -0.528778076171875, -0.479248046875, -0.429718017578125, -0.38018798828125, -0.330657958984375, -0.2811279296875, -0.231597900390625, -0.18206787109375, -0.132537841796875, -0.0830078125, -0.033477783203125, 0.01605224609375, 0.065582275390625, 0.1151123046875, 0.164642333984375, 0.21417236328125, 0.263702392578125, 0.313232421875, 0.362762451171875, 0.41229248046875, 0.461822509765625, 0.5113525390625, 0.560882568359375, 0.61041259765625, 0.659942626953125, 0.70947265625, 0.759002685546875, 0.80853271484375, 0.858062744140625, 0.9075927734375, 0.957122802734375, 1.00665283203125, 1.056182861328125, 1.105712890625, 1.155242919921875, 1.20477294921875, 1.254302978515625, 1.3038330078125, 1.353363037109375, 1.40289306640625, 1.452423095703125, 1.501953125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 13.0, 20.0, 31.0, 33.0, 50.0, 55.0, 85.0, 89.0, 140.0, 158.0, 197.0, 271.0, 371.0, 463.0, 612.0, 853.0, 1121.0, 1565.0, 2179.0, 3323.0, 5623.0, 12627.0, 42964.0, 203496.0, 492337.0, 206416.0, 43399.0, 12877.0, 5642.0, 3226.0, 2102.0, 1521.0, 1102.0, 811.0, 670.0, 503.0, 379.0, 294.0, 211.0, 178.0, 146.0, 83.0, 76.0, 59.0, 49.0, 41.0, 22.0, 13.0, 15.0, 12.0, 9.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.8515625, -6.626953125, -6.40234375, -6.177734375, -5.953125, -5.728515625, -5.50390625, -5.279296875, -5.0546875, -4.830078125, -4.60546875, -4.380859375, -4.15625, -3.931640625, -3.70703125, -3.482421875, -3.2578125, -3.033203125, -2.80859375, -2.583984375, -2.359375, -2.134765625, -1.91015625, -1.685546875, -1.4609375, -1.236328125, -1.01171875, -0.787109375, -0.5625, -0.337890625, -0.11328125, 0.111328125, 0.3359375, 0.560546875, 0.78515625, 1.009765625, 1.234375, 1.458984375, 1.68359375, 1.908203125, 2.1328125, 2.357421875, 2.58203125, 2.806640625, 3.03125, 3.255859375, 3.48046875, 3.705078125, 3.9296875, 4.154296875, 4.37890625, 4.603515625, 4.828125, 5.052734375, 5.27734375, 5.501953125, 5.7265625, 5.951171875, 6.17578125, 6.400390625, 6.625, 6.849609375, 7.07421875, 7.298828125, 7.5234375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 25.0, 60.0, 102.0, 197.0, 213.0, 182.0, 96.0, 47.0, 15.0, 12.0, 5.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009016990661621094, -0.0008754655718803406, -0.0008492320775985718, -0.000822998583316803, -0.0007967650890350342, -0.0007705315947532654, -0.0007442981004714966, -0.0007180646061897278, -0.000691831111907959, -0.0006655976176261902, -0.0006393641233444214, -0.0006131306290626526, -0.0005868971347808838, -0.000560663640499115, -0.0005344301462173462, -0.0005081966519355774, -0.0004819631576538086, -0.0004557296633720398, -0.000429496169090271, -0.0004032626748085022, -0.0003770291805267334, -0.0003507956862449646, -0.0003245621919631958, -0.000298328697681427, -0.0002720952033996582, -0.0002458617091178894, -0.0002196282148361206, -0.0001933947205543518, -0.000167161226272583, -0.0001409277319908142, -0.00011469423770904541, -8.846074342727661e-05, -6.222724914550781e-05, -3.5993754863739014e-05, -9.760260581970215e-06, 1.6473233699798584e-05, 4.270672798156738e-05, 6.894022226333618e-05, 9.517371654510498e-05, 0.00012140721082687378, 0.00014764070510864258, 0.00017387419939041138, 0.00020010769367218018, 0.00022634118795394897, 0.0002525746822357178, 0.00027880817651748657, 0.00030504167079925537, 0.00033127516508102417, 0.00035750865936279297, 0.00038374215364456177, 0.00040997564792633057, 0.00043620914220809937, 0.00046244263648986816, 0.000488676130771637, 0.0005149096250534058, 0.0005411431193351746, 0.0005673766136169434, 0.0005936101078987122, 0.000619843602180481, 0.0006460770964622498, 0.0006723105907440186, 0.0006985440850257874, 0.0007247775793075562, 0.000751011073589325, 0.0007772445678710938]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 3.0, 6.0, 13.0, 15.0, 18.0, 32.0, 41.0, 47.0, 60.0, 78.0, 143.0, 179.0, 275.0, 374.0, 533.0, 739.0, 1164.0, 1742.0, 2586.0, 4005.0, 9112.0, 52654.0, 457300.0, 445733.0, 50738.0, 9014.0, 3926.0, 2631.0, 1705.0, 1159.0, 750.0, 530.0, 358.0, 267.0, 187.0, 110.0, 84.0, 73.0, 43.0, 37.0, 25.0, 21.0, 18.0, 5.0, 9.0, 5.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-9.9375, -9.6451416015625, -9.352783203125, -9.0604248046875, -8.76806640625, -8.4757080078125, -8.183349609375, -7.8909912109375, -7.5986328125, -7.3062744140625, -7.013916015625, -6.7215576171875, -6.42919921875, -6.1368408203125, -5.844482421875, -5.5521240234375, -5.259765625, -4.9674072265625, -4.675048828125, -4.3826904296875, -4.09033203125, -3.7979736328125, -3.505615234375, -3.2132568359375, -2.9208984375, -2.6285400390625, -2.336181640625, -2.0438232421875, -1.75146484375, -1.4591064453125, -1.166748046875, -0.8743896484375, -0.58203125, -0.2896728515625, 0.002685546875, 0.2950439453125, 0.58740234375, 0.8797607421875, 1.172119140625, 1.4644775390625, 1.7568359375, 2.0491943359375, 2.341552734375, 2.6339111328125, 2.92626953125, 3.2186279296875, 3.510986328125, 3.8033447265625, 4.095703125, 4.3880615234375, 4.680419921875, 4.9727783203125, 5.26513671875, 5.5574951171875, 5.849853515625, 6.1422119140625, 6.4345703125, 6.7269287109375, 7.019287109375, 7.3116455078125, 7.60400390625, 7.8963623046875, 8.188720703125, 8.4810791015625, 8.7734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 16.0, 36.0, 56.0, 108.0, 173.0, 202.0, 155.0, 113.0, 69.0, 27.0, 17.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9176177978515625, -1.847930908203125, -1.7782440185546875, -1.70855712890625, -1.6388702392578125, -1.569183349609375, -1.4994964599609375, -1.4298095703125, -1.3601226806640625, -1.290435791015625, -1.2207489013671875, -1.15106201171875, -1.0813751220703125, -1.011688232421875, -0.9420013427734375, -0.872314453125, -0.8026275634765625, -0.732940673828125, -0.6632537841796875, -0.59356689453125, -0.5238800048828125, -0.454193115234375, -0.3845062255859375, -0.3148193359375, -0.2451324462890625, -0.175445556640625, -0.1057586669921875, -0.03607177734375, 0.0336151123046875, 0.103302001953125, 0.1729888916015625, 0.24267578125, 0.3123626708984375, 0.382049560546875, 0.4517364501953125, 0.52142333984375, 0.5911102294921875, 0.660797119140625, 0.7304840087890625, 0.8001708984375, 0.8698577880859375, 0.939544677734375, 1.0092315673828125, 1.07891845703125, 1.1486053466796875, 1.218292236328125, 1.2879791259765625, 1.357666015625, 1.4273529052734375, 1.497039794921875, 1.5667266845703125, 1.63641357421875, 1.7061004638671875, 1.775787353515625, 1.8454742431640625, 1.9151611328125, 1.9848480224609375, 2.054534912109375, 2.1242218017578125, 2.19390869140625, 2.2635955810546875, 2.333282470703125, 2.4029693603515625, 2.47265625]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 8.0, 8.0, 12.0, 18.0, 16.0, 17.0, 17.0, 18.0, 35.0, 21.0, 34.0, 42.0, 39.0, 44.0, 37.0, 52.0, 51.0, 74.0, 59.0, 37.0, 35.0, 41.0, 46.0, 38.0, 29.0, 28.0, 20.0, 17.0, 11.0, 21.0, 9.0, 7.0, 10.0, 3.0, 6.0, 5.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.421260833740234, -4.286639213562012, -4.152018070220947, -4.017396450042725, -3.882775068283081, -3.7481536865234375, -3.613532066345215, -3.4789106845855713, -3.3442893028259277, -3.209667921066284, -3.0750465393066406, -2.940424919128418, -2.8058035373687744, -2.671182155609131, -2.536560535430908, -2.4019391536712646, -2.267317771911621, -2.1326963901519775, -1.9980748891830444, -1.8634533882141113, -1.7288320064544678, -1.5942106246948242, -1.4595891237258911, -1.324967622756958, -1.1903462409973145, -1.055724859237671, -0.9211033582687378, -0.7864819169044495, -0.6518604755401611, -0.5172390341758728, -0.3826175928115845, -0.24799615144729614, -0.11337423324584961, 0.02124720811843872, 0.15586864948272705, 0.2904900908470154, 0.4251115322113037, 0.559732973575592, 0.6943544149398804, 0.8289758563041687, 0.963597297668457, 1.0982186794281006, 1.2328401803970337, 1.3674616813659668, 1.5020830631256104, 1.636704444885254, 1.771325945854187, 1.9059474468231201, 2.0405688285827637, 2.1751902103424072, 2.309811592102051, 2.4444332122802734, 2.579054594039917, 2.7136759757995605, 2.848297595977783, 2.9829189777374268, 3.1175403594970703, 3.252161741256714, 3.3867831230163574, 3.52140474319458, 3.6560261249542236, 3.790647506713867, 3.92526912689209, 4.059890270233154, 4.194511890411377]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 4.0, 6.0, 7.0, 8.0, 14.0, 21.0, 22.0, 15.0, 22.0, 23.0, 26.0, 20.0, 23.0, 36.0, 37.0, 38.0, 42.0, 37.0, 40.0, 27.0, 36.0, 34.0, 37.0, 36.0, 26.0, 40.0, 35.0, 35.0, 30.0, 28.0, 22.0, 22.0, 26.0, 20.0, 17.0, 5.0, 7.0, 14.0, 13.0, 5.0, 8.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.6036057472229004, -2.5236926078796387, -2.443779468536377, -2.3638663291931152, -2.2839531898498535, -2.204040050506592, -2.12412691116333, -2.0442137718200684, -1.9643006324768066, -1.884387493133545, -1.8044743537902832, -1.7245612144470215, -1.6446480751037598, -1.564734935760498, -1.4848217964172363, -1.4049086570739746, -1.3249953985214233, -1.2450822591781616, -1.1651691198349, -1.0852559804916382, -1.0053428411483765, -0.9254297018051147, -0.8455165028572083, -0.7656033635139465, -0.6856902241706848, -0.6057770848274231, -0.5258639454841614, -0.44595077633857727, -0.36603763699531555, -0.28612449765205383, -0.20621132850646973, -0.126298189163208, -0.04638504981994629, 0.03352809697389603, 0.11344124376773834, 0.19335439801216125, 0.273267537355423, 0.3531806766986847, 0.4330938458442688, 0.5130069851875305, 0.5929201245307922, 0.672833263874054, 0.7527464032173157, 0.8326596021652222, 0.9125727415084839, 0.9924858808517456, 1.0723990201950073, 1.152312159538269, 1.2322252988815308, 1.3121384382247925, 1.3920515775680542, 1.471964716911316, 1.5518778562545776, 1.6317909955978394, 1.7117042541503906, 1.7916173934936523, 1.871530532836914, 1.9514436721801758, 2.0313568115234375, 2.111269950866699, 2.191183090209961, 2.2710962295532227, 2.3510093688964844, 2.430922508239746, 2.510835647583008]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 12.0, 8.0, 28.0, 26.0, 32.0, 58.0, 99.0, 93.0, 168.0, 261.0, 368.0, 520.0, 783.0, 1111.0, 1782.0, 2639.0, 4183.0, 6756.0, 10744.0, 17625.0, 29981.0, 52567.0, 95982.0, 180449.0, 346564.0, 627920.0, 889814.0, 817818.0, 510290.0, 270558.0, 141820.0, 76576.0, 42805.0, 24500.0, 14710.0, 8873.0, 5612.0, 3596.0, 2236.0, 1481.0, 968.0, 616.0, 443.0, 268.0, 176.0, 126.0, 83.0, 54.0, 38.0, 23.0, 15.0, 8.0, 8.0, 2.0, 2.0, 3.0], "bins": [-4.6328125, -4.499725341796875, -4.36663818359375, -4.233551025390625, -4.1004638671875, -3.967376708984375, -3.83428955078125, -3.701202392578125, -3.568115234375, -3.435028076171875, -3.30194091796875, -3.168853759765625, -3.0357666015625, -2.902679443359375, -2.76959228515625, -2.636505126953125, -2.50341796875, -2.370330810546875, -2.23724365234375, -2.104156494140625, -1.9710693359375, -1.837982177734375, -1.70489501953125, -1.571807861328125, -1.438720703125, -1.305633544921875, -1.17254638671875, -1.039459228515625, -0.9063720703125, -0.773284912109375, -0.64019775390625, -0.507110595703125, -0.3740234375, -0.240936279296875, -0.10784912109375, 0.025238037109375, 0.1583251953125, 0.291412353515625, 0.42449951171875, 0.557586669921875, 0.690673828125, 0.823760986328125, 0.95684814453125, 1.089935302734375, 1.2230224609375, 1.356109619140625, 1.48919677734375, 1.622283935546875, 1.75537109375, 1.888458251953125, 2.02154541015625, 2.154632568359375, 2.2877197265625, 2.420806884765625, 2.55389404296875, 2.686981201171875, 2.820068359375, 2.953155517578125, 3.08624267578125, 3.219329833984375, 3.3524169921875, 3.485504150390625, 3.61859130859375, 3.751678466796875, 3.884765625]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 5.0, 2.0, 9.0, 11.0, 9.0, 10.0, 10.0, 22.0, 22.0, 19.0, 27.0, 25.0, 22.0, 30.0, 31.0, 41.0, 31.0, 46.0, 37.0, 40.0, 34.0, 40.0, 33.0, 37.0, 42.0, 43.0, 39.0, 26.0, 35.0, 34.0, 24.0, 23.0, 23.0, 21.0, 19.0, 16.0, 8.0, 12.0, 6.0, 4.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.345703125, -2.2724609375, -2.19921875, -2.1259765625, -2.052734375, -1.9794921875, -1.90625, -1.8330078125, -1.759765625, -1.6865234375, -1.61328125, -1.5400390625, -1.466796875, -1.3935546875, -1.3203125, -1.2470703125, -1.173828125, -1.1005859375, -1.02734375, -0.9541015625, -0.880859375, -0.8076171875, -0.734375, -0.6611328125, -0.587890625, -0.5146484375, -0.44140625, -0.3681640625, -0.294921875, -0.2216796875, -0.1484375, -0.0751953125, -0.001953125, 0.0712890625, 0.14453125, 0.2177734375, 0.291015625, 0.3642578125, 0.4375, 0.5107421875, 0.583984375, 0.6572265625, 0.73046875, 0.8037109375, 0.876953125, 0.9501953125, 1.0234375, 1.0966796875, 1.169921875, 1.2431640625, 1.31640625, 1.3896484375, 1.462890625, 1.5361328125, 1.609375, 1.6826171875, 1.755859375, 1.8291015625, 1.90234375, 1.9755859375, 2.048828125, 2.1220703125, 2.1953125, 2.2685546875, 2.341796875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 18.0, 33.0, 31.0, 52.0, 81.0, 112.0, 204.0, 286.0, 404.0, 675.0, 1115.0, 1652.0, 2733.0, 4343.0, 7060.0, 11690.0, 19764.0, 34120.0, 59776.0, 107753.0, 195242.0, 353582.0, 604979.0, 838242.0, 780767.0, 512215.0, 290859.0, 159397.0, 87459.0, 49180.0, 27997.0, 16448.0, 9874.0, 5990.0, 3713.0, 2310.0, 1463.0, 889.0, 631.0, 381.0, 264.0, 154.0, 91.0, 85.0, 55.0, 30.0, 21.0, 14.0, 13.0, 7.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.38690185546875, -4.2347412109375, -4.08258056640625, -3.930419921875, -3.77825927734375, -3.6260986328125, -3.47393798828125, -3.32177734375, -3.16961669921875, -3.0174560546875, -2.86529541015625, -2.713134765625, -2.56097412109375, -2.4088134765625, -2.25665283203125, -2.1044921875, -1.95233154296875, -1.8001708984375, -1.64801025390625, -1.495849609375, -1.34368896484375, -1.1915283203125, -1.03936767578125, -0.88720703125, -0.73504638671875, -0.5828857421875, -0.43072509765625, -0.278564453125, -0.12640380859375, 0.0257568359375, 0.17791748046875, 0.330078125, 0.48223876953125, 0.6343994140625, 0.78656005859375, 0.938720703125, 1.09088134765625, 1.2430419921875, 1.39520263671875, 1.54736328125, 1.69952392578125, 1.8516845703125, 2.00384521484375, 2.156005859375, 2.30816650390625, 2.4603271484375, 2.61248779296875, 2.7646484375, 2.91680908203125, 3.0689697265625, 3.22113037109375, 3.373291015625, 3.52545166015625, 3.6776123046875, 3.82977294921875, 3.98193359375, 4.13409423828125, 4.2862548828125, 4.43841552734375, 4.590576171875, 4.74273681640625, 4.8948974609375, 5.04705810546875, 5.19921875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 2.0, 10.0, 10.0, 12.0, 18.0, 26.0, 29.0, 31.0, 40.0, 71.0, 67.0, 89.0, 102.0, 132.0, 170.0, 198.0, 247.0, 226.0, 270.0, 289.0, 268.0, 246.0, 258.0, 220.0, 218.0, 165.0, 148.0, 123.0, 84.0, 78.0, 62.0, 44.0, 36.0, 24.0, 15.0, 13.0, 8.0, 8.0, 2.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6845703125, -1.633544921875, -1.58251953125, -1.531494140625, -1.48046875, -1.429443359375, -1.37841796875, -1.327392578125, -1.2763671875, -1.225341796875, -1.17431640625, -1.123291015625, -1.072265625, -1.021240234375, -0.97021484375, -0.919189453125, -0.8681640625, -0.817138671875, -0.76611328125, -0.715087890625, -0.6640625, -0.613037109375, -0.56201171875, -0.510986328125, -0.4599609375, -0.408935546875, -0.35791015625, -0.306884765625, -0.255859375, -0.204833984375, -0.15380859375, -0.102783203125, -0.0517578125, -0.000732421875, 0.05029296875, 0.101318359375, 0.15234375, 0.203369140625, 0.25439453125, 0.305419921875, 0.3564453125, 0.407470703125, 0.45849609375, 0.509521484375, 0.560546875, 0.611572265625, 0.66259765625, 0.713623046875, 0.7646484375, 0.815673828125, 0.86669921875, 0.917724609375, 0.96875, 1.019775390625, 1.07080078125, 1.121826171875, 1.1728515625, 1.223876953125, 1.27490234375, 1.325927734375, 1.376953125, 1.427978515625, 1.47900390625, 1.530029296875, 1.5810546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 11.0, 11.0, 9.0, 18.0, 18.0, 21.0, 27.0, 38.0, 35.0, 54.0, 45.0, 60.0, 57.0, 70.0, 72.0, 53.0, 62.0, 44.0, 46.0, 44.0, 32.0, 41.0, 21.0, 21.0, 17.0, 16.0, 9.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.877341270446777, -5.695503234863281, -5.513665199279785, -5.331827163696289, -5.149989604949951, -4.968151569366455, -4.786313533782959, -4.604475498199463, -4.422637939453125, -4.240799903869629, -4.058961868286133, -3.877124071121216, -3.695286273956299, -3.5134482383728027, -3.3316102027893066, -3.1497721672058105, -2.9679341316223145, -2.7860960960388184, -2.6042582988739014, -2.4224202632904053, -2.2405824661254883, -2.058744430541992, -1.876906394958496, -1.6950684785842896, -1.513230562210083, -1.3313926458358765, -1.14955472946167, -0.9677166938781738, -0.7858787775039673, -0.6040408611297607, -0.42220282554626465, -0.2403649091720581, -0.05852651596069336, 0.12331143021583557, 0.3051493763923645, 0.4869873523712158, 0.6688252687454224, 0.8506631851196289, 1.032501220703125, 1.2143391370773315, 1.396177053451538, 1.5780149698257446, 1.7598528861999512, 1.9416909217834473, 2.1235289573669434, 2.3053667545318604, 2.4872047901153564, 2.6690425872802734, 2.8508806228637695, 3.0327186584472656, 3.2145564556121826, 3.3963944911956787, 3.5782322883605957, 3.760070323944092, 3.941908359527588, 4.123746395111084, 4.305583953857422, 4.487421989440918, 4.669260025024414, 4.85109806060791, 5.032935619354248, 5.214773654937744, 5.39661169052124, 5.578449726104736, 5.760287761688232]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 6.0, 4.0, 1.0, 2.0, 6.0, 4.0, 6.0, 15.0, 12.0, 9.0, 17.0, 11.0, 18.0, 22.0, 24.0, 22.0, 38.0, 28.0, 35.0, 26.0, 33.0, 33.0, 36.0, 34.0, 52.0, 40.0, 34.0, 38.0, 33.0, 37.0, 36.0, 38.0, 31.0, 24.0, 22.0, 19.0, 21.0, 27.0, 14.0, 11.0, 13.0, 19.0, 3.0, 17.0, 7.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-2.9414868354797363, -2.855492115020752, -2.7694976329803467, -2.6835029125213623, -2.597508430480957, -2.5115137100219727, -2.4255189895629883, -2.339524507522583, -2.2535300254821777, -2.1675353050231934, -2.081540822982788, -1.9955461025238037, -1.9095516204833984, -1.823556900024414, -1.7375622987747192, -1.6515676975250244, -1.56557297706604, -1.4795783758163452, -1.3935837745666504, -1.307589054107666, -1.2215945720672607, -1.1355998516082764, -1.0496052503585815, -0.9636106491088867, -0.8776160478591919, -0.7916214466094971, -0.7056268453598022, -0.6196321845054626, -0.5336375832557678, -0.447642982006073, -0.3616483211517334, -0.2756537199020386, -0.18965911865234375, -0.10366450250148773, -0.017669886350631714, 0.0683247447013855, 0.15431934595108032, 0.24031394720077515, 0.32630860805511475, 0.41230320930480957, 0.4982978105545044, 0.5842924118041992, 0.670287013053894, 0.7562816739082336, 0.8422762751579285, 0.9282708764076233, 1.014265537261963, 1.1002601385116577, 1.1862547397613525, 1.2722493410110474, 1.3582439422607422, 1.4442386627197266, 1.5302331447601318, 1.6162278652191162, 1.702222466468811, 1.7882170677185059, 1.8742116689682007, 1.9602062702178955, 2.04620099067688, 2.132195472717285, 2.2181901931762695, 2.304184675216675, 2.390179395675659, 2.4761738777160645, 2.562168598175049]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 13.0, 15.0, 29.0, 45.0, 62.0, 97.0, 193.0, 365.0, 643.0, 1373.0, 2880.0, 6527.0, 15368.0, 38433.0, 103326.0, 266688.0, 345720.0, 164898.0, 60674.0, 23282.0, 9698.0, 4349.0, 1962.0, 894.0, 443.0, 212.0, 144.0, 79.0, 44.0, 33.0, 21.0, 9.0, 15.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8223419189453125, -0.792144775390625, -0.7619476318359375, -0.73175048828125, -0.7015533447265625, -0.671356201171875, -0.6411590576171875, -0.6109619140625, -0.5807647705078125, -0.550567626953125, -0.5203704833984375, -0.49017333984375, -0.4599761962890625, -0.429779052734375, -0.3995819091796875, -0.369384765625, -0.3391876220703125, -0.308990478515625, -0.2787933349609375, -0.24859619140625, -0.2183990478515625, -0.188201904296875, -0.1580047607421875, -0.1278076171875, -0.0976104736328125, -0.067413330078125, -0.0372161865234375, -0.00701904296875, 0.0231781005859375, 0.053375244140625, 0.0835723876953125, 0.11376953125, 0.1439666748046875, 0.174163818359375, 0.2043609619140625, 0.23455810546875, 0.2647552490234375, 0.294952392578125, 0.3251495361328125, 0.3553466796875, 0.3855438232421875, 0.415740966796875, 0.4459381103515625, 0.47613525390625, 0.5063323974609375, 0.536529541015625, 0.5667266845703125, 0.596923828125, 0.6271209716796875, 0.657318115234375, 0.6875152587890625, 0.71771240234375, 0.7479095458984375, 0.778106689453125, 0.8083038330078125, 0.8385009765625, 0.8686981201171875, 0.898895263671875, 0.9290924072265625, 0.95928955078125, 0.9894866943359375, 1.019683837890625, 1.0498809814453125, 1.080078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 7.0, 12.0, 11.0, 19.0, 17.0, 25.0, 33.0, 21.0, 33.0, 28.0, 36.0, 44.0, 31.0, 40.0, 43.0, 56.0, 51.0, 47.0, 55.0, 41.0, 41.0, 39.0, 43.0, 26.0, 24.0, 28.0, 17.0, 20.0, 17.0, 17.0, 17.0, 10.0, 12.0, 12.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59765625, -3.479827880859375, -3.36199951171875, -3.244171142578125, -3.1263427734375, -3.008514404296875, -2.89068603515625, -2.772857666015625, -2.655029296875, -2.537200927734375, -2.41937255859375, -2.301544189453125, -2.1837158203125, -2.065887451171875, -1.94805908203125, -1.830230712890625, -1.71240234375, -1.594573974609375, -1.47674560546875, -1.358917236328125, -1.2410888671875, -1.123260498046875, -1.00543212890625, -0.887603759765625, -0.769775390625, -0.651947021484375, -0.53411865234375, -0.416290283203125, -0.2984619140625, -0.180633544921875, -0.06280517578125, 0.055023193359375, 0.1728515625, 0.290679931640625, 0.40850830078125, 0.526336669921875, 0.6441650390625, 0.761993408203125, 0.87982177734375, 0.997650146484375, 1.115478515625, 1.233306884765625, 1.35113525390625, 1.468963623046875, 1.5867919921875, 1.704620361328125, 1.82244873046875, 1.940277099609375, 2.05810546875, 2.175933837890625, 2.29376220703125, 2.411590576171875, 2.5294189453125, 2.647247314453125, 2.76507568359375, 2.882904052734375, 3.000732421875, 3.118560791015625, 3.23638916015625, 3.354217529296875, 3.4720458984375, 3.589874267578125, 3.70770263671875, 3.825531005859375, 3.943359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 8.0, 14.0, 16.0, 29.0, 36.0, 70.0, 111.0, 188.0, 315.0, 606.0, 1145.0, 2283.0, 5561.0, 16564.0, 92937.0, 884183.0, 29265.0, 8795.0, 3258.0, 1482.0, 727.0, 374.0, 240.0, 118.0, 87.0, 53.0, 30.0, 26.0, 6.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.017669677734375, -1.93768310546875, -1.857696533203125, -1.7777099609375, -1.697723388671875, -1.61773681640625, -1.537750244140625, -1.457763671875, -1.377777099609375, -1.29779052734375, -1.217803955078125, -1.1378173828125, -1.057830810546875, -0.97784423828125, -0.897857666015625, -0.81787109375, -0.737884521484375, -0.65789794921875, -0.577911376953125, -0.4979248046875, -0.417938232421875, -0.33795166015625, -0.257965087890625, -0.177978515625, -0.097991943359375, -0.01800537109375, 0.061981201171875, 0.1419677734375, 0.221954345703125, 0.30194091796875, 0.381927490234375, 0.4619140625, 0.541900634765625, 0.62188720703125, 0.701873779296875, 0.7818603515625, 0.861846923828125, 0.94183349609375, 1.021820068359375, 1.101806640625, 1.181793212890625, 1.26177978515625, 1.341766357421875, 1.4217529296875, 1.501739501953125, 1.58172607421875, 1.661712646484375, 1.74169921875, 1.821685791015625, 1.90167236328125, 1.981658935546875, 2.0616455078125, 2.141632080078125, 2.22161865234375, 2.301605224609375, 2.381591796875, 2.461578369140625, 2.54156494140625, 2.621551513671875, 2.7015380859375, 2.781524658203125, 2.86151123046875, 2.941497802734375, 3.021484375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 10.0, 17.0, 16.0, 20.0, 27.0, 38.0, 23.0, 31.0, 41.0, 33.0, 43.0, 40.0, 39.0, 40.0, 37.0, 52.0, 46.0, 46.0, 42.0, 37.0, 26.0, 27.0, 41.0, 31.0, 19.0, 23.0, 18.0, 15.0, 13.0, 17.0, 10.0, 5.0, 8.0, 8.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.255859375, -2.185516357421875, -2.11517333984375, -2.044830322265625, -1.9744873046875, -1.904144287109375, -1.83380126953125, -1.763458251953125, -1.693115234375, -1.622772216796875, -1.55242919921875, -1.482086181640625, -1.4117431640625, -1.341400146484375, -1.27105712890625, -1.200714111328125, -1.13037109375, -1.060028076171875, -0.98968505859375, -0.919342041015625, -0.8489990234375, -0.778656005859375, -0.70831298828125, -0.637969970703125, -0.567626953125, -0.497283935546875, -0.42694091796875, -0.356597900390625, -0.2862548828125, -0.215911865234375, -0.14556884765625, -0.075225830078125, -0.0048828125, 0.065460205078125, 0.13580322265625, 0.206146240234375, 0.2764892578125, 0.346832275390625, 0.41717529296875, 0.487518310546875, 0.557861328125, 0.628204345703125, 0.69854736328125, 0.768890380859375, 0.8392333984375, 0.909576416015625, 0.97991943359375, 1.050262451171875, 1.12060546875, 1.190948486328125, 1.26129150390625, 1.331634521484375, 1.4019775390625, 1.472320556640625, 1.54266357421875, 1.613006591796875, 1.683349609375, 1.753692626953125, 1.82403564453125, 1.894378662109375, 1.9647216796875, 2.035064697265625, 2.10540771484375, 2.175750732421875, 2.24609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 0.0, 3.0, 10.0, 17.0, 24.0, 27.0, 33.0, 73.0, 97.0, 163.0, 221.0, 371.0, 675.0, 1736.0, 6957.0, 84252.0, 938120.0, 11626.0, 2206.0, 801.0, 389.0, 240.0, 167.0, 110.0, 62.0, 53.0, 34.0, 20.0, 24.0, 4.0, 5.0, 4.0, 5.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1881103515625, -1.148681640625, -1.1092529296875, -1.06982421875, -1.0303955078125, -0.990966796875, -0.9515380859375, -0.912109375, -0.8726806640625, -0.833251953125, -0.7938232421875, -0.75439453125, -0.7149658203125, -0.675537109375, -0.6361083984375, -0.5966796875, -0.5572509765625, -0.517822265625, -0.4783935546875, -0.43896484375, -0.3995361328125, -0.360107421875, -0.3206787109375, -0.28125, -0.2418212890625, -0.202392578125, -0.1629638671875, -0.12353515625, -0.0841064453125, -0.044677734375, -0.0052490234375, 0.0341796875, 0.0736083984375, 0.113037109375, 0.1524658203125, 0.19189453125, 0.2313232421875, 0.270751953125, 0.3101806640625, 0.349609375, 0.3890380859375, 0.428466796875, 0.4678955078125, 0.50732421875, 0.5467529296875, 0.586181640625, 0.6256103515625, 0.6650390625, 0.7044677734375, 0.743896484375, 0.7833251953125, 0.82275390625, 0.8621826171875, 0.901611328125, 0.9410400390625, 0.98046875, 1.0198974609375, 1.059326171875, 1.0987548828125, 1.13818359375, 1.1776123046875, 1.217041015625, 1.2564697265625, 1.2958984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 20.0, 41.0, 67.0, 86.0, 150.0, 166.0, 152.0, 99.0, 96.0, 53.0, 24.0, 13.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012135505676269531, -0.00011796876788139343, -0.00011458247900009155, -0.00011119619011878967, -0.00010780990123748779, -0.00010442361235618591, -0.00010103732347488403, -9.765103459358215e-05, -9.426474571228027e-05, -9.08784568309784e-05, -8.749216794967651e-05, -8.410587906837463e-05, -8.071959018707275e-05, -7.733330130577087e-05, -7.3947012424469e-05, -7.056072354316711e-05, -6.717443466186523e-05, -6.378814578056335e-05, -6.0401856899261475e-05, -5.7015568017959595e-05, -5.3629279136657715e-05, -5.0242990255355835e-05, -4.6856701374053955e-05, -4.3470412492752075e-05, -4.0084123611450195e-05, -3.6697834730148315e-05, -3.3311545848846436e-05, -2.9925256967544556e-05, -2.6538968086242676e-05, -2.3152679204940796e-05, -1.9766390323638916e-05, -1.6380101442337036e-05, -1.2993812561035156e-05, -9.607523679733276e-06, -6.2212347984313965e-06, -2.8349459171295166e-06, 5.513429641723633e-07, 3.937631845474243e-06, 7.323920726776123e-06, 1.0710209608078003e-05, 1.4096498489379883e-05, 1.7482787370681763e-05, 2.0869076251983643e-05, 2.4255365133285522e-05, 2.7641654014587402e-05, 3.102794289588928e-05, 3.441423177719116e-05, 3.780052065849304e-05, 4.118680953979492e-05, 4.45730984210968e-05, 4.795938730239868e-05, 5.134567618370056e-05, 5.473196506500244e-05, 5.811825394630432e-05, 6.15045428276062e-05, 6.489083170890808e-05, 6.827712059020996e-05, 7.166340947151184e-05, 7.504969835281372e-05, 7.84359872341156e-05, 8.182227611541748e-05, 8.520856499671936e-05, 8.859485387802124e-05, 9.198114275932312e-05, 9.5367431640625e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 5.0, 18.0, 22.0, 25.0, 35.0, 53.0, 52.0, 83.0, 122.0, 158.0, 287.0, 451.0, 743.0, 1266.0, 2051.0, 3426.0, 6426.0, 19152.0, 192160.0, 728236.0, 69760.0, 11734.0, 5010.0, 2768.0, 1706.0, 1027.0, 606.0, 371.0, 243.0, 175.0, 113.0, 76.0, 54.0, 44.0, 23.0, 20.0, 18.0, 5.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.71533203125, -0.6938629150390625, -0.672393798828125, -0.6509246826171875, -0.62945556640625, -0.6079864501953125, -0.586517333984375, -0.5650482177734375, -0.5435791015625, -0.5221099853515625, -0.500640869140625, -0.4791717529296875, -0.45770263671875, -0.4362335205078125, -0.414764404296875, -0.3932952880859375, -0.371826171875, -0.3503570556640625, -0.328887939453125, -0.3074188232421875, -0.28594970703125, -0.2644805908203125, -0.243011474609375, -0.2215423583984375, -0.2000732421875, -0.1786041259765625, -0.157135009765625, -0.1356658935546875, -0.11419677734375, -0.0927276611328125, -0.071258544921875, -0.0497894287109375, -0.0283203125, -0.0068511962890625, 0.014617919921875, 0.0360870361328125, 0.05755615234375, 0.0790252685546875, 0.100494384765625, 0.1219635009765625, 0.1434326171875, 0.1649017333984375, 0.186370849609375, 0.2078399658203125, 0.22930908203125, 0.2507781982421875, 0.272247314453125, 0.2937164306640625, 0.315185546875, 0.3366546630859375, 0.358123779296875, 0.3795928955078125, 0.40106201171875, 0.4225311279296875, 0.444000244140625, 0.4654693603515625, 0.4869384765625, 0.5084075927734375, 0.529876708984375, 0.5513458251953125, 0.57281494140625, 0.5942840576171875, 0.615753173828125, 0.6372222900390625, 0.65869140625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 17.0, 39.0, 104.0, 249.0, 325.0, 145.0, 55.0, 22.0, 14.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.17509841918945312, -0.16928863525390625, -0.16347885131835938, -0.1576690673828125, -0.15185928344726562, -0.14604949951171875, -0.14023971557617188, -0.134429931640625, -0.12862014770507812, -0.12281036376953125, -0.11700057983398438, -0.1111907958984375, -0.10538101196289062, -0.09957122802734375, -0.09376144409179688, -0.08795166015625, -0.08214187622070312, -0.07633209228515625, -0.07052230834960938, -0.0647125244140625, -0.058902740478515625, -0.05309295654296875, -0.047283172607421875, -0.041473388671875, -0.035663604736328125, -0.02985382080078125, -0.024044036865234375, -0.0182342529296875, -0.012424468994140625, -0.00661468505859375, -0.000804901123046875, 0.0050048828125, 0.010814666748046875, 0.01662445068359375, 0.022434234619140625, 0.0282440185546875, 0.034053802490234375, 0.03986358642578125, 0.045673370361328125, 0.051483154296875, 0.057292938232421875, 0.06310272216796875, 0.06891250610351562, 0.0747222900390625, 0.08053207397460938, 0.08634185791015625, 0.09215164184570312, 0.09796142578125, 0.10377120971679688, 0.10958099365234375, 0.11539077758789062, 0.1212005615234375, 0.12701034545898438, 0.13282012939453125, 0.13862991333007812, 0.144439697265625, 0.15024948120117188, 0.15605926513671875, 0.16186904907226562, 0.1676788330078125, 0.17348861694335938, 0.17929840087890625, 0.18510818481445312, 0.19091796875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 0.0, 4.0, 6.0, 10.0, 12.0, 14.0, 20.0, 16.0, 24.0, 32.0, 37.0, 43.0, 56.0, 49.0, 56.0, 71.0, 67.0, 68.0, 66.0, 45.0, 52.0, 35.0, 39.0, 43.0, 25.0, 23.0, 17.0, 16.0, 16.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0382232666015625, -5.853695869445801, -5.669168472290039, -5.484641075134277, -5.300113201141357, -5.115585803985596, -4.931058406829834, -4.746531009674072, -4.562003135681152, -4.377475738525391, -4.192948341369629, -4.008420944213867, -3.8238930702209473, -3.6393656730651855, -3.454838275909424, -3.270310878753662, -3.0857834815979004, -2.9012560844421387, -2.716728448867798, -2.532201051712036, -2.3476734161376953, -2.1631460189819336, -1.9786186218261719, -1.7940911054611206, -1.6095635890960693, -1.425036072731018, -1.2405085563659668, -1.055981159210205, -0.8714536428451538, -0.6869261264801025, -0.5023987293243408, -0.31787121295928955, -0.13334321975708008, 0.051184266805648804, 0.23571175336837769, 0.4202392101287842, 0.6047667264938354, 0.7892942428588867, 0.9738216400146484, 1.1583491563796997, 1.342876672744751, 1.5274041891098022, 1.7119317054748535, 1.8964591026306152, 2.080986499786377, 2.2655141353607178, 2.4500415325164795, 2.6345691680908203, 2.819096565246582, 3.0036239624023438, 3.1881515979766846, 3.3726789951324463, 3.557206630706787, 3.741734027862549, 3.9262614250183105, 4.110788822174072, 4.295316696166992, 4.479844093322754, 4.664371490478516, 4.848898887634277, 5.033426761627197, 5.217954158782959, 5.402481555938721, 5.587008953094482, 5.771536350250244]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 6.0, 4.0, 7.0, 16.0, 9.0, 11.0, 17.0, 12.0, 16.0, 18.0, 23.0, 24.0, 33.0, 37.0, 29.0, 26.0, 33.0, 28.0, 38.0, 38.0, 44.0, 47.0, 35.0, 35.0, 30.0, 39.0, 40.0, 37.0, 31.0, 26.0, 21.0, 22.0, 20.0, 22.0, 20.0, 11.0, 13.0, 11.0, 13.0, 13.0, 8.0, 3.0, 4.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-2.915468454360962, -2.8307132720947266, -2.745957851409912, -2.6612026691436768, -2.5764474868774414, -2.491692304611206, -2.4069368839263916, -2.3221817016601562, -2.237426519393921, -2.1526713371276855, -2.067915916442871, -1.9831607341766357, -1.8984055519104004, -1.8136502504348755, -1.7288949489593506, -1.6441397666931152, -1.5593844652175903, -1.4746291637420654, -1.38987398147583, -1.3051186800003052, -1.2203634977340698, -1.135608196258545, -1.0508530139923096, -0.9660977125167847, -0.8813424706459045, -0.7965872287750244, -0.7118319869041443, -0.6270767450332642, -0.5423214435577393, -0.4575662314891815, -0.372810959815979, -0.2880557179450989, -0.20330047607421875, -0.11854522675275803, -0.0337899774312973, 0.05096527934074402, 0.13572052121162415, 0.22047576308250427, 0.3052310347557068, 0.3899862766265869, 0.47474151849746704, 0.5594967603683472, 0.6442520022392273, 0.7290072441101074, 0.8137625455856323, 0.8985177278518677, 0.9832730293273926, 1.068028211593628, 1.1527835130691528, 1.2375388145446777, 1.322293996810913, 1.407049298286438, 1.4918044805526733, 1.5765597820281982, 1.6613149642944336, 1.7460702657699585, 1.8308255672454834, 1.9155808687210083, 2.000336170196533, 2.0850913524627686, 2.169846534729004, 2.2546017169952393, 2.3393571376800537, 2.424112319946289, 2.5088675022125244]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 17.0, 27.0, 35.0, 57.0, 88.0, 122.0, 185.0, 286.0, 431.0, 696.0, 1111.0, 1903.0, 3288.0, 5812.0, 10544.0, 18859.0, 33677.0, 57791.0, 93381.0, 135890.0, 167106.0, 166151.0, 132296.0, 89937.0, 55354.0, 32104.0, 18091.0, 10067.0, 5515.0, 3052.0, 1833.0, 1064.0, 644.0, 374.0, 256.0, 156.0, 120.0, 65.0, 46.0, 29.0, 28.0, 19.0, 10.0, 10.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.2265625, -4.09429931640625, -3.9620361328125, -3.82977294921875, -3.697509765625, -3.56524658203125, -3.4329833984375, -3.30072021484375, -3.16845703125, -3.03619384765625, -2.9039306640625, -2.77166748046875, -2.639404296875, -2.50714111328125, -2.3748779296875, -2.24261474609375, -2.1103515625, -1.97808837890625, -1.8458251953125, -1.71356201171875, -1.581298828125, -1.44903564453125, -1.3167724609375, -1.18450927734375, -1.05224609375, -0.91998291015625, -0.7877197265625, -0.65545654296875, -0.523193359375, -0.39093017578125, -0.2586669921875, -0.12640380859375, 0.005859375, 0.13812255859375, 0.2703857421875, 0.40264892578125, 0.534912109375, 0.66717529296875, 0.7994384765625, 0.93170166015625, 1.06396484375, 1.19622802734375, 1.3284912109375, 1.46075439453125, 1.593017578125, 1.72528076171875, 1.8575439453125, 1.98980712890625, 2.1220703125, 2.25433349609375, 2.3865966796875, 2.51885986328125, 2.651123046875, 2.78338623046875, 2.9156494140625, 3.04791259765625, 3.18017578125, 3.31243896484375, 3.4447021484375, 3.57696533203125, 3.709228515625, 3.84149169921875, 3.9737548828125, 4.10601806640625, 4.23828125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 4.0, 9.0, 10.0, 24.0, 13.0, 19.0, 21.0, 21.0, 20.0, 22.0, 40.0, 27.0, 39.0, 33.0, 40.0, 51.0, 33.0, 41.0, 41.0, 40.0, 37.0, 32.0, 37.0, 41.0, 34.0, 23.0, 33.0, 19.0, 27.0, 20.0, 18.0, 16.0, 18.0, 8.0, 9.0, 7.0, 14.0, 6.0, 5.0, 1.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.064453125, -2.968017578125, -2.87158203125, -2.775146484375, -2.6787109375, -2.582275390625, -2.48583984375, -2.389404296875, -2.29296875, -2.196533203125, -2.10009765625, -2.003662109375, -1.9072265625, -1.810791015625, -1.71435546875, -1.617919921875, -1.521484375, -1.425048828125, -1.32861328125, -1.232177734375, -1.1357421875, -1.039306640625, -0.94287109375, -0.846435546875, -0.75, -0.653564453125, -0.55712890625, -0.460693359375, -0.3642578125, -0.267822265625, -0.17138671875, -0.074951171875, 0.021484375, 0.117919921875, 0.21435546875, 0.310791015625, 0.4072265625, 0.503662109375, 0.60009765625, 0.696533203125, 0.79296875, 0.889404296875, 0.98583984375, 1.082275390625, 1.1787109375, 1.275146484375, 1.37158203125, 1.468017578125, 1.564453125, 1.660888671875, 1.75732421875, 1.853759765625, 1.9501953125, 2.046630859375, 2.14306640625, 2.239501953125, 2.3359375, 2.432373046875, 2.52880859375, 2.625244140625, 2.7216796875, 2.818115234375, 2.91455078125, 3.010986328125, 3.107421875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 7.0, 18.0, 36.0, 49.0, 73.0, 117.0, 165.0, 317.0, 503.0, 798.0, 1360.0, 2190.0, 3784.0, 6525.0, 10644.0, 18411.0, 29744.0, 48212.0, 73391.0, 103778.0, 133679.0, 147435.0, 138712.0, 111602.0, 80247.0, 52811.0, 33582.0, 20618.0, 11946.0, 7128.0, 4295.0, 2587.0, 1464.0, 880.0, 554.0, 314.0, 199.0, 137.0, 75.0, 53.0, 30.0, 26.0, 21.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.88671875, -3.771087646484375, -3.65545654296875, -3.539825439453125, -3.4241943359375, -3.308563232421875, -3.19293212890625, -3.077301025390625, -2.961669921875, -2.846038818359375, -2.73040771484375, -2.614776611328125, -2.4991455078125, -2.383514404296875, -2.26788330078125, -2.152252197265625, -2.03662109375, -1.920989990234375, -1.80535888671875, -1.689727783203125, -1.5740966796875, -1.458465576171875, -1.34283447265625, -1.227203369140625, -1.111572265625, -0.995941162109375, -0.88031005859375, -0.764678955078125, -0.6490478515625, -0.533416748046875, -0.41778564453125, -0.302154541015625, -0.1865234375, -0.070892333984375, 0.04473876953125, 0.160369873046875, 0.2760009765625, 0.391632080078125, 0.50726318359375, 0.622894287109375, 0.738525390625, 0.854156494140625, 0.96978759765625, 1.085418701171875, 1.2010498046875, 1.316680908203125, 1.43231201171875, 1.547943115234375, 1.66357421875, 1.779205322265625, 1.89483642578125, 2.010467529296875, 2.1260986328125, 2.241729736328125, 2.35736083984375, 2.472991943359375, 2.588623046875, 2.704254150390625, 2.81988525390625, 2.935516357421875, 3.0511474609375, 3.166778564453125, 3.28240966796875, 3.398040771484375, 3.513671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 6.0, 3.0, 7.0, 17.0, 13.0, 17.0, 18.0, 16.0, 24.0, 28.0, 27.0, 28.0, 48.0, 30.0, 46.0, 43.0, 39.0, 34.0, 44.0, 44.0, 47.0, 38.0, 40.0, 40.0, 36.0, 33.0, 23.0, 22.0, 26.0, 28.0, 23.0, 23.0, 19.0, 14.0, 15.0, 4.0, 8.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.099609375, -2.035552978515625, -1.97149658203125, -1.907440185546875, -1.8433837890625, -1.779327392578125, -1.71527099609375, -1.651214599609375, -1.587158203125, -1.523101806640625, -1.45904541015625, -1.394989013671875, -1.3309326171875, -1.266876220703125, -1.20281982421875, -1.138763427734375, -1.07470703125, -1.010650634765625, -0.94659423828125, -0.882537841796875, -0.8184814453125, -0.754425048828125, -0.69036865234375, -0.626312255859375, -0.562255859375, -0.498199462890625, -0.43414306640625, -0.370086669921875, -0.3060302734375, -0.241973876953125, -0.17791748046875, -0.113861083984375, -0.0498046875, 0.014251708984375, 0.07830810546875, 0.142364501953125, 0.2064208984375, 0.270477294921875, 0.33453369140625, 0.398590087890625, 0.462646484375, 0.526702880859375, 0.59075927734375, 0.654815673828125, 0.7188720703125, 0.782928466796875, 0.84698486328125, 0.911041259765625, 0.97509765625, 1.039154052734375, 1.10321044921875, 1.167266845703125, 1.2313232421875, 1.295379638671875, 1.35943603515625, 1.423492431640625, 1.487548828125, 1.551605224609375, 1.61566162109375, 1.679718017578125, 1.7437744140625, 1.807830810546875, 1.87188720703125, 1.935943603515625, 2.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 9.0, 12.0, 11.0, 27.0, 39.0, 47.0, 69.0, 116.0, 163.0, 244.0, 376.0, 698.0, 1120.0, 1787.0, 3114.0, 5363.0, 9602.0, 17432.0, 32410.0, 59348.0, 104130.0, 160288.0, 196487.0, 176084.0, 120811.0, 71256.0, 39184.0, 21067.0, 11568.0, 6369.0, 3703.0, 2170.0, 1301.0, 795.0, 493.0, 298.0, 208.0, 115.0, 79.0, 49.0, 39.0, 28.0, 12.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.384765625, -2.311737060546875, -2.23870849609375, -2.165679931640625, -2.0926513671875, -2.019622802734375, -1.94659423828125, -1.873565673828125, -1.800537109375, -1.727508544921875, -1.65447998046875, -1.581451416015625, -1.5084228515625, -1.435394287109375, -1.36236572265625, -1.289337158203125, -1.21630859375, -1.143280029296875, -1.07025146484375, -0.997222900390625, -0.9241943359375, -0.851165771484375, -0.77813720703125, -0.705108642578125, -0.632080078125, -0.559051513671875, -0.48602294921875, -0.412994384765625, -0.3399658203125, -0.266937255859375, -0.19390869140625, -0.120880126953125, -0.0478515625, 0.025177001953125, 0.09820556640625, 0.171234130859375, 0.2442626953125, 0.317291259765625, 0.39031982421875, 0.463348388671875, 0.536376953125, 0.609405517578125, 0.68243408203125, 0.755462646484375, 0.8284912109375, 0.901519775390625, 0.97454833984375, 1.047576904296875, 1.12060546875, 1.193634033203125, 1.26666259765625, 1.339691162109375, 1.4127197265625, 1.485748291015625, 1.55877685546875, 1.631805419921875, 1.704833984375, 1.777862548828125, 1.85089111328125, 1.923919677734375, 1.9969482421875, 2.069976806640625, 2.14300537109375, 2.216033935546875, 2.2890625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 11.0, 10.0, 22.0, 15.0, 53.0, 58.0, 82.0, 87.0, 106.0, 113.0, 104.0, 91.0, 78.0, 55.0, 38.0, 24.0, 13.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004456043243408203, -0.00043368712067604065, -0.000421769917011261, -0.0004098527133464813, -0.00039793550968170166, -0.000386018306016922, -0.00037410110235214233, -0.00036218389868736267, -0.000350266695022583, -0.00033834949135780334, -0.0003264322876930237, -0.000314515084028244, -0.00030259788036346436, -0.0002906806766986847, -0.00027876347303390503, -0.00026684626936912537, -0.0002549290657043457, -0.00024301186203956604, -0.00023109465837478638, -0.00021917745471000671, -0.00020726025104522705, -0.0001953430473804474, -0.00018342584371566772, -0.00017150864005088806, -0.0001595914363861084, -0.00014767423272132874, -0.00013575702905654907, -0.0001238398253917694, -0.00011192262172698975, -0.00010000541806221008, -8.808821439743042e-05, -7.617101073265076e-05, -6.42538070678711e-05, -5.233660340309143e-05, -4.041939973831177e-05, -2.8502196073532104e-05, -1.658499240875244e-05, -4.667788743972778e-06, 7.249414920806885e-06, 1.9166618585586548e-05, 3.108382225036621e-05, 4.3001025915145874e-05, 5.491822957992554e-05, 6.68354332447052e-05, 7.875263690948486e-05, 9.066984057426453e-05, 0.00010258704423904419, 0.00011450424790382385, 0.00012642145156860352, 0.00013833865523338318, 0.00015025585889816284, 0.0001621730625629425, 0.00017409026622772217, 0.00018600746989250183, 0.0001979246735572815, 0.00020984187722206116, 0.00022175908088684082, 0.00023367628455162048, 0.00024559348821640015, 0.0002575106918811798, 0.00026942789554595947, 0.00028134509921073914, 0.0002932623028755188, 0.00030517950654029846, 0.0003170967102050781]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 12.0, 16.0, 25.0, 17.0, 37.0, 52.0, 58.0, 98.0, 130.0, 170.0, 240.0, 350.0, 577.0, 883.0, 1376.0, 2336.0, 3973.0, 6767.0, 12000.0, 21484.0, 39239.0, 69864.0, 118888.0, 173203.0, 193835.0, 160429.0, 104667.0, 60084.0, 33658.0, 18785.0, 10251.0, 5812.0, 3471.0, 1993.0, 1304.0, 823.0, 552.0, 350.0, 220.0, 153.0, 98.0, 88.0, 52.0, 33.0, 28.0, 21.0, 19.0, 10.0, 11.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0], "bins": [-2.384765625, -2.31109619140625, -2.2374267578125, -2.16375732421875, -2.090087890625, -2.01641845703125, -1.9427490234375, -1.86907958984375, -1.79541015625, -1.72174072265625, -1.6480712890625, -1.57440185546875, -1.500732421875, -1.42706298828125, -1.3533935546875, -1.27972412109375, -1.2060546875, -1.13238525390625, -1.0587158203125, -0.98504638671875, -0.911376953125, -0.83770751953125, -0.7640380859375, -0.69036865234375, -0.61669921875, -0.54302978515625, -0.4693603515625, -0.39569091796875, -0.322021484375, -0.24835205078125, -0.1746826171875, -0.10101318359375, -0.02734375, 0.04632568359375, 0.1199951171875, 0.19366455078125, 0.267333984375, 0.34100341796875, 0.4146728515625, 0.48834228515625, 0.56201171875, 0.63568115234375, 0.7093505859375, 0.78302001953125, 0.856689453125, 0.93035888671875, 1.0040283203125, 1.07769775390625, 1.1513671875, 1.22503662109375, 1.2987060546875, 1.37237548828125, 1.446044921875, 1.51971435546875, 1.5933837890625, 1.66705322265625, 1.74072265625, 1.81439208984375, 1.8880615234375, 1.96173095703125, 2.035400390625, 2.10906982421875, 2.1827392578125, 2.25640869140625, 2.330078125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 9.0, 5.0, 11.0, 13.0, 16.0, 24.0, 25.0, 35.0, 32.0, 38.0, 38.0, 50.0, 48.0, 66.0, 57.0, 55.0, 60.0, 43.0, 52.0, 45.0, 47.0, 34.0, 30.0, 24.0, 14.0, 26.0, 15.0, 16.0, 13.0, 8.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.642578125, -0.6241302490234375, -0.605682373046875, -0.5872344970703125, -0.56878662109375, -0.5503387451171875, -0.531890869140625, -0.5134429931640625, -0.4949951171875, -0.4765472412109375, -0.458099365234375, -0.4396514892578125, -0.42120361328125, -0.4027557373046875, -0.384307861328125, -0.3658599853515625, -0.347412109375, -0.3289642333984375, -0.310516357421875, -0.2920684814453125, -0.27362060546875, -0.2551727294921875, -0.236724853515625, -0.2182769775390625, -0.1998291015625, -0.1813812255859375, -0.162933349609375, -0.1444854736328125, -0.12603759765625, -0.1075897216796875, -0.089141845703125, -0.0706939697265625, -0.05224609375, -0.0337982177734375, -0.015350341796875, 0.0030975341796875, 0.02154541015625, 0.0399932861328125, 0.058441162109375, 0.0768890380859375, 0.0953369140625, 0.1137847900390625, 0.132232666015625, 0.1506805419921875, 0.16912841796875, 0.1875762939453125, 0.206024169921875, 0.2244720458984375, 0.242919921875, 0.2613677978515625, 0.279815673828125, 0.2982635498046875, 0.31671142578125, 0.3351593017578125, 0.353607177734375, 0.3720550537109375, 0.3905029296875, 0.4089508056640625, 0.427398681640625, 0.4458465576171875, 0.46429443359375, 0.4827423095703125, 0.501190185546875, 0.5196380615234375, 0.5380859375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 6.0, 8.0, 11.0, 16.0, 21.0, 21.0, 30.0, 32.0, 35.0, 44.0, 48.0, 68.0, 58.0, 63.0, 81.0, 74.0, 58.0, 59.0, 49.0, 39.0, 27.0, 31.0, 33.0, 23.0, 11.0, 9.0, 12.0, 6.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.592738151550293, -6.400635719299316, -6.20853328704834, -6.016430854797363, -5.824328422546387, -5.63222599029541, -5.440123558044434, -5.248021125793457, -5.0559186935424805, -4.863816261291504, -4.671713829040527, -4.479611396789551, -4.287508964538574, -4.095406532287598, -3.9033043384552, -3.7112019062042236, -3.519099712371826, -3.3269972801208496, -3.134894847869873, -2.9427924156188965, -2.75068998336792, -2.5585875511169434, -2.366485357284546, -2.1743829250335693, -1.9822804927825928, -1.7901780605316162, -1.5980756282806396, -1.4059733152389526, -1.213870882987976, -1.0217684507369995, -0.8296661376953125, -0.6375637054443359, -0.4454612731933594, -0.2533588707447052, -0.061256468296051025, 0.13084590435028076, 0.3229483366012573, 0.5150507688522339, 0.7071530818939209, 0.8992555141448975, 1.091357946395874, 1.2834603786468506, 1.4755628108978271, 1.6676651239395142, 1.8597675561904907, 2.0518698692321777, 2.2439723014831543, 2.436074733734131, 2.6281771659851074, 2.820279598236084, 3.0123820304870605, 3.204484462738037, 3.3965868949890137, 3.5886893272399902, 3.7807915210723877, 3.9728939533233643, 4.164996147155762, 4.357098579406738, 4.549201011657715, 4.741303443908691, 4.933405876159668, 5.1255083084106445, 5.317610740661621, 5.509713172912598, 5.701815605163574]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 10.0, 12.0, 16.0, 22.0, 15.0, 18.0, 24.0, 27.0, 28.0, 35.0, 32.0, 32.0, 37.0, 50.0, 42.0, 39.0, 37.0, 57.0, 40.0, 42.0, 38.0, 47.0, 30.0, 34.0, 25.0, 28.0, 28.0, 18.0, 27.0, 17.0, 15.0, 11.0, 5.0, 11.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.537686347961426, -3.4350030422210693, -3.332319498062134, -3.2296361923217773, -3.126952886581421, -3.0242693424224854, -2.921586036682129, -2.8189024925231934, -2.716219186782837, -2.6135358810424805, -2.510852336883545, -2.4081690311431885, -2.305485725402832, -2.2028021812438965, -2.10011887550354, -1.997435450553894, -1.8947521448135376, -1.7920687198638916, -1.6893854141235352, -1.5867019891738892, -1.4840185642242432, -1.3813352584838867, -1.2786518335342407, -1.1759684085845947, -1.0732851028442383, -0.9706017374992371, -0.8679183125495911, -0.7652349472045898, -0.6625515222549438, -0.5598681569099426, -0.4571847915649414, -0.3545013666152954, -0.2518179416656494, -0.1491345465183258, -0.04645116627216339, 0.05623221397399902, 0.15891560912132263, 0.26159900426864624, 0.36428236961364746, 0.46696579456329346, 0.5696491599082947, 0.6723325252532959, 0.7750159502029419, 0.8776993155479431, 0.9803826808929443, 1.0830661058425903, 1.1857495307922363, 1.2884328365325928, 1.3911162614822388, 1.4937996864318848, 1.5964829921722412, 1.6991664171218872, 1.8018498420715332, 1.9045331478118896, 2.007216453552246, 2.1098999977111816, 2.212583303451538, 2.3152666091918945, 2.41795015335083, 2.5206334590911865, 2.623316764831543, 2.7260003089904785, 2.828683614730835, 2.9313669204711914, 3.034050464630127]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 9.0, 7.0, 10.0, 22.0, 20.0, 29.0, 35.0, 60.0, 77.0, 126.0, 169.0, 253.0, 401.0, 579.0, 967.0, 1484.0, 2329.0, 3797.0, 6305.0, 10285.0, 18535.0, 34119.0, 65099.0, 132402.0, 281641.0, 586474.0, 970300.0, 954120.0, 568134.0, 274482.0, 133205.0, 66654.0, 35300.0, 19418.0, 11036.0, 6572.0, 3785.0, 2356.0, 1392.0, 902.0, 518.0, 368.0, 191.0, 127.0, 77.0, 47.0, 40.0, 8.0, 4.0, 11.0, 5.0, 3.0, 1.0, 3.0], "bins": [-6.375, -6.20263671875, -6.0302734375, -5.85791015625, -5.685546875, -5.51318359375, -5.3408203125, -5.16845703125, -4.99609375, -4.82373046875, -4.6513671875, -4.47900390625, -4.306640625, -4.13427734375, -3.9619140625, -3.78955078125, -3.6171875, -3.44482421875, -3.2724609375, -3.10009765625, -2.927734375, -2.75537109375, -2.5830078125, -2.41064453125, -2.23828125, -2.06591796875, -1.8935546875, -1.72119140625, -1.548828125, -1.37646484375, -1.2041015625, -1.03173828125, -0.859375, -0.68701171875, -0.5146484375, -0.34228515625, -0.169921875, 0.00244140625, 0.1748046875, 0.34716796875, 0.51953125, 0.69189453125, 0.8642578125, 1.03662109375, 1.208984375, 1.38134765625, 1.5537109375, 1.72607421875, 1.8984375, 2.07080078125, 2.2431640625, 2.41552734375, 2.587890625, 2.76025390625, 2.9326171875, 3.10498046875, 3.27734375, 3.44970703125, 3.6220703125, 3.79443359375, 3.966796875, 4.13916015625, 4.3115234375, 4.48388671875, 4.65625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 10.0, 14.0, 7.0, 16.0, 13.0, 15.0, 22.0, 20.0, 21.0, 25.0, 27.0, 24.0, 32.0, 39.0, 34.0, 41.0, 52.0, 49.0, 41.0, 43.0, 29.0, 53.0, 45.0, 40.0, 35.0, 38.0, 22.0, 33.0, 22.0, 13.0, 25.0, 12.0, 13.0, 11.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.052734375, -2.965850830078125, -2.87896728515625, -2.792083740234375, -2.7052001953125, -2.618316650390625, -2.53143310546875, -2.444549560546875, -2.357666015625, -2.270782470703125, -2.18389892578125, -2.097015380859375, -2.0101318359375, -1.923248291015625, -1.83636474609375, -1.749481201171875, -1.66259765625, -1.575714111328125, -1.48883056640625, -1.401947021484375, -1.3150634765625, -1.228179931640625, -1.14129638671875, -1.054412841796875, -0.967529296875, -0.880645751953125, -0.79376220703125, -0.706878662109375, -0.6199951171875, -0.533111572265625, -0.44622802734375, -0.359344482421875, -0.2724609375, -0.185577392578125, -0.09869384765625, -0.011810302734375, 0.0750732421875, 0.161956787109375, 0.24884033203125, 0.335723876953125, 0.422607421875, 0.509490966796875, 0.59637451171875, 0.683258056640625, 0.7701416015625, 0.857025146484375, 0.94390869140625, 1.030792236328125, 1.11767578125, 1.204559326171875, 1.29144287109375, 1.378326416015625, 1.4652099609375, 1.552093505859375, 1.63897705078125, 1.725860595703125, 1.812744140625, 1.899627685546875, 1.98651123046875, 2.073394775390625, 2.1602783203125, 2.247161865234375, 2.33404541015625, 2.420928955078125, 2.5078125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 29.0, 34.0, 45.0, 74.0, 102.0, 171.0, 232.0, 376.0, 577.0, 905.0, 1361.0, 2128.0, 3283.0, 5203.0, 8395.0, 13655.0, 22872.0, 38670.0, 66692.0, 117931.0, 211257.0, 372398.0, 612727.0, 810640.0, 739668.0, 494160.0, 288017.0, 162159.0, 91197.0, 52108.0, 30061.0, 17832.0, 10897.0, 6661.0, 4154.0, 2649.0, 1666.0, 1098.0, 760.0, 476.0, 332.0, 202.0, 145.0, 99.0, 65.0, 50.0, 20.0, 20.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.390625, -5.220947265625, -5.05126953125, -4.881591796875, -4.7119140625, -4.542236328125, -4.37255859375, -4.202880859375, -4.033203125, -3.863525390625, -3.69384765625, -3.524169921875, -3.3544921875, -3.184814453125, -3.01513671875, -2.845458984375, -2.67578125, -2.506103515625, -2.33642578125, -2.166748046875, -1.9970703125, -1.827392578125, -1.65771484375, -1.488037109375, -1.318359375, -1.148681640625, -0.97900390625, -0.809326171875, -0.6396484375, -0.469970703125, -0.30029296875, -0.130615234375, 0.0390625, 0.208740234375, 0.37841796875, 0.548095703125, 0.7177734375, 0.887451171875, 1.05712890625, 1.226806640625, 1.396484375, 1.566162109375, 1.73583984375, 1.905517578125, 2.0751953125, 2.244873046875, 2.41455078125, 2.584228515625, 2.75390625, 2.923583984375, 3.09326171875, 3.262939453125, 3.4326171875, 3.602294921875, 3.77197265625, 3.941650390625, 4.111328125, 4.281005859375, 4.45068359375, 4.620361328125, 4.7900390625, 4.959716796875, 5.12939453125, 5.299072265625, 5.46875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 14.0, 13.0, 16.0, 13.0, 26.0, 35.0, 35.0, 30.0, 61.0, 75.0, 83.0, 98.0, 101.0, 149.0, 203.0, 193.0, 189.0, 214.0, 284.0, 264.0, 260.0, 254.0, 220.0, 190.0, 183.0, 157.0, 142.0, 109.0, 82.0, 71.0, 78.0, 50.0, 33.0, 33.0, 19.0, 16.0, 20.0, 12.0, 12.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.623046875, -1.569915771484375, -1.51678466796875, -1.463653564453125, -1.4105224609375, -1.357391357421875, -1.30426025390625, -1.251129150390625, -1.197998046875, -1.144866943359375, -1.09173583984375, -1.038604736328125, -0.9854736328125, -0.932342529296875, -0.87921142578125, -0.826080322265625, -0.77294921875, -0.719818115234375, -0.66668701171875, -0.613555908203125, -0.5604248046875, -0.507293701171875, -0.45416259765625, -0.401031494140625, -0.347900390625, -0.294769287109375, -0.24163818359375, -0.188507080078125, -0.1353759765625, -0.082244873046875, -0.02911376953125, 0.024017333984375, 0.0771484375, 0.130279541015625, 0.18341064453125, 0.236541748046875, 0.2896728515625, 0.342803955078125, 0.39593505859375, 0.449066162109375, 0.502197265625, 0.555328369140625, 0.60845947265625, 0.661590576171875, 0.7147216796875, 0.767852783203125, 0.82098388671875, 0.874114990234375, 0.92724609375, 0.980377197265625, 1.03350830078125, 1.086639404296875, 1.1397705078125, 1.192901611328125, 1.24603271484375, 1.299163818359375, 1.352294921875, 1.405426025390625, 1.45855712890625, 1.511688232421875, 1.5648193359375, 1.617950439453125, 1.67108154296875, 1.724212646484375, 1.77734375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 4.0, 4.0, 9.0, 13.0, 18.0, 15.0, 16.0, 24.0, 32.0, 34.0, 32.0, 50.0, 59.0, 52.0, 45.0, 43.0, 51.0, 50.0, 43.0, 53.0, 55.0, 52.0, 42.0, 26.0, 29.0, 28.0, 23.0, 14.0, 12.0, 11.0, 10.0, 13.0, 7.0, 3.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2430925369262695, -5.061591148376465, -4.88008975982666, -4.6985883712768555, -4.517086982727051, -4.335585594177246, -4.154084205627441, -3.9725828170776367, -3.791081428527832, -3.6095800399780273, -3.4280786514282227, -3.246577262878418, -3.0650758743286133, -2.8835744857788086, -2.702073097229004, -2.520571708679199, -2.3390703201293945, -2.15756893157959, -1.9760675430297852, -1.7945661544799805, -1.6130647659301758, -1.431563377380371, -1.2500619888305664, -1.0685606002807617, -0.887059211730957, -0.7055578231811523, -0.5240564346313477, -0.34255504608154297, -0.16105365753173828, 0.020447731018066406, 0.2019491195678711, 0.3834505081176758, 0.5649518966674805, 0.7464532852172852, 0.9279546737670898, 1.1094560623168945, 1.2909574508666992, 1.472458839416504, 1.6539602279663086, 1.8354616165161133, 2.016963005065918, 2.1984643936157227, 2.3799657821655273, 2.561467170715332, 2.7429685592651367, 2.9244699478149414, 3.105971336364746, 3.287472724914551, 3.4689741134643555, 3.65047550201416, 3.831976890563965, 4.0134782791137695, 4.194979667663574, 4.376481056213379, 4.557982444763184, 4.739483833312988, 4.920985221862793, 5.102486610412598, 5.283987998962402, 5.465489387512207, 5.646990776062012, 5.828492164611816, 6.009993553161621, 6.191494941711426, 6.3729963302612305]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 11.0, 17.0, 15.0, 8.0, 17.0, 34.0, 20.0, 18.0, 29.0, 38.0, 38.0, 33.0, 46.0, 31.0, 29.0, 45.0, 45.0, 46.0, 41.0, 37.0, 50.0, 33.0, 38.0, 35.0, 31.0, 21.0, 33.0, 16.0, 13.0, 14.0, 17.0, 19.0, 2.0, 9.0, 9.0, 12.0, 5.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.1414031982421875, -4.029458999633789, -3.9175145626068115, -3.805570363998413, -3.6936261653900146, -3.581681728363037, -3.4697375297546387, -3.3577933311462402, -3.2458488941192627, -3.1339046955108643, -3.0219602584838867, -2.9100160598754883, -2.79807186126709, -2.6861274242401123, -2.574183225631714, -2.4622387886047363, -2.350294589996338, -2.2383503913879395, -2.126405954360962, -2.0144617557525635, -1.9025174379348755, -1.7905731201171875, -1.678628921508789, -1.566684603691101, -1.4547405242919922, -1.3427962064743042, -1.2308520078659058, -1.1189076900482178, -1.0069633722305298, -0.8950191140174866, -0.7830748558044434, -0.6711305379867554, -0.5591862201690674, -0.4472419321537018, -0.3352976441383362, -0.22335338592529297, -0.11140909790992737, 0.0005351901054382324, 0.11247944831848145, 0.22442376613616943, 0.33636802434921265, 0.44831231236457825, 0.5602566003799438, 0.6722008585929871, 0.7841451168060303, 0.8960894346237183, 1.0080337524414062, 1.1199779510498047, 1.2319222688674927, 1.3438665866851807, 1.455810785293579, 1.567755103111267, 1.679699420928955, 1.7916436195373535, 1.9035879373550415, 2.0155322551727295, 2.127476453781128, 2.2394206523895264, 2.351365089416504, 2.4633092880249023, 2.575253486633301, 2.6871979236602783, 2.7991421222686768, 2.9110865592956543, 3.0230307579040527]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 12.0, 5.0, 14.0, 19.0, 27.0, 49.0, 59.0, 70.0, 137.0, 221.0, 334.0, 484.0, 769.0, 1317.0, 2010.0, 3393.0, 5778.0, 9869.0, 16975.0, 30169.0, 54598.0, 96809.0, 159514.0, 208051.0, 183464.0, 118416.0, 67481.0, 37606.0, 21276.0, 12061.0, 6941.0, 4078.0, 2457.0, 1405.0, 969.0, 622.0, 348.0, 262.0, 151.0, 113.0, 76.0, 40.0, 23.0, 27.0, 12.0, 9.0, 15.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.58251953125, -0.564697265625, -0.546875, -0.529052734375, -0.51123046875, -0.493408203125, -0.4755859375, -0.457763671875, -0.43994140625, -0.422119140625, -0.404296875, -0.386474609375, -0.36865234375, -0.350830078125, -0.3330078125, -0.315185546875, -0.29736328125, -0.279541015625, -0.26171875, -0.243896484375, -0.22607421875, -0.208251953125, -0.1904296875, -0.172607421875, -0.15478515625, -0.136962890625, -0.119140625, -0.101318359375, -0.08349609375, -0.065673828125, -0.0478515625, -0.030029296875, -0.01220703125, 0.005615234375, 0.0234375, 0.041259765625, 0.05908203125, 0.076904296875, 0.0947265625, 0.112548828125, 0.13037109375, 0.148193359375, 0.166015625, 0.183837890625, 0.20166015625, 0.219482421875, 0.2373046875, 0.255126953125, 0.27294921875, 0.290771484375, 0.30859375, 0.326416015625, 0.34423828125, 0.362060546875, 0.3798828125, 0.397705078125, 0.41552734375, 0.433349609375, 0.451171875, 0.468994140625, 0.48681640625, 0.504638671875, 0.5224609375, 0.540283203125, 0.55810546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 14.0, 17.0, 17.0, 31.0, 19.0, 27.0, 32.0, 33.0, 45.0, 48.0, 50.0, 46.0, 46.0, 49.0, 57.0, 58.0, 45.0, 50.0, 30.0, 43.0, 30.0, 26.0, 29.0, 22.0, 22.0, 22.0, 24.0, 12.0, 8.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.2186279296875, -4.066162109375, -3.9136962890625, -3.76123046875, -3.6087646484375, -3.456298828125, -3.3038330078125, -3.1513671875, -2.9989013671875, -2.846435546875, -2.6939697265625, -2.54150390625, -2.3890380859375, -2.236572265625, -2.0841064453125, -1.931640625, -1.7791748046875, -1.626708984375, -1.4742431640625, -1.32177734375, -1.1693115234375, -1.016845703125, -0.8643798828125, -0.7119140625, -0.5594482421875, -0.406982421875, -0.2545166015625, -0.10205078125, 0.0504150390625, 0.202880859375, 0.3553466796875, 0.5078125, 0.6602783203125, 0.812744140625, 0.9652099609375, 1.11767578125, 1.2701416015625, 1.422607421875, 1.5750732421875, 1.7275390625, 1.8800048828125, 2.032470703125, 2.1849365234375, 2.33740234375, 2.4898681640625, 2.642333984375, 2.7947998046875, 2.947265625, 3.0997314453125, 3.252197265625, 3.4046630859375, 3.55712890625, 3.7095947265625, 3.862060546875, 4.0145263671875, 4.1669921875, 4.3194580078125, 4.471923828125, 4.6243896484375, 4.77685546875, 4.9293212890625, 5.081787109375, 5.2342529296875, 5.38671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 15.0, 14.0, 30.0, 32.0, 40.0, 106.0, 127.0, 168.0, 258.0, 441.0, 698.0, 1220.0, 2296.0, 4421.0, 9500.0, 22672.0, 109613.0, 828059.0, 39704.0, 14855.0, 6762.0, 3215.0, 1724.0, 953.0, 576.0, 368.0, 252.0, 129.0, 101.0, 63.0, 46.0, 31.0, 20.0, 6.0, 14.0, 7.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7063446044921875, -1.648040771484375, -1.5897369384765625, -1.53143310546875, -1.4731292724609375, -1.414825439453125, -1.3565216064453125, -1.2982177734375, -1.2399139404296875, -1.181610107421875, -1.1233062744140625, -1.06500244140625, -1.0066986083984375, -0.948394775390625, -0.8900909423828125, -0.831787109375, -0.7734832763671875, -0.715179443359375, -0.6568756103515625, -0.59857177734375, -0.5402679443359375, -0.481964111328125, -0.4236602783203125, -0.3653564453125, -0.3070526123046875, -0.248748779296875, -0.1904449462890625, -0.13214111328125, -0.0738372802734375, -0.015533447265625, 0.0427703857421875, 0.10107421875, 0.1593780517578125, 0.217681884765625, 0.2759857177734375, 0.33428955078125, 0.3925933837890625, 0.450897216796875, 0.5092010498046875, 0.5675048828125, 0.6258087158203125, 0.684112548828125, 0.7424163818359375, 0.80072021484375, 0.8590240478515625, 0.917327880859375, 0.9756317138671875, 1.033935546875, 1.0922393798828125, 1.150543212890625, 1.2088470458984375, 1.26715087890625, 1.3254547119140625, 1.383758544921875, 1.4420623779296875, 1.5003662109375, 1.5586700439453125, 1.616973876953125, 1.6752777099609375, 1.73358154296875, 1.7918853759765625, 1.850189208984375, 1.9084930419921875, 1.966796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 7.0, 8.0, 15.0, 13.0, 19.0, 14.0, 19.0, 31.0, 19.0, 32.0, 40.0, 39.0, 51.0, 40.0, 36.0, 42.0, 51.0, 40.0, 46.0, 45.0, 45.0, 43.0, 39.0, 28.0, 22.0, 27.0, 34.0, 25.0, 20.0, 19.0, 13.0, 14.0, 12.0, 8.0, 7.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.3424072265625, -2.251220703125, -2.1600341796875, -2.06884765625, -1.9776611328125, -1.886474609375, -1.7952880859375, -1.7041015625, -1.6129150390625, -1.521728515625, -1.4305419921875, -1.33935546875, -1.2481689453125, -1.156982421875, -1.0657958984375, -0.974609375, -0.8834228515625, -0.792236328125, -0.7010498046875, -0.60986328125, -0.5186767578125, -0.427490234375, -0.3363037109375, -0.2451171875, -0.1539306640625, -0.062744140625, 0.0284423828125, 0.11962890625, 0.2108154296875, 0.302001953125, 0.3931884765625, 0.484375, 0.5755615234375, 0.666748046875, 0.7579345703125, 0.84912109375, 0.9403076171875, 1.031494140625, 1.1226806640625, 1.2138671875, 1.3050537109375, 1.396240234375, 1.4874267578125, 1.57861328125, 1.6697998046875, 1.760986328125, 1.8521728515625, 1.943359375, 2.0345458984375, 2.125732421875, 2.2169189453125, 2.30810546875, 2.3992919921875, 2.490478515625, 2.5816650390625, 2.6728515625, 2.7640380859375, 2.855224609375, 2.9464111328125, 3.03759765625, 3.1287841796875, 3.219970703125, 3.3111572265625, 3.40234375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 8.0, 2.0, 11.0, 8.0, 12.0, 16.0, 28.0, 41.0, 48.0, 50.0, 96.0, 131.0, 194.0, 333.0, 475.0, 793.0, 1296.0, 2049.0, 3709.0, 6809.0, 13414.0, 30020.0, 809480.0, 131997.0, 23126.0, 10830.0, 5520.0, 3199.0, 1736.0, 1107.0, 691.0, 457.0, 269.0, 210.0, 116.0, 68.0, 45.0, 50.0, 29.0, 25.0, 12.0, 15.0, 10.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.318115234375, -0.30626678466796875, -0.2944183349609375, -0.28256988525390625, -0.270721435546875, -0.25887298583984375, -0.2470245361328125, -0.23517608642578125, -0.22332763671875, -0.21147918701171875, -0.1996307373046875, -0.18778228759765625, -0.175933837890625, -0.16408538818359375, -0.1522369384765625, -0.14038848876953125, -0.1285400390625, -0.11669158935546875, -0.1048431396484375, -0.09299468994140625, -0.081146240234375, -0.06929779052734375, -0.0574493408203125, -0.04560089111328125, -0.03375244140625, -0.02190399169921875, -0.0100555419921875, 0.00179290771484375, 0.013641357421875, 0.02548980712890625, 0.0373382568359375, 0.04918670654296875, 0.06103515625, 0.07288360595703125, 0.0847320556640625, 0.09658050537109375, 0.108428955078125, 0.12027740478515625, 0.1321258544921875, 0.14397430419921875, 0.15582275390625, 0.16767120361328125, 0.1795196533203125, 0.19136810302734375, 0.203216552734375, 0.21506500244140625, 0.2269134521484375, 0.23876190185546875, 0.2506103515625, 0.26245880126953125, 0.2743072509765625, 0.28615570068359375, 0.298004150390625, 0.30985260009765625, 0.3217010498046875, 0.33354949951171875, 0.34539794921875, 0.35724639892578125, 0.3690948486328125, 0.38094329833984375, 0.392791748046875, 0.40464019775390625, 0.4164886474609375, 0.42833709716796875, 0.440185546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 12.0, 7.0, 13.0, 18.0, 16.0, 26.0, 21.0, 30.0, 19.0, 43.0, 30.0, 45.0, 41.0, 53.0, 60.0, 38.0, 54.0, 58.0, 58.0, 45.0, 45.0, 36.0, 21.0, 39.0, 24.0, 32.0, 17.0, 22.0, 13.0, 9.0, 10.0, 13.0, 4.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -3.103725612163544e-05, -3.0007213354110718e-05, -2.8977170586586e-05, -2.794712781906128e-05, -2.691708505153656e-05, -2.588704228401184e-05, -2.485699951648712e-05, -2.3826956748962402e-05, -2.2796913981437683e-05, -2.1766871213912964e-05, -2.0736828446388245e-05, -1.9706785678863525e-05, -1.8676742911338806e-05, -1.7646700143814087e-05, -1.6616657376289368e-05, -1.558661460876465e-05, -1.455657184123993e-05, -1.352652907371521e-05, -1.249648630619049e-05, -1.1466443538665771e-05, -1.0436400771141052e-05, -9.406358003616333e-06, -8.376315236091614e-06, -7.3462724685668945e-06, -6.316229701042175e-06, -5.286186933517456e-06, -4.256144165992737e-06, -3.2261013984680176e-06, -2.1960586309432983e-06, -1.166015863418579e-06, -1.3597309589385986e-07, 8.940696716308594e-07, 1.9241124391555786e-06, 2.954155206680298e-06, 3.984197974205017e-06, 5.014240741729736e-06, 6.0442835092544556e-06, 7.074326276779175e-06, 8.104369044303894e-06, 9.134411811828613e-06, 1.0164454579353333e-05, 1.1194497346878052e-05, 1.2224540114402771e-05, 1.325458288192749e-05, 1.428462564945221e-05, 1.531466841697693e-05, 1.6344711184501648e-05, 1.7374753952026367e-05, 1.8404796719551086e-05, 1.9434839487075806e-05, 2.0464882254600525e-05, 2.1494925022125244e-05, 2.2524967789649963e-05, 2.3555010557174683e-05, 2.4585053324699402e-05, 2.561509609222412e-05, 2.664513885974884e-05, 2.767518162727356e-05, 2.870522439479828e-05, 2.9735267162322998e-05, 3.076530992984772e-05, 3.1795352697372437e-05, 3.2825395464897156e-05, 3.3855438232421875e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 19.0, 22.0, 29.0, 27.0, 49.0, 53.0, 98.0, 117.0, 154.0, 238.0, 352.0, 536.0, 825.0, 1222.0, 2055.0, 3467.0, 6248.0, 11312.0, 21582.0, 43809.0, 88449.0, 170722.0, 255350.0, 209157.0, 114180.0, 56987.0, 28100.0, 14410.0, 7706.0, 4267.0, 2555.0, 1561.0, 928.0, 605.0, 404.0, 252.0, 189.0, 122.0, 77.0, 67.0, 45.0, 43.0, 27.0, 26.0, 25.0, 16.0, 13.0, 12.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 4.0], "bins": [-0.1854248046875, -0.17957305908203125, -0.1737213134765625, -0.16786956787109375, -0.162017822265625, -0.15616607666015625, -0.1503143310546875, -0.14446258544921875, -0.13861083984375, -0.13275909423828125, -0.1269073486328125, -0.12105560302734375, -0.115203857421875, -0.10935211181640625, -0.1035003662109375, -0.09764862060546875, -0.091796875, -0.08594512939453125, -0.0800933837890625, -0.07424163818359375, -0.068389892578125, -0.06253814697265625, -0.0566864013671875, -0.05083465576171875, -0.04498291015625, -0.03913116455078125, -0.0332794189453125, -0.02742767333984375, -0.021575927734375, -0.01572418212890625, -0.0098724365234375, -0.00402069091796875, 0.0018310546875, 0.00768280029296875, 0.0135345458984375, 0.01938629150390625, 0.025238037109375, 0.03108978271484375, 0.0369415283203125, 0.04279327392578125, 0.04864501953125, 0.05449676513671875, 0.0603485107421875, 0.06620025634765625, 0.072052001953125, 0.07790374755859375, 0.0837554931640625, 0.08960723876953125, 0.095458984375, 0.10131072998046875, 0.1071624755859375, 0.11301422119140625, 0.118865966796875, 0.12471771240234375, 0.1305694580078125, 0.13642120361328125, 0.14227294921875, 0.14812469482421875, 0.1539764404296875, 0.15982818603515625, 0.165679931640625, 0.17153167724609375, 0.1773834228515625, 0.18323516845703125, 0.1890869140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 3.0, 5.0, 13.0, 14.0, 17.0, 12.0, 22.0, 26.0, 24.0, 33.0, 25.0, 48.0, 44.0, 55.0, 56.0, 60.0, 73.0, 53.0, 60.0, 54.0, 28.0, 49.0, 36.0, 26.0, 27.0, 17.0, 18.0, 14.0, 15.0, 10.0, 4.0, 8.0, 4.0, 4.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03509521484375, -0.033934593200683594, -0.03277397155761719, -0.03161334991455078, -0.030452728271484375, -0.02929210662841797, -0.028131484985351562, -0.026970863342285156, -0.02581024169921875, -0.024649620056152344, -0.023488998413085938, -0.02232837677001953, -0.021167755126953125, -0.02000713348388672, -0.018846511840820312, -0.017685890197753906, -0.0165252685546875, -0.015364646911621094, -0.014204025268554688, -0.013043403625488281, -0.011882781982421875, -0.010722160339355469, -0.009561538696289062, -0.008400917053222656, -0.00724029541015625, -0.006079673767089844, -0.0049190521240234375, -0.0037584304809570312, -0.002597808837890625, -0.0014371871948242188, -0.0002765655517578125, 0.0008840560913085938, 0.002044677734375, 0.0032052993774414062, 0.0043659210205078125, 0.005526542663574219, 0.006687164306640625, 0.007847785949707031, 0.009008407592773438, 0.010169029235839844, 0.01132965087890625, 0.012490272521972656, 0.013650894165039062, 0.014811515808105469, 0.015972137451171875, 0.01713275909423828, 0.018293380737304688, 0.019454002380371094, 0.0206146240234375, 0.021775245666503906, 0.022935867309570312, 0.02409648895263672, 0.025257110595703125, 0.02641773223876953, 0.027578353881835938, 0.028738975524902344, 0.02989959716796875, 0.031060218811035156, 0.03222084045410156, 0.03338146209716797, 0.034542083740234375, 0.03570270538330078, 0.03686332702636719, 0.038023948669433594, 0.0391845703125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 3.0, 11.0, 14.0, 16.0, 14.0, 17.0, 27.0, 28.0, 43.0, 31.0, 51.0, 60.0, 55.0, 45.0, 44.0, 56.0, 44.0, 46.0, 60.0, 49.0, 45.0, 43.0, 32.0, 23.0, 28.0, 16.0, 14.0, 13.0, 12.0, 13.0, 8.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.221388816833496, -5.038038730621338, -4.85468864440918, -4.6713385581970215, -4.487988471984863, -4.304637908935547, -4.121288299560547, -3.9379377365112305, -3.7545876502990723, -3.571237564086914, -3.387887477874756, -3.2045373916625977, -3.0211870670318604, -2.837836980819702, -2.654486894607544, -2.4711365699768066, -2.2877867221832275, -2.1044366359710693, -1.9210864305496216, -1.7377363443374634, -1.5543861389160156, -1.3710360527038574, -1.1876859664916992, -1.0043357610702515, -0.8209856748580933, -0.6376355290412903, -0.4542854130268097, -0.2709352970123291, -0.08758515119552612, 0.09576499462127686, 0.27911508083343506, 0.4624652862548828, 0.645815372467041, 0.829165518283844, 1.012515664100647, 1.1958657503128052, 1.379215955734253, 1.5625660419464111, 1.7459161281585693, 1.929266333580017, 2.112616539001465, 2.295966625213623, 2.4793167114257812, 2.6626667976379395, 2.8460171222686768, 3.029367208480835, 3.212717294692993, 3.3960676193237305, 3.5794174671173096, 3.7627675533294678, 3.946117639541626, 4.129467964172363, 4.3128180503845215, 4.49616813659668, 4.679518222808838, 4.862868309020996, 5.046218395233154, 5.2295684814453125, 5.412918567657471, 5.596268653869629, 5.779618740081787, 5.962968826293945, 6.146319389343262, 6.32966947555542, 6.513019561767578]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 11.0, 17.0, 11.0, 14.0, 15.0, 31.0, 22.0, 18.0, 29.0, 39.0, 38.0, 36.0, 43.0, 29.0, 32.0, 45.0, 45.0, 44.0, 41.0, 36.0, 54.0, 34.0, 34.0, 33.0, 34.0, 21.0, 30.0, 19.0, 12.0, 15.0, 17.0, 18.0, 3.0, 10.0, 7.0, 11.0, 9.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.09265661239624, -3.9814138412475586, -3.870170831680298, -3.758928060531616, -3.6476850509643555, -3.536442279815674, -3.425199508666992, -3.3139567375183105, -3.20271372795105, -3.091470956802368, -2.9802279472351074, -2.868985176086426, -2.757742404937744, -2.6464993953704834, -2.5352566242218018, -2.424013614654541, -2.3127708435058594, -2.2015280723571777, -2.090285062789917, -1.9790422916412354, -1.8677994012832642, -1.756556510925293, -1.6453137397766113, -1.5340708494186401, -1.422827959060669, -1.3115850687026978, -1.2003421783447266, -1.089099407196045, -0.9778565168380737, -0.8666136264801025, -0.7553707957267761, -0.6441279649734497, -0.5328850746154785, -0.4216422140598297, -0.3103993535041809, -0.1991564929485321, -0.0879136323928833, 0.02332925796508789, 0.1345720887184143, 0.24581491947174072, 0.3570578098297119, 0.4683006703853607, 0.5795435309410095, 0.6907863616943359, 0.8020292520523071, 0.9132721424102783, 1.02451491355896, 1.1357578039169312, 1.2470006942749023, 1.3582435846328735, 1.4694864749908447, 1.5807292461395264, 1.6919721364974976, 1.8032150268554688, 1.9144577980041504, 2.025700569152832, 2.1369435787200928, 2.2481863498687744, 2.359429359436035, 2.470672130584717, 2.5819149017333984, 2.693157911300659, 2.804400682449341, 2.9156436920166016, 3.026886463165283]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 6.0, 14.0, 15.0, 26.0, 43.0, 64.0, 86.0, 149.0, 210.0, 388.0, 666.0, 1034.0, 1773.0, 3069.0, 5580.0, 10332.0, 19473.0, 36804.0, 66839.0, 112644.0, 165928.0, 190714.0, 167139.0, 115680.0, 68165.0, 37485.0, 20077.0, 10823.0, 5652.0, 3185.0, 1798.0, 1030.0, 626.0, 379.0, 244.0, 139.0, 78.0, 56.0, 60.0, 30.0, 17.0, 8.0, 9.0, 6.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.0797119140625, -4.901611328125, -4.7235107421875, -4.54541015625, -4.3673095703125, -4.189208984375, -4.0111083984375, -3.8330078125, -3.6549072265625, -3.476806640625, -3.2987060546875, -3.12060546875, -2.9425048828125, -2.764404296875, -2.5863037109375, -2.408203125, -2.2301025390625, -2.052001953125, -1.8739013671875, -1.69580078125, -1.5177001953125, -1.339599609375, -1.1614990234375, -0.9833984375, -0.8052978515625, -0.627197265625, -0.4490966796875, -0.27099609375, -0.0928955078125, 0.085205078125, 0.2633056640625, 0.44140625, 0.6195068359375, 0.797607421875, 0.9757080078125, 1.15380859375, 1.3319091796875, 1.510009765625, 1.6881103515625, 1.8662109375, 2.0443115234375, 2.222412109375, 2.4005126953125, 2.57861328125, 2.7567138671875, 2.934814453125, 3.1129150390625, 3.291015625, 3.4691162109375, 3.647216796875, 3.8253173828125, 4.00341796875, 4.1815185546875, 4.359619140625, 4.5377197265625, 4.7158203125, 4.8939208984375, 5.072021484375, 5.2501220703125, 5.42822265625, 5.6063232421875, 5.784423828125, 5.9625244140625, 6.140625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 4.0, 7.0, 14.0, 10.0, 21.0, 29.0, 20.0, 21.0, 21.0, 30.0, 38.0, 43.0, 41.0, 40.0, 55.0, 46.0, 51.0, 61.0, 41.0, 59.0, 50.0, 42.0, 47.0, 33.0, 32.0, 24.0, 23.0, 15.0, 15.0, 14.0, 6.0, 12.0, 8.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.30718994140625, -4.1612548828125, -4.01531982421875, -3.869384765625, -3.72344970703125, -3.5775146484375, -3.43157958984375, -3.28564453125, -3.13970947265625, -2.9937744140625, -2.84783935546875, -2.701904296875, -2.55596923828125, -2.4100341796875, -2.26409912109375, -2.1181640625, -1.97222900390625, -1.8262939453125, -1.68035888671875, -1.534423828125, -1.38848876953125, -1.2425537109375, -1.09661865234375, -0.95068359375, -0.80474853515625, -0.6588134765625, -0.51287841796875, -0.366943359375, -0.22100830078125, -0.0750732421875, 0.07086181640625, 0.216796875, 0.36273193359375, 0.5086669921875, 0.65460205078125, 0.800537109375, 0.94647216796875, 1.0924072265625, 1.23834228515625, 1.38427734375, 1.53021240234375, 1.6761474609375, 1.82208251953125, 1.968017578125, 2.11395263671875, 2.2598876953125, 2.40582275390625, 2.5517578125, 2.69769287109375, 2.8436279296875, 2.98956298828125, 3.135498046875, 3.28143310546875, 3.4273681640625, 3.57330322265625, 3.71923828125, 3.86517333984375, 4.0111083984375, 4.15704345703125, 4.302978515625, 4.44891357421875, 4.5948486328125, 4.74078369140625, 4.88671875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 13.0, 12.0, 12.0, 17.0, 36.0, 33.0, 57.0, 79.0, 103.0, 196.0, 287.0, 405.0, 625.0, 1023.0, 1771.0, 3011.0, 5222.0, 9895.0, 17824.0, 34005.0, 62454.0, 107475.0, 161693.0, 193809.0, 173018.0, 119502.0, 70579.0, 38764.0, 20876.0, 11102.0, 6040.0, 3415.0, 1926.0, 1179.0, 701.0, 470.0, 318.0, 195.0, 133.0, 86.0, 56.0, 39.0, 38.0, 22.0, 13.0, 9.0, 4.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.67779541015625, -5.4923095703125, -5.30682373046875, -5.121337890625, -4.93585205078125, -4.7503662109375, -4.56488037109375, -4.37939453125, -4.19390869140625, -4.0084228515625, -3.82293701171875, -3.637451171875, -3.45196533203125, -3.2664794921875, -3.08099365234375, -2.8955078125, -2.71002197265625, -2.5245361328125, -2.33905029296875, -2.153564453125, -1.96807861328125, -1.7825927734375, -1.59710693359375, -1.41162109375, -1.22613525390625, -1.0406494140625, -0.85516357421875, -0.669677734375, -0.48419189453125, -0.2987060546875, -0.11322021484375, 0.072265625, 0.25775146484375, 0.4432373046875, 0.62872314453125, 0.814208984375, 0.99969482421875, 1.1851806640625, 1.37066650390625, 1.55615234375, 1.74163818359375, 1.9271240234375, 2.11260986328125, 2.298095703125, 2.48358154296875, 2.6690673828125, 2.85455322265625, 3.0400390625, 3.22552490234375, 3.4110107421875, 3.59649658203125, 3.781982421875, 3.96746826171875, 4.1529541015625, 4.33843994140625, 4.52392578125, 4.70941162109375, 4.8948974609375, 5.08038330078125, 5.265869140625, 5.45135498046875, 5.6368408203125, 5.82232666015625, 6.0078125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 4.0, 10.0, 4.0, 12.0, 13.0, 9.0, 19.0, 10.0, 15.0, 18.0, 31.0, 23.0, 33.0, 36.0, 43.0, 42.0, 47.0, 33.0, 43.0, 45.0, 34.0, 37.0, 41.0, 37.0, 44.0, 33.0, 30.0, 23.0, 35.0, 27.0, 23.0, 24.0, 16.0, 20.0, 20.0, 10.0, 15.0, 9.0, 3.0, 9.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.111328125, -2.038421630859375, -1.96551513671875, -1.892608642578125, -1.8197021484375, -1.746795654296875, -1.67388916015625, -1.600982666015625, -1.528076171875, -1.455169677734375, -1.38226318359375, -1.309356689453125, -1.2364501953125, -1.163543701171875, -1.09063720703125, -1.017730712890625, -0.94482421875, -0.871917724609375, -0.79901123046875, -0.726104736328125, -0.6531982421875, -0.580291748046875, -0.50738525390625, -0.434478759765625, -0.361572265625, -0.288665771484375, -0.21575927734375, -0.142852783203125, -0.0699462890625, 0.002960205078125, 0.07586669921875, 0.148773193359375, 0.2216796875, 0.294586181640625, 0.36749267578125, 0.440399169921875, 0.5133056640625, 0.586212158203125, 0.65911865234375, 0.732025146484375, 0.804931640625, 0.877838134765625, 0.95074462890625, 1.023651123046875, 1.0965576171875, 1.169464111328125, 1.24237060546875, 1.315277099609375, 1.38818359375, 1.461090087890625, 1.53399658203125, 1.606903076171875, 1.6798095703125, 1.752716064453125, 1.82562255859375, 1.898529052734375, 1.971435546875, 2.044342041015625, 2.11724853515625, 2.190155029296875, 2.2630615234375, 2.335968017578125, 2.40887451171875, 2.481781005859375, 2.5546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 6.0, 4.0, 4.0, 9.0, 15.0, 19.0, 30.0, 41.0, 49.0, 97.0, 105.0, 151.0, 219.0, 380.0, 521.0, 824.0, 1320.0, 1920.0, 3121.0, 4948.0, 7873.0, 12922.0, 21075.0, 33874.0, 54983.0, 84998.0, 120953.0, 149523.0, 154529.0, 130626.0, 95465.0, 63379.0, 39858.0, 24656.0, 14939.0, 9342.0, 5648.0, 3578.0, 2248.0, 1489.0, 951.0, 647.0, 403.0, 258.0, 175.0, 116.0, 92.0, 61.0, 29.0, 37.0, 16.0, 11.0, 10.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-2.416015625, -2.338470458984375, -2.26092529296875, -2.183380126953125, -2.1058349609375, -2.028289794921875, -1.95074462890625, -1.873199462890625, -1.795654296875, -1.718109130859375, -1.64056396484375, -1.563018798828125, -1.4854736328125, -1.407928466796875, -1.33038330078125, -1.252838134765625, -1.17529296875, -1.097747802734375, -1.02020263671875, -0.942657470703125, -0.8651123046875, -0.787567138671875, -0.71002197265625, -0.632476806640625, -0.554931640625, -0.477386474609375, -0.39984130859375, -0.322296142578125, -0.2447509765625, -0.167205810546875, -0.08966064453125, -0.012115478515625, 0.0654296875, 0.142974853515625, 0.22052001953125, 0.298065185546875, 0.3756103515625, 0.453155517578125, 0.53070068359375, 0.608245849609375, 0.685791015625, 0.763336181640625, 0.84088134765625, 0.918426513671875, 0.9959716796875, 1.073516845703125, 1.15106201171875, 1.228607177734375, 1.30615234375, 1.383697509765625, 1.46124267578125, 1.538787841796875, 1.6163330078125, 1.693878173828125, 1.77142333984375, 1.848968505859375, 1.926513671875, 2.004058837890625, 2.08160400390625, 2.159149169921875, 2.2366943359375, 2.314239501953125, 2.39178466796875, 2.469329833984375, 2.546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 3.0, 7.0, 27.0, 8.0, 19.0, 19.0, 26.0, 33.0, 38.0, 53.0, 46.0, 32.0, 55.0, 73.0, 52.0, 71.0, 59.0, 59.0, 60.0, 44.0, 42.0, 24.0, 27.0, 28.0, 19.0, 12.0, 9.0, 11.0, 3.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003180503845214844, -0.0003085136413574219, -0.0002989768981933594, -0.0002894401550292969, -0.0002799034118652344, -0.0002703666687011719, -0.0002608299255371094, -0.0002512931823730469, -0.00024175643920898438, -0.00023221969604492188, -0.00022268295288085938, -0.00021314620971679688, -0.00020360946655273438, -0.00019407272338867188, -0.00018453598022460938, -0.00017499923706054688, -0.00016546249389648438, -0.00015592575073242188, -0.00014638900756835938, -0.00013685226440429688, -0.00012731552124023438, -0.00011777877807617188, -0.00010824203491210938, -9.870529174804688e-05, -8.916854858398438e-05, -7.963180541992188e-05, -7.009506225585938e-05, -6.0558319091796875e-05, -5.1021575927734375e-05, -4.1484832763671875e-05, -3.1948089599609375e-05, -2.2411346435546875e-05, -1.2874603271484375e-05, -3.337860107421875e-06, 6.198883056640625e-06, 1.5735626220703125e-05, 2.5272369384765625e-05, 3.4809112548828125e-05, 4.4345855712890625e-05, 5.3882598876953125e-05, 6.341934204101562e-05, 7.295608520507812e-05, 8.249282836914062e-05, 9.202957153320312e-05, 0.00010156631469726562, 0.00011110305786132812, 0.00012063980102539062, 0.00013017654418945312, 0.00013971328735351562, 0.00014925003051757812, 0.00015878677368164062, 0.00016832351684570312, 0.00017786026000976562, 0.00018739700317382812, 0.00019693374633789062, 0.00020647048950195312, 0.00021600723266601562, 0.00022554397583007812, 0.00023508071899414062, 0.0002446174621582031, 0.0002541542053222656, 0.0002636909484863281, 0.0002732276916503906, 0.0002827644348144531, 0.0002923011779785156]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 9.0, 13.0, 20.0, 29.0, 43.0, 50.0, 76.0, 117.0, 158.0, 252.0, 329.0, 542.0, 732.0, 1074.0, 1620.0, 2381.0, 3554.0, 5402.0, 8293.0, 12755.0, 20154.0, 31505.0, 48395.0, 72817.0, 102931.0, 130820.0, 143108.0, 133325.0, 106192.0, 76229.0, 50986.0, 33601.0, 21440.0, 13552.0, 8722.0, 5735.0, 3718.0, 2596.0, 1653.0, 1149.0, 764.0, 535.0, 368.0, 250.0, 177.0, 119.0, 85.0, 58.0, 33.0, 35.0, 24.0, 8.0, 11.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.0606689453125, -1.988525390625, -1.9163818359375, -1.84423828125, -1.7720947265625, -1.699951171875, -1.6278076171875, -1.5556640625, -1.4835205078125, -1.411376953125, -1.3392333984375, -1.26708984375, -1.1949462890625, -1.122802734375, -1.0506591796875, -0.978515625, -0.9063720703125, -0.834228515625, -0.7620849609375, -0.68994140625, -0.6177978515625, -0.545654296875, -0.4735107421875, -0.4013671875, -0.3292236328125, -0.257080078125, -0.1849365234375, -0.11279296875, -0.0406494140625, 0.031494140625, 0.1036376953125, 0.17578125, 0.2479248046875, 0.320068359375, 0.3922119140625, 0.46435546875, 0.5364990234375, 0.608642578125, 0.6807861328125, 0.7529296875, 0.8250732421875, 0.897216796875, 0.9693603515625, 1.04150390625, 1.1136474609375, 1.185791015625, 1.2579345703125, 1.330078125, 1.4022216796875, 1.474365234375, 1.5465087890625, 1.61865234375, 1.6907958984375, 1.762939453125, 1.8350830078125, 1.9072265625, 1.9793701171875, 2.051513671875, 2.1236572265625, 2.19580078125, 2.2679443359375, 2.340087890625, 2.4122314453125, 2.484375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 7.0, 5.0, 9.0, 7.0, 8.0, 6.0, 20.0, 25.0, 31.0, 15.0, 28.0, 25.0, 35.0, 47.0, 43.0, 40.0, 46.0, 52.0, 55.0, 52.0, 47.0, 58.0, 51.0, 37.0, 36.0, 31.0, 32.0, 26.0, 19.0, 15.0, 16.0, 16.0, 10.0, 7.0, 5.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.71044921875, -0.686431884765625, -0.66241455078125, -0.638397216796875, -0.6143798828125, -0.590362548828125, -0.56634521484375, -0.542327880859375, -0.518310546875, -0.494293212890625, -0.47027587890625, -0.446258544921875, -0.4222412109375, -0.398223876953125, -0.37420654296875, -0.350189208984375, -0.326171875, -0.302154541015625, -0.27813720703125, -0.254119873046875, -0.2301025390625, -0.206085205078125, -0.18206787109375, -0.158050537109375, -0.134033203125, -0.110015869140625, -0.08599853515625, -0.061981201171875, -0.0379638671875, -0.013946533203125, 0.01007080078125, 0.034088134765625, 0.05810546875, 0.082122802734375, 0.10614013671875, 0.130157470703125, 0.1541748046875, 0.178192138671875, 0.20220947265625, 0.226226806640625, 0.250244140625, 0.274261474609375, 0.29827880859375, 0.322296142578125, 0.3463134765625, 0.370330810546875, 0.39434814453125, 0.418365478515625, 0.4423828125, 0.466400146484375, 0.49041748046875, 0.514434814453125, 0.5384521484375, 0.562469482421875, 0.58648681640625, 0.610504150390625, 0.634521484375, 0.658538818359375, 0.68255615234375, 0.706573486328125, 0.7305908203125, 0.754608154296875, 0.77862548828125, 0.802642822265625, 0.82666015625]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 6.0, 7.0, 4.0, 2.0, 10.0, 10.0, 15.0, 20.0, 19.0, 21.0, 19.0, 27.0, 44.0, 30.0, 38.0, 36.0, 50.0, 59.0, 59.0, 51.0, 50.0, 51.0, 53.0, 51.0, 29.0, 39.0, 38.0, 29.0, 28.0, 20.0, 22.0, 14.0, 11.0, 6.0, 10.0, 10.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.928782939910889, -4.745309829711914, -4.5618367195129395, -4.378363609313965, -4.19489049911499, -4.011417388916016, -3.827944040298462, -3.6444709300994873, -3.4609978199005127, -3.277524709701538, -3.0940515995025635, -2.9105782508850098, -2.727105140686035, -2.5436320304870605, -2.360158920288086, -2.1766858100891113, -1.9932126998901367, -1.809739589691162, -1.6262664794921875, -1.4427932500839233, -1.2593201398849487, -1.0758470296859741, -0.89237380027771, -0.7089006900787354, -0.5254275798797607, -0.34195443987846375, -0.15848129987716675, 0.024991869926452637, 0.20846498012542725, 0.39193809032440186, 0.575411319732666, 0.7588844299316406, 0.9423580169677734, 1.125831127166748, 1.3093042373657227, 1.4927774667739868, 1.6762505769729614, 1.859723687171936, 2.0431969165802, 2.226670026779175, 2.4101431369781494, 2.593616247177124, 2.7770893573760986, 2.9605627059936523, 3.144035816192627, 3.3275089263916016, 3.510982036590576, 3.694455146789551, 3.8779282569885254, 4.0614013671875, 4.244874477386475, 4.428347587585449, 4.611820697784424, 4.795293807983398, 4.978767395019531, 5.162240028381348, 5.3457136154174805, 5.529186725616455, 5.71265983581543, 5.896132946014404, 6.079606056213379, 6.2630791664123535, 6.446552276611328, 6.630025863647461, 6.813498497009277]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 14.0, 16.0, 13.0, 15.0, 15.0, 19.0, 22.0, 22.0, 20.0, 34.0, 28.0, 40.0, 36.0, 26.0, 35.0, 54.0, 39.0, 50.0, 44.0, 42.0, 44.0, 35.0, 29.0, 24.0, 31.0, 32.0, 22.0, 17.0, 18.0, 24.0, 16.0, 12.0, 16.0, 12.0, 16.0, 6.0, 5.0, 3.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-3.8244690895080566, -3.712723970413208, -3.6009790897369385, -3.48923397064209, -3.3774890899658203, -3.2657439708709717, -3.153998851776123, -3.0422539710998535, -2.930508852005005, -2.8187637329101562, -2.7070188522338867, -2.595273733139038, -2.4835286140441895, -2.37178373336792, -2.2600386142730713, -2.1482934951782227, -2.036548614501953, -1.924803614616394, -1.813058614730835, -1.7013134956359863, -1.5895684957504272, -1.4778234958648682, -1.3660783767700195, -1.2543333768844604, -1.1425883769989014, -1.0308433771133423, -0.9190983176231384, -0.8073532581329346, -0.6956082582473755, -0.5838632583618164, -0.47211819887161255, -0.3603731393814087, -0.2486283779144287, -0.13688334822654724, -0.02513831853866577, 0.0866067111492157, 0.19835174083709717, 0.31009674072265625, 0.4218418002128601, 0.533586859703064, 0.645331859588623, 0.7570768594741821, 0.868821918964386, 0.9805669784545898, 1.092311978340149, 1.204056978225708, 1.3158020973205566, 1.4275470972061157, 1.5392920970916748, 1.6510370969772339, 1.762782096862793, 1.8745272159576416, 1.9862722158432007, 2.0980172157287598, 2.2097623348236084, 2.321507453918457, 2.4332523345947266, 2.544997453689575, 2.6567423343658447, 2.7684874534606934, 2.880232334136963, 2.9919774532318115, 3.10372257232666, 3.2154674530029297, 3.3272125720977783]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 22.0, 22.0, 39.0, 53.0, 64.0, 109.0, 174.0, 267.0, 385.0, 587.0, 891.0, 1554.0, 2707.0, 4293.0, 7585.0, 13128.0, 24379.0, 45902.0, 90837.0, 189045.0, 405765.0, 788998.0, 1039414.0, 785845.0, 406213.0, 191629.0, 92727.0, 46413.0, 24488.0, 13014.0, 7417.0, 4140.0, 2458.0, 1417.0, 881.0, 542.0, 325.0, 200.0, 122.0, 85.0, 46.0, 27.0, 19.0, 14.0, 8.0, 5.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.90234375, -6.6962890625, -6.490234375, -6.2841796875, -6.078125, -5.8720703125, -5.666015625, -5.4599609375, -5.25390625, -5.0478515625, -4.841796875, -4.6357421875, -4.4296875, -4.2236328125, -4.017578125, -3.8115234375, -3.60546875, -3.3994140625, -3.193359375, -2.9873046875, -2.78125, -2.5751953125, -2.369140625, -2.1630859375, -1.95703125, -1.7509765625, -1.544921875, -1.3388671875, -1.1328125, -0.9267578125, -0.720703125, -0.5146484375, -0.30859375, -0.1025390625, 0.103515625, 0.3095703125, 0.515625, 0.7216796875, 0.927734375, 1.1337890625, 1.33984375, 1.5458984375, 1.751953125, 1.9580078125, 2.1640625, 2.3701171875, 2.576171875, 2.7822265625, 2.98828125, 3.1943359375, 3.400390625, 3.6064453125, 3.8125, 4.0185546875, 4.224609375, 4.4306640625, 4.63671875, 4.8427734375, 5.048828125, 5.2548828125, 5.4609375, 5.6669921875, 5.873046875, 6.0791015625, 6.28515625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 9.0, 18.0, 21.0, 21.0, 21.0, 14.0, 33.0, 41.0, 39.0, 29.0, 44.0, 51.0, 48.0, 45.0, 50.0, 60.0, 52.0, 48.0, 29.0, 46.0, 39.0, 31.0, 30.0, 20.0, 23.0, 15.0, 17.0, 20.0, 11.0, 9.0, 3.0, 8.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.701171875, -3.58648681640625, -3.4718017578125, -3.35711669921875, -3.242431640625, -3.12774658203125, -3.0130615234375, -2.89837646484375, -2.78369140625, -2.66900634765625, -2.5543212890625, -2.43963623046875, -2.324951171875, -2.21026611328125, -2.0955810546875, -1.98089599609375, -1.8662109375, -1.75152587890625, -1.6368408203125, -1.52215576171875, -1.407470703125, -1.29278564453125, -1.1781005859375, -1.06341552734375, -0.94873046875, -0.83404541015625, -0.7193603515625, -0.60467529296875, -0.489990234375, -0.37530517578125, -0.2606201171875, -0.14593505859375, -0.03125, 0.08343505859375, 0.1981201171875, 0.31280517578125, 0.427490234375, 0.54217529296875, 0.6568603515625, 0.77154541015625, 0.88623046875, 1.00091552734375, 1.1156005859375, 1.23028564453125, 1.344970703125, 1.45965576171875, 1.5743408203125, 1.68902587890625, 1.8037109375, 1.91839599609375, 2.0330810546875, 2.14776611328125, 2.262451171875, 2.37713623046875, 2.4918212890625, 2.60650634765625, 2.72119140625, 2.83587646484375, 2.9505615234375, 3.06524658203125, 3.179931640625, 3.29461669921875, 3.4093017578125, 3.52398681640625, 3.638671875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 25.0, 35.0, 48.0, 71.0, 115.0, 195.0, 239.0, 417.0, 589.0, 984.0, 1403.0, 2121.0, 3284.0, 5206.0, 8142.0, 13094.0, 21577.0, 35271.0, 59213.0, 99988.0, 168750.0, 285494.0, 459535.0, 654453.0, 734496.0, 608889.0, 410282.0, 251651.0, 147935.0, 86820.0, 52016.0, 30878.0, 18989.0, 11692.0, 7347.0, 4578.0, 2913.0, 1904.0, 1240.0, 843.0, 519.0, 366.0, 215.0, 147.0, 97.0, 71.0, 46.0, 20.0, 19.0, 20.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.765625, -5.58184814453125, -5.3980712890625, -5.21429443359375, -5.030517578125, -4.84674072265625, -4.6629638671875, -4.47918701171875, -4.29541015625, -4.11163330078125, -3.9278564453125, -3.74407958984375, -3.560302734375, -3.37652587890625, -3.1927490234375, -3.00897216796875, -2.8251953125, -2.64141845703125, -2.4576416015625, -2.27386474609375, -2.090087890625, -1.90631103515625, -1.7225341796875, -1.53875732421875, -1.35498046875, -1.17120361328125, -0.9874267578125, -0.80364990234375, -0.619873046875, -0.43609619140625, -0.2523193359375, -0.06854248046875, 0.115234375, 0.29901123046875, 0.4827880859375, 0.66656494140625, 0.850341796875, 1.03411865234375, 1.2178955078125, 1.40167236328125, 1.58544921875, 1.76922607421875, 1.9530029296875, 2.13677978515625, 2.320556640625, 2.50433349609375, 2.6881103515625, 2.87188720703125, 3.0556640625, 3.23944091796875, 3.4232177734375, 3.60699462890625, 3.790771484375, 3.97454833984375, 4.1583251953125, 4.34210205078125, 4.52587890625, 4.70965576171875, 4.8934326171875, 5.07720947265625, 5.260986328125, 5.44476318359375, 5.6285400390625, 5.81231689453125, 5.99609375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 6.0, 9.0, 13.0, 12.0, 22.0, 30.0, 45.0, 40.0, 50.0, 70.0, 94.0, 135.0, 137.0, 162.0, 171.0, 233.0, 233.0, 258.0, 284.0, 266.0, 240.0, 232.0, 237.0, 215.0, 197.0, 143.0, 119.0, 89.0, 81.0, 56.0, 44.0, 30.0, 25.0, 19.0, 14.0, 15.0, 8.0, 5.0, 6.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.02386474609375, -1.9559326171875, -1.88800048828125, -1.820068359375, -1.75213623046875, -1.6842041015625, -1.61627197265625, -1.54833984375, -1.48040771484375, -1.4124755859375, -1.34454345703125, -1.276611328125, -1.20867919921875, -1.1407470703125, -1.07281494140625, -1.0048828125, -0.93695068359375, -0.8690185546875, -0.80108642578125, -0.733154296875, -0.66522216796875, -0.5972900390625, -0.52935791015625, -0.46142578125, -0.39349365234375, -0.3255615234375, -0.25762939453125, -0.189697265625, -0.12176513671875, -0.0538330078125, 0.01409912109375, 0.08203125, 0.14996337890625, 0.2178955078125, 0.28582763671875, 0.353759765625, 0.42169189453125, 0.4896240234375, 0.55755615234375, 0.62548828125, 0.69342041015625, 0.7613525390625, 0.82928466796875, 0.897216796875, 0.96514892578125, 1.0330810546875, 1.10101318359375, 1.1689453125, 1.23687744140625, 1.3048095703125, 1.37274169921875, 1.440673828125, 1.50860595703125, 1.5765380859375, 1.64447021484375, 1.71240234375, 1.78033447265625, 1.8482666015625, 1.91619873046875, 1.984130859375, 2.05206298828125, 2.1199951171875, 2.18792724609375, 2.255859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 9.0, 11.0, 10.0, 19.0, 16.0, 34.0, 29.0, 49.0, 42.0, 54.0, 57.0, 73.0, 62.0, 62.0, 52.0, 67.0, 65.0, 53.0, 38.0, 35.0, 36.0, 26.0, 33.0, 14.0, 10.0, 14.0, 6.0, 6.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.956415176391602, -7.686728477478027, -7.417041778564453, -7.147355079650879, -6.877668380737305, -6.6079816818237305, -6.338294982910156, -6.068608283996582, -5.798921585083008, -5.529234886169434, -5.259548187255859, -4.989861488342285, -4.720174789428711, -4.450488090515137, -4.1808013916015625, -3.9111149311065674, -3.6414284706115723, -3.371741771697998, -3.102055072784424, -2.8323683738708496, -2.5626816749572754, -2.292994976043701, -2.023308515548706, -1.7536218166351318, -1.4839351177215576, -1.2142484188079834, -0.944561779499054, -0.6748751401901245, -0.4051884412765503, -0.13550174236297607, 0.1341848373413086, 0.4038715362548828, 0.673558235168457, 0.9432449340820312, 1.2129316329956055, 1.4826182126998901, 1.7523049116134644, 2.021991729736328, 2.2916781902313232, 2.5613648891448975, 2.8310515880584717, 3.100738286972046, 3.37042498588562, 3.6401114463806152, 3.9097981452941895, 4.179484844207764, 4.449171543121338, 4.718858242034912, 4.988544940948486, 5.2582316398620605, 5.527918338775635, 5.797605037689209, 6.067291736602783, 6.336978435516357, 6.606664657592773, 6.876351356506348, 7.146038055419922, 7.415724754333496, 7.68541145324707, 7.9550981521606445, 8.224784851074219, 8.494471549987793, 8.764158248901367, 9.033844947814941, 9.303531646728516]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 7.0, 9.0, 7.0, 12.0, 11.0, 17.0, 12.0, 22.0, 22.0, 34.0, 20.0, 25.0, 39.0, 41.0, 30.0, 32.0, 33.0, 47.0, 47.0, 38.0, 46.0, 41.0, 50.0, 36.0, 40.0, 38.0, 36.0, 29.0, 20.0, 25.0, 17.0, 21.0, 18.0, 18.0, 14.0, 7.0, 8.0, 7.0, 5.0, 2.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.775452136993408, -4.6400041580200195, -4.504555702209473, -4.369107723236084, -4.233659744262695, -4.098211288452148, -3.9627633094787598, -3.827315092086792, -3.691866874694824, -3.5564186573028564, -3.4209704399108887, -3.2855224609375, -3.1500742435455322, -3.0146260261535645, -2.879178047180176, -2.743729829788208, -2.6082816123962402, -2.4728333950042725, -2.3373851776123047, -2.201937198638916, -2.0664889812469482, -1.9310407638549805, -1.7955926656723022, -1.660144567489624, -1.5246963500976562, -1.3892481327056885, -1.2538000345230103, -1.118351936340332, -0.9829037189483643, -0.8474555611610413, -0.7120074033737183, -0.5765592455863953, -0.44111084938049316, -0.30566269159317017, -0.17021453380584717, -0.03476637601852417, 0.10068178176879883, 0.23612993955612183, 0.3715780973434448, 0.5070262551307678, 0.6424744129180908, 0.7779225707054138, 0.9133707284927368, 1.048818826675415, 1.1842670440673828, 1.3197152614593506, 1.4551633596420288, 1.590611457824707, 1.7260596752166748, 1.8615078926086426, 1.9969559907913208, 2.132404088973999, 2.267852306365967, 2.4033005237579346, 2.5387487411499023, 2.674196720123291, 2.809644937515259, 2.9450931549072266, 3.0805411338806152, 3.215989351272583, 3.351437568664551, 3.4868857860565186, 3.6223340034484863, 3.757781982421875, 3.8932301998138428]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 10.0, 10.0, 27.0, 44.0, 59.0, 81.0, 155.0, 196.0, 344.0, 539.0, 967.0, 1597.0, 2658.0, 4677.0, 8303.0, 14445.0, 25468.0, 45088.0, 76950.0, 126681.0, 178772.0, 189858.0, 147354.0, 94600.0, 55407.0, 31703.0, 17956.0, 10395.0, 5807.0, 3459.0, 1920.0, 1151.0, 690.0, 462.0, 254.0, 165.0, 112.0, 73.0, 48.0, 24.0, 19.0, 14.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5245132446289062, -0.5065460205078125, -0.48857879638671875, -0.470611572265625, -0.45264434814453125, -0.4346771240234375, -0.41670989990234375, -0.39874267578125, -0.38077545166015625, -0.3628082275390625, -0.34484100341796875, -0.326873779296875, -0.30890655517578125, -0.2909393310546875, -0.27297210693359375, -0.2550048828125, -0.23703765869140625, -0.2190704345703125, -0.20110321044921875, -0.183135986328125, -0.16516876220703125, -0.1472015380859375, -0.12923431396484375, -0.11126708984375, -0.09329986572265625, -0.0753326416015625, -0.05736541748046875, -0.039398193359375, -0.02143096923828125, -0.0034637451171875, 0.01450347900390625, 0.032470703125, 0.05043792724609375, 0.0684051513671875, 0.08637237548828125, 0.104339599609375, 0.12230682373046875, 0.1402740478515625, 0.15824127197265625, 0.17620849609375, 0.19417572021484375, 0.2121429443359375, 0.23011016845703125, 0.248077392578125, 0.26604461669921875, 0.2840118408203125, 0.30197906494140625, 0.3199462890625, 0.33791351318359375, 0.3558807373046875, 0.37384796142578125, 0.391815185546875, 0.40978240966796875, 0.4277496337890625, 0.44571685791015625, 0.46368408203125, 0.48165130615234375, 0.4996185302734375, 0.5175857543945312, 0.535552978515625, 0.5535202026367188, 0.5714874267578125, 0.5894546508789062, 0.607421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 6.0, 7.0, 6.0, 16.0, 11.0, 18.0, 15.0, 28.0, 30.0, 20.0, 33.0, 33.0, 34.0, 37.0, 30.0, 42.0, 42.0, 35.0, 33.0, 45.0, 31.0, 53.0, 44.0, 44.0, 34.0, 35.0, 30.0, 36.0, 23.0, 27.0, 21.0, 14.0, 15.0, 16.0, 12.0, 9.0, 5.0, 8.0, 4.0, 3.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.6171875, -5.46527099609375, -5.3133544921875, -5.16143798828125, -5.009521484375, -4.85760498046875, -4.7056884765625, -4.55377197265625, -4.40185546875, -4.24993896484375, -4.0980224609375, -3.94610595703125, -3.794189453125, -3.64227294921875, -3.4903564453125, -3.33843994140625, -3.1865234375, -3.03460693359375, -2.8826904296875, -2.73077392578125, -2.578857421875, -2.42694091796875, -2.2750244140625, -2.12310791015625, -1.97119140625, -1.81927490234375, -1.6673583984375, -1.51544189453125, -1.363525390625, -1.21160888671875, -1.0596923828125, -0.90777587890625, -0.755859375, -0.60394287109375, -0.4520263671875, -0.30010986328125, -0.148193359375, 0.00372314453125, 0.1556396484375, 0.30755615234375, 0.45947265625, 0.61138916015625, 0.7633056640625, 0.91522216796875, 1.067138671875, 1.21905517578125, 1.3709716796875, 1.52288818359375, 1.6748046875, 1.82672119140625, 1.9786376953125, 2.13055419921875, 2.282470703125, 2.43438720703125, 2.5863037109375, 2.73822021484375, 2.89013671875, 3.04205322265625, 3.1939697265625, 3.34588623046875, 3.497802734375, 3.64971923828125, 3.8016357421875, 3.95355224609375, 4.10546875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 13.0, 11.0, 23.0, 20.0, 19.0, 29.0, 39.0, 45.0, 65.0, 111.0, 106.0, 167.0, 234.0, 363.0, 487.0, 742.0, 1143.0, 1845.0, 3083.0, 5634.0, 10447.0, 20734.0, 67814.0, 811320.0, 76479.0, 22257.0, 10723.0, 5734.0, 3237.0, 1920.0, 1193.0, 742.0, 515.0, 344.0, 230.0, 170.0, 138.0, 99.0, 67.0, 54.0, 43.0, 24.0, 20.0, 14.0, 14.0, 8.0, 5.0, 6.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.50390625, -1.457672119140625, -1.41143798828125, -1.365203857421875, -1.3189697265625, -1.272735595703125, -1.22650146484375, -1.180267333984375, -1.134033203125, -1.087799072265625, -1.04156494140625, -0.995330810546875, -0.9490966796875, -0.902862548828125, -0.85662841796875, -0.810394287109375, -0.76416015625, -0.717926025390625, -0.67169189453125, -0.625457763671875, -0.5792236328125, -0.532989501953125, -0.48675537109375, -0.440521240234375, -0.394287109375, -0.348052978515625, -0.30181884765625, -0.255584716796875, -0.2093505859375, -0.163116455078125, -0.11688232421875, -0.070648193359375, -0.0244140625, 0.021820068359375, 0.06805419921875, 0.114288330078125, 0.1605224609375, 0.206756591796875, 0.25299072265625, 0.299224853515625, 0.345458984375, 0.391693115234375, 0.43792724609375, 0.484161376953125, 0.5303955078125, 0.576629638671875, 0.62286376953125, 0.669097900390625, 0.71533203125, 0.761566162109375, 0.80780029296875, 0.854034423828125, 0.9002685546875, 0.946502685546875, 0.99273681640625, 1.038970947265625, 1.085205078125, 1.131439208984375, 1.17767333984375, 1.223907470703125, 1.2701416015625, 1.316375732421875, 1.36260986328125, 1.408843994140625, 1.455078125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 12.0, 8.0, 6.0, 8.0, 6.0, 23.0, 17.0, 16.0, 11.0, 24.0, 29.0, 21.0, 25.0, 28.0, 41.0, 44.0, 34.0, 40.0, 43.0, 38.0, 42.0, 38.0, 38.0, 41.0, 37.0, 28.0, 29.0, 30.0, 29.0, 29.0, 28.0, 24.0, 14.0, 10.0, 20.0, 18.0, 9.0, 8.0, 7.0, 7.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.80108642578125, -2.7115478515625, -2.62200927734375, -2.532470703125, -2.44293212890625, -2.3533935546875, -2.26385498046875, -2.17431640625, -2.08477783203125, -1.9952392578125, -1.90570068359375, -1.816162109375, -1.72662353515625, -1.6370849609375, -1.54754638671875, -1.4580078125, -1.36846923828125, -1.2789306640625, -1.18939208984375, -1.099853515625, -1.01031494140625, -0.9207763671875, -0.83123779296875, -0.74169921875, -0.65216064453125, -0.5626220703125, -0.47308349609375, -0.383544921875, -0.29400634765625, -0.2044677734375, -0.11492919921875, -0.025390625, 0.06414794921875, 0.1536865234375, 0.24322509765625, 0.332763671875, 0.42230224609375, 0.5118408203125, 0.60137939453125, 0.69091796875, 0.78045654296875, 0.8699951171875, 0.95953369140625, 1.049072265625, 1.13861083984375, 1.2281494140625, 1.31768798828125, 1.4072265625, 1.49676513671875, 1.5863037109375, 1.67584228515625, 1.765380859375, 1.85491943359375, 1.9444580078125, 2.03399658203125, 2.12353515625, 2.21307373046875, 2.3026123046875, 2.39215087890625, 2.481689453125, 2.57122802734375, 2.6607666015625, 2.75030517578125, 2.83984375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 8.0, 25.0, 30.0, 18.0, 39.0, 48.0, 57.0, 90.0, 120.0, 167.0, 249.0, 345.0, 505.0, 760.0, 1144.0, 1856.0, 2891.0, 4755.0, 8043.0, 14312.0, 28500.0, 591290.0, 333721.0, 26339.0, 13422.0, 7583.0, 4457.0, 2674.0, 1701.0, 1080.0, 686.0, 443.0, 342.0, 228.0, 168.0, 125.0, 90.0, 49.0, 42.0, 31.0, 19.0, 22.0, 15.0, 12.0, 7.0, 12.0, 4.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 4.0], "bins": [-0.3427734375, -0.3320465087890625, -0.321319580078125, -0.3105926513671875, -0.29986572265625, -0.2891387939453125, -0.278411865234375, -0.2676849365234375, -0.2569580078125, -0.2462310791015625, -0.235504150390625, -0.2247772216796875, -0.21405029296875, -0.2033233642578125, -0.192596435546875, -0.1818695068359375, -0.171142578125, -0.1604156494140625, -0.149688720703125, -0.1389617919921875, -0.12823486328125, -0.1175079345703125, -0.106781005859375, -0.0960540771484375, -0.0853271484375, -0.0746002197265625, -0.063873291015625, -0.0531463623046875, -0.04241943359375, -0.0316925048828125, -0.020965576171875, -0.0102386474609375, 0.00048828125, 0.0112152099609375, 0.021942138671875, 0.0326690673828125, 0.04339599609375, 0.0541229248046875, 0.064849853515625, 0.0755767822265625, 0.0863037109375, 0.0970306396484375, 0.107757568359375, 0.1184844970703125, 0.12921142578125, 0.1399383544921875, 0.150665283203125, 0.1613922119140625, 0.172119140625, 0.1828460693359375, 0.193572998046875, 0.2042999267578125, 0.21502685546875, 0.2257537841796875, 0.236480712890625, 0.2472076416015625, 0.2579345703125, 0.2686614990234375, 0.279388427734375, 0.2901153564453125, 0.30084228515625, 0.3115692138671875, 0.322296142578125, 0.3330230712890625, 0.34375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 10.0, 6.0, 7.0, 8.0, 11.0, 14.0, 20.0, 13.0, 23.0, 31.0, 26.0, 39.0, 34.0, 35.0, 47.0, 46.0, 50.0, 53.0, 43.0, 49.0, 42.0, 32.0, 45.0, 42.0, 36.0, 31.0, 38.0, 24.0, 29.0, 16.0, 21.0, 14.0, 14.0, 14.0, 8.0, 10.0, 4.0, 3.0, 8.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.8908252716064453e-05, -2.8051435947418213e-05, -2.7194619178771973e-05, -2.6337802410125732e-05, -2.5480985641479492e-05, -2.4624168872833252e-05, -2.3767352104187012e-05, -2.291053533554077e-05, -2.205371856689453e-05, -2.119690179824829e-05, -2.034008502960205e-05, -1.948326826095581e-05, -1.862645149230957e-05, -1.776963472366333e-05, -1.691281795501709e-05, -1.605600118637085e-05, -1.519918441772461e-05, -1.4342367649078369e-05, -1.3485550880432129e-05, -1.2628734111785889e-05, -1.1771917343139648e-05, -1.0915100574493408e-05, -1.0058283805847168e-05, -9.201467037200928e-06, -8.344650268554688e-06, -7.487833499908447e-06, -6.631016731262207e-06, -5.774199962615967e-06, -4.9173831939697266e-06, -4.060566425323486e-06, -3.203749656677246e-06, -2.346932888031006e-06, -1.4901161193847656e-06, -6.332993507385254e-07, 2.2351741790771484e-07, 1.080334186553955e-06, 1.9371509552001953e-06, 2.7939677238464355e-06, 3.6507844924926758e-06, 4.507601261138916e-06, 5.364418029785156e-06, 6.2212347984313965e-06, 7.078051567077637e-06, 7.934868335723877e-06, 8.791685104370117e-06, 9.648501873016357e-06, 1.0505318641662598e-05, 1.1362135410308838e-05, 1.2218952178955078e-05, 1.3075768947601318e-05, 1.3932585716247559e-05, 1.4789402484893799e-05, 1.564621925354004e-05, 1.650303602218628e-05, 1.735985279083252e-05, 1.821666955947876e-05, 1.9073486328125e-05, 1.993030309677124e-05, 2.078711986541748e-05, 2.164393663406372e-05, 2.250075340270996e-05, 2.33575701713562e-05, 2.421438694000244e-05, 2.507120370864868e-05, 2.5928020477294922e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 8.0, 17.0, 32.0, 35.0, 55.0, 71.0, 167.0, 222.0, 386.0, 528.0, 980.0, 1726.0, 2985.0, 5483.0, 10822.0, 22318.0, 49275.0, 113264.0, 239353.0, 294454.0, 167022.0, 73997.0, 32770.0, 15397.0, 7687.0, 3982.0, 2250.0, 1301.0, 732.0, 446.0, 279.0, 170.0, 119.0, 62.0, 45.0, 29.0, 27.0, 14.0, 10.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2765922546386719, -0.26827239990234375, -0.2599525451660156, -0.2516326904296875, -0.24331283569335938, -0.23499298095703125, -0.22667312622070312, -0.218353271484375, -0.21003341674804688, -0.20171356201171875, -0.19339370727539062, -0.1850738525390625, -0.17675399780273438, -0.16843414306640625, -0.16011428833007812, -0.15179443359375, -0.14347457885742188, -0.13515472412109375, -0.12683486938476562, -0.1185150146484375, -0.11019515991210938, -0.10187530517578125, -0.09355545043945312, -0.085235595703125, -0.07691574096679688, -0.06859588623046875, -0.060276031494140625, -0.0519561767578125, -0.043636322021484375, -0.03531646728515625, -0.026996612548828125, -0.0186767578125, -0.010356903076171875, -0.00203704833984375, 0.006282806396484375, 0.0146026611328125, 0.022922515869140625, 0.03124237060546875, 0.039562225341796875, 0.047882080078125, 0.056201934814453125, 0.06452178955078125, 0.07284164428710938, 0.0811614990234375, 0.08948135375976562, 0.09780120849609375, 0.10612106323242188, 0.11444091796875, 0.12276077270507812, 0.13108062744140625, 0.13940048217773438, 0.1477203369140625, 0.15604019165039062, 0.16436004638671875, 0.17267990112304688, 0.180999755859375, 0.18931961059570312, 0.19763946533203125, 0.20595932006835938, 0.2142791748046875, 0.22259902954101562, 0.23091888427734375, 0.23923873901367188, 0.24755859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 9.0, 15.0, 9.0, 10.0, 9.0, 18.0, 15.0, 21.0, 24.0, 34.0, 47.0, 34.0, 70.0, 54.0, 48.0, 64.0, 56.0, 56.0, 51.0, 47.0, 41.0, 35.0, 36.0, 33.0, 25.0, 29.0, 17.0, 10.0, 19.0, 12.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.03598356246948242, -0.034613609313964844, -0.033243656158447266, -0.03187370300292969, -0.03050374984741211, -0.02913379669189453, -0.027763843536376953, -0.026393890380859375, -0.025023937225341797, -0.02365398406982422, -0.02228403091430664, -0.020914077758789062, -0.019544124603271484, -0.018174171447753906, -0.016804218292236328, -0.01543426513671875, -0.014064311981201172, -0.012694358825683594, -0.011324405670166016, -0.009954452514648438, -0.00858449935913086, -0.007214546203613281, -0.005844593048095703, -0.004474639892578125, -0.003104686737060547, -0.0017347335815429688, -0.0003647804260253906, 0.0010051727294921875, 0.0023751258850097656, 0.0037450790405273438, 0.005115032196044922, 0.0064849853515625, 0.007854938507080078, 0.009224891662597656, 0.010594844818115234, 0.011964797973632812, 0.01333475112915039, 0.014704704284667969, 0.016074657440185547, 0.017444610595703125, 0.018814563751220703, 0.02018451690673828, 0.02155447006225586, 0.022924423217773438, 0.024294376373291016, 0.025664329528808594, 0.027034282684326172, 0.02840423583984375, 0.029774188995361328, 0.031144142150878906, 0.032514095306396484, 0.03388404846191406, 0.03525400161743164, 0.03662395477294922, 0.0379939079284668, 0.039363861083984375, 0.04073381423950195, 0.04210376739501953, 0.04347372055053711, 0.04484367370605469, 0.046213626861572266, 0.047583580017089844, 0.04895353317260742, 0.050323486328125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 9.0, 15.0, 13.0, 23.0, 31.0, 33.0, 48.0, 45.0, 55.0, 65.0, 66.0, 63.0, 58.0, 62.0, 67.0, 57.0, 57.0, 34.0, 36.0, 36.0, 25.0, 31.0, 10.0, 13.0, 10.0, 8.0, 3.0, 1.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.933457374572754, -7.662163257598877, -7.390869140625, -7.119575023651123, -6.848280906677246, -6.576986789703369, -6.305692672729492, -6.034398555755615, -5.763104438781738, -5.491810321807861, -5.220516204833984, -4.949222087860107, -4.6779279708862305, -4.4066338539123535, -4.135339736938477, -3.8640456199645996, -3.5927515029907227, -3.3214573860168457, -3.0501632690429688, -2.778869152069092, -2.507575035095215, -2.236280918121338, -1.964986801147461, -1.693692684173584, -1.422398567199707, -1.15110445022583, -0.8798103332519531, -0.6085162162780762, -0.3372220993041992, -0.06592798233032227, 0.2053661346435547, 0.47666025161743164, 0.7479534149169922, 1.0192475318908691, 1.290541648864746, 1.561835765838623, 1.8331298828125, 2.104423999786377, 2.375718116760254, 2.647012233734131, 2.918306350708008, 3.1896004676818848, 3.4608945846557617, 3.7321887016296387, 4.003482818603516, 4.274776935577393, 4.5460710525512695, 4.8173651695251465, 5.088659286499023, 5.3599534034729, 5.631247520446777, 5.902541637420654, 6.173835754394531, 6.445129871368408, 6.716423988342285, 6.987718105316162, 7.259012222290039, 7.530306339263916, 7.801600456237793, 8.072895050048828, 8.344188690185547, 8.615482330322266, 8.8867769241333, 9.158071517944336, 9.429365158081055]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 8.0, 4.0, 5.0, 11.0, 7.0, 9.0, 13.0, 18.0, 11.0, 20.0, 23.0, 32.0, 23.0, 23.0, 40.0, 35.0, 34.0, 35.0, 32.0, 40.0, 51.0, 42.0, 39.0, 43.0, 51.0, 38.0, 36.0, 42.0, 34.0, 30.0, 21.0, 26.0, 17.0, 22.0, 16.0, 17.0, 16.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.752599716186523, -4.61810827255249, -4.483617305755615, -4.349125862121582, -4.214634895324707, -4.080143451690674, -3.9456522464752197, -3.8111610412597656, -3.6766698360443115, -3.5421786308288574, -3.4076874256134033, -3.273196220397949, -3.138704776763916, -3.004213809967041, -2.869722366333008, -2.7352311611175537, -2.6007399559020996, -2.4662487506866455, -2.3317575454711914, -2.1972663402557373, -2.062775135040283, -1.9282838106155396, -1.793792486190796, -1.6593012809753418, -1.5248100757598877, -1.3903188705444336, -1.2558276653289795, -1.1213363409042358, -0.9868451356887817, -0.8523539304733276, -0.7178626656532288, -0.5833714008331299, -0.4488801956176758, -0.3143889605998993, -0.1798977255821228, -0.045406490564346313, 0.08908474445343018, 0.22357594966888428, 0.35806721448898315, 0.49255847930908203, 0.6270496845245361, 0.7615408897399902, 0.8960321545600891, 1.030523419380188, 1.165014624595642, 1.2995058298110962, 1.4339971542358398, 1.568488359451294, 1.702979564666748, 1.8374707698822021, 1.9719619750976562, 2.1064531803131104, 2.2409443855285645, 2.3754358291625977, 2.5099270343780518, 2.644418239593506, 2.77890944480896, 2.913400650024414, 3.047891855239868, 3.1823830604553223, 3.3168745040893555, 3.4513654708862305, 3.5858569145202637, 3.7203481197357178, 3.854839324951172]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 14.0, 26.0, 38.0, 63.0, 84.0, 115.0, 179.0, 286.0, 426.0, 629.0, 969.0, 1481.0, 2389.0, 3808.0, 5710.0, 9054.0, 13802.0, 21247.0, 32086.0, 46996.0, 66732.0, 88452.0, 109439.0, 121545.0, 121791.0, 109076.0, 87754.0, 65971.0, 46994.0, 31963.0, 20821.0, 13694.0, 8710.0, 5664.0, 3668.0, 2378.0, 1554.0, 979.0, 618.0, 430.0, 284.0, 185.0, 134.0, 77.0, 75.0, 44.0, 27.0, 27.0, 14.0, 12.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0], "bins": [-3.681640625, -3.566558837890625, -3.45147705078125, -3.336395263671875, -3.2213134765625, -3.106231689453125, -2.99114990234375, -2.876068115234375, -2.760986328125, -2.645904541015625, -2.53082275390625, -2.415740966796875, -2.3006591796875, -2.185577392578125, -2.07049560546875, -1.955413818359375, -1.84033203125, -1.725250244140625, -1.61016845703125, -1.495086669921875, -1.3800048828125, -1.264923095703125, -1.14984130859375, -1.034759521484375, -0.919677734375, -0.804595947265625, -0.68951416015625, -0.574432373046875, -0.4593505859375, -0.344268798828125, -0.22918701171875, -0.114105224609375, 0.0009765625, 0.116058349609375, 0.23114013671875, 0.346221923828125, 0.4613037109375, 0.576385498046875, 0.69146728515625, 0.806549072265625, 0.921630859375, 1.036712646484375, 1.15179443359375, 1.266876220703125, 1.3819580078125, 1.497039794921875, 1.61212158203125, 1.727203369140625, 1.84228515625, 1.957366943359375, 2.07244873046875, 2.187530517578125, 2.3026123046875, 2.417694091796875, 2.53277587890625, 2.647857666015625, 2.762939453125, 2.878021240234375, 2.99310302734375, 3.108184814453125, 3.2232666015625, 3.338348388671875, 3.45343017578125, 3.568511962890625, 3.68359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 2.0, 5.0, 9.0, 5.0, 8.0, 11.0, 15.0, 8.0, 14.0, 17.0, 22.0, 23.0, 26.0, 31.0, 44.0, 28.0, 30.0, 34.0, 38.0, 35.0, 38.0, 37.0, 47.0, 33.0, 39.0, 42.0, 47.0, 30.0, 41.0, 22.0, 26.0, 24.0, 29.0, 20.0, 26.0, 14.0, 22.0, 8.0, 11.0, 7.0, 5.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.09375, -4.95062255859375, -4.8074951171875, -4.66436767578125, -4.521240234375, -4.37811279296875, -4.2349853515625, -4.09185791015625, -3.94873046875, -3.80560302734375, -3.6624755859375, -3.51934814453125, -3.376220703125, -3.23309326171875, -3.0899658203125, -2.94683837890625, -2.8037109375, -2.66058349609375, -2.5174560546875, -2.37432861328125, -2.231201171875, -2.08807373046875, -1.9449462890625, -1.80181884765625, -1.65869140625, -1.51556396484375, -1.3724365234375, -1.22930908203125, -1.086181640625, -0.94305419921875, -0.7999267578125, -0.65679931640625, -0.513671875, -0.37054443359375, -0.2274169921875, -0.08428955078125, 0.058837890625, 0.20196533203125, 0.3450927734375, 0.48822021484375, 0.63134765625, 0.77447509765625, 0.9176025390625, 1.06072998046875, 1.203857421875, 1.34698486328125, 1.4901123046875, 1.63323974609375, 1.7763671875, 1.91949462890625, 2.0626220703125, 2.20574951171875, 2.348876953125, 2.49200439453125, 2.6351318359375, 2.77825927734375, 2.92138671875, 3.06451416015625, 3.2076416015625, 3.35076904296875, 3.493896484375, 3.63702392578125, 3.7801513671875, 3.92327880859375, 4.06640625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 11.0, 15.0, 20.0, 36.0, 67.0, 124.0, 179.0, 350.0, 596.0, 999.0, 1728.0, 3128.0, 5665.0, 9936.0, 17134.0, 30031.0, 50480.0, 79640.0, 116002.0, 148349.0, 158535.0, 141548.0, 106480.0, 71765.0, 44335.0, 26395.0, 14968.0, 8587.0, 4972.0, 2777.0, 1556.0, 867.0, 535.0, 305.0, 174.0, 93.0, 60.0, 43.0, 24.0, 12.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.03515625, -4.879638671875, -4.72412109375, -4.568603515625, -4.4130859375, -4.257568359375, -4.10205078125, -3.946533203125, -3.791015625, -3.635498046875, -3.47998046875, -3.324462890625, -3.1689453125, -3.013427734375, -2.85791015625, -2.702392578125, -2.546875, -2.391357421875, -2.23583984375, -2.080322265625, -1.9248046875, -1.769287109375, -1.61376953125, -1.458251953125, -1.302734375, -1.147216796875, -0.99169921875, -0.836181640625, -0.6806640625, -0.525146484375, -0.36962890625, -0.214111328125, -0.05859375, 0.096923828125, 0.25244140625, 0.407958984375, 0.5634765625, 0.718994140625, 0.87451171875, 1.030029296875, 1.185546875, 1.341064453125, 1.49658203125, 1.652099609375, 1.8076171875, 1.963134765625, 2.11865234375, 2.274169921875, 2.4296875, 2.585205078125, 2.74072265625, 2.896240234375, 3.0517578125, 3.207275390625, 3.36279296875, 3.518310546875, 3.673828125, 3.829345703125, 3.98486328125, 4.140380859375, 4.2958984375, 4.451416015625, 4.60693359375, 4.762451171875, 4.91796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 5.0, 11.0, 8.0, 9.0, 2.0, 8.0, 14.0, 18.0, 27.0, 28.0, 36.0, 35.0, 40.0, 45.0, 59.0, 47.0, 46.0, 54.0, 64.0, 44.0, 30.0, 42.0, 53.0, 48.0, 31.0, 41.0, 21.0, 31.0, 18.0, 18.0, 22.0, 17.0, 6.0, 9.0, 4.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.6832275390625, -2.569580078125, -2.4559326171875, -2.34228515625, -2.2286376953125, -2.114990234375, -2.0013427734375, -1.8876953125, -1.7740478515625, -1.660400390625, -1.5467529296875, -1.43310546875, -1.3194580078125, -1.205810546875, -1.0921630859375, -0.978515625, -0.8648681640625, -0.751220703125, -0.6375732421875, -0.52392578125, -0.4102783203125, -0.296630859375, -0.1829833984375, -0.0693359375, 0.0443115234375, 0.157958984375, 0.2716064453125, 0.38525390625, 0.4989013671875, 0.612548828125, 0.7261962890625, 0.83984375, 0.9534912109375, 1.067138671875, 1.1807861328125, 1.29443359375, 1.4080810546875, 1.521728515625, 1.6353759765625, 1.7490234375, 1.8626708984375, 1.976318359375, 2.0899658203125, 2.20361328125, 2.3172607421875, 2.430908203125, 2.5445556640625, 2.658203125, 2.7718505859375, 2.885498046875, 2.9991455078125, 3.11279296875, 3.2264404296875, 3.340087890625, 3.4537353515625, 3.5673828125, 3.6810302734375, 3.794677734375, 3.9083251953125, 4.02197265625, 4.1356201171875, 4.249267578125, 4.3629150390625, 4.4765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 10.0, 15.0, 17.0, 35.0, 47.0, 54.0, 72.0, 104.0, 169.0, 235.0, 282.0, 443.0, 624.0, 975.0, 1345.0, 2125.0, 3531.0, 6128.0, 11388.0, 22332.0, 47523.0, 102503.0, 199651.0, 258804.0, 194664.0, 100715.0, 45902.0, 21957.0, 10984.0, 6009.0, 3317.0, 2218.0, 1337.0, 885.0, 623.0, 432.0, 313.0, 246.0, 156.0, 104.0, 84.0, 54.0, 38.0, 29.0, 24.0, 17.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.1953125, -4.05767822265625, -3.9200439453125, -3.78240966796875, -3.644775390625, -3.50714111328125, -3.3695068359375, -3.23187255859375, -3.09423828125, -2.95660400390625, -2.8189697265625, -2.68133544921875, -2.543701171875, -2.40606689453125, -2.2684326171875, -2.13079833984375, -1.9931640625, -1.85552978515625, -1.7178955078125, -1.58026123046875, -1.442626953125, -1.30499267578125, -1.1673583984375, -1.02972412109375, -0.89208984375, -0.75445556640625, -0.6168212890625, -0.47918701171875, -0.341552734375, -0.20391845703125, -0.0662841796875, 0.07135009765625, 0.208984375, 0.34661865234375, 0.4842529296875, 0.62188720703125, 0.759521484375, 0.89715576171875, 1.0347900390625, 1.17242431640625, 1.31005859375, 1.44769287109375, 1.5853271484375, 1.72296142578125, 1.860595703125, 1.99822998046875, 2.1358642578125, 2.27349853515625, 2.4111328125, 2.54876708984375, 2.6864013671875, 2.82403564453125, 2.961669921875, 3.09930419921875, 3.2369384765625, 3.37457275390625, 3.51220703125, 3.64984130859375, 3.7874755859375, 3.92510986328125, 4.062744140625, 4.20037841796875, 4.3380126953125, 4.47564697265625, 4.61328125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 8.0, 12.0, 15.0, 28.0, 19.0, 53.0, 29.0, 66.0, 61.0, 70.0, 75.0, 65.0, 68.0, 57.0, 67.0, 72.0, 47.0, 37.0, 31.0, 16.0, 18.0, 14.0, 9.0, 11.0, 6.0, 6.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00034999847412109375, -0.000339265912771225, -0.0003285333514213562, -0.0003178007900714874, -0.00030706822872161865, -0.0002963356673717499, -0.0002856031060218811, -0.00027487054467201233, -0.00026413798332214355, -0.0002534054219722748, -0.000242672860622406, -0.00023194029927253723, -0.00022120773792266846, -0.00021047517657279968, -0.0001997426152229309, -0.00018901005387306213, -0.00017827749252319336, -0.00016754493117332458, -0.0001568123698234558, -0.00014607980847358704, -0.00013534724712371826, -0.0001246146857738495, -0.00011388212442398071, -0.00010314956307411194, -9.241700172424316e-05, -8.168444037437439e-05, -7.095187902450562e-05, -6.021931767463684e-05, -4.9486756324768066e-05, -3.875419497489929e-05, -2.8021633625030518e-05, -1.7289072275161743e-05, -6.556510925292969e-06, 4.176050424575806e-06, 1.490861177444458e-05, 2.5641173124313354e-05, 3.637373447418213e-05, 4.71062958240509e-05, 5.783885717391968e-05, 6.857141852378845e-05, 7.930397987365723e-05, 9.0036541223526e-05, 0.00010076910257339478, 0.00011150166392326355, 0.00012223422527313232, 0.0001329667866230011, 0.00014369934797286987, 0.00015443190932273865, 0.00016516447067260742, 0.0001758970320224762, 0.00018662959337234497, 0.00019736215472221375, 0.00020809471607208252, 0.0002188272774219513, 0.00022955983877182007, 0.00024029240012168884, 0.0002510249614715576, 0.0002617575228214264, 0.00027249008417129517, 0.00028322264552116394, 0.0002939552068710327, 0.0003046877682209015, 0.00031542032957077026, 0.00032615289092063904, 0.0003368854522705078]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 9.0, 11.0, 22.0, 32.0, 37.0, 41.0, 57.0, 72.0, 131.0, 140.0, 204.0, 261.0, 364.0, 527.0, 823.0, 1193.0, 2008.0, 3404.0, 6605.0, 14010.0, 33634.0, 86192.0, 202408.0, 304137.0, 221869.0, 98510.0, 38463.0, 15892.0, 7354.0, 3825.0, 2154.0, 1248.0, 825.0, 571.0, 379.0, 296.0, 240.0, 141.0, 105.0, 79.0, 63.0, 51.0, 41.0, 34.0, 28.0, 16.0, 11.0, 6.0, 9.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.4765625, -5.3031005859375, -5.129638671875, -4.9561767578125, -4.78271484375, -4.6092529296875, -4.435791015625, -4.2623291015625, -4.0888671875, -3.9154052734375, -3.741943359375, -3.5684814453125, -3.39501953125, -3.2215576171875, -3.048095703125, -2.8746337890625, -2.701171875, -2.5277099609375, -2.354248046875, -2.1807861328125, -2.00732421875, -1.8338623046875, -1.660400390625, -1.4869384765625, -1.3134765625, -1.1400146484375, -0.966552734375, -0.7930908203125, -0.61962890625, -0.4461669921875, -0.272705078125, -0.0992431640625, 0.07421875, 0.2476806640625, 0.421142578125, 0.5946044921875, 0.76806640625, 0.9415283203125, 1.114990234375, 1.2884521484375, 1.4619140625, 1.6353759765625, 1.808837890625, 1.9822998046875, 2.15576171875, 2.3292236328125, 2.502685546875, 2.6761474609375, 2.849609375, 3.0230712890625, 3.196533203125, 3.3699951171875, 3.54345703125, 3.7169189453125, 3.890380859375, 4.0638427734375, 4.2373046875, 4.4107666015625, 4.584228515625, 4.7576904296875, 4.93115234375, 5.1046142578125, 5.278076171875, 5.4515380859375, 5.625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 11.0, 8.0, 11.0, 24.0, 26.0, 31.0, 40.0, 45.0, 63.0, 62.0, 71.0, 69.0, 55.0, 83.0, 62.0, 62.0, 58.0, 34.0, 35.0, 28.0, 26.0, 21.0, 11.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.1064453125, -1.0707550048828125, -1.035064697265625, -0.9993743896484375, -0.96368408203125, -0.9279937744140625, -0.892303466796875, -0.8566131591796875, -0.8209228515625, -0.7852325439453125, -0.749542236328125, -0.7138519287109375, -0.67816162109375, -0.6424713134765625, -0.606781005859375, -0.5710906982421875, -0.535400390625, -0.4997100830078125, -0.464019775390625, -0.4283294677734375, -0.39263916015625, -0.3569488525390625, -0.321258544921875, -0.2855682373046875, -0.2498779296875, -0.2141876220703125, -0.178497314453125, -0.1428070068359375, -0.10711669921875, -0.0714263916015625, -0.035736083984375, -4.57763671875e-05, 0.03564453125, 0.0713348388671875, 0.107025146484375, 0.1427154541015625, 0.17840576171875, 0.2140960693359375, 0.249786376953125, 0.2854766845703125, 0.3211669921875, 0.3568572998046875, 0.392547607421875, 0.4282379150390625, 0.46392822265625, 0.4996185302734375, 0.535308837890625, 0.5709991455078125, 0.606689453125, 0.6423797607421875, 0.678070068359375, 0.7137603759765625, 0.74945068359375, 0.7851409912109375, 0.820831298828125, 0.8565216064453125, 0.8922119140625, 0.9279022216796875, 0.963592529296875, 0.9992828369140625, 1.03497314453125, 1.0706634521484375, 1.106353759765625, 1.1420440673828125, 1.177734375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 14.0, 28.0, 23.0, 26.0, 33.0, 44.0, 46.0, 66.0, 67.0, 78.0, 79.0, 56.0, 62.0, 65.0, 60.0, 46.0, 44.0, 42.0, 25.0, 21.0, 25.0, 10.0, 10.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.256855010986328, -7.958423614501953, -7.659992694854736, -7.361561298370361, -7.0631303787231445, -6.7646989822387695, -6.4662675857543945, -6.1678361892700195, -5.869405269622803, -5.570973873138428, -5.272542953491211, -4.974111557006836, -4.675680160522461, -4.377249240875244, -4.078817844390869, -3.7803866863250732, -3.4819555282592773, -3.1835243701934814, -2.8850932121276855, -2.5866618156433105, -2.2882306575775146, -1.9897994995117188, -1.6913682222366333, -1.3929369449615479, -1.094505786895752, -0.7960745692253113, -0.4976433515548706, -0.19921213388442993, 0.09921908378601074, 0.39765024185180664, 0.6960815191268921, 0.9945127964019775, 1.2929449081420898, 1.5913760662078857, 1.8898073434829712, 2.1882386207580566, 2.4866697788238525, 2.7851009368896484, 3.0835323333740234, 3.3819634914398193, 3.6803946495056152, 3.978825807571411, 4.277256965637207, 4.575688362121582, 4.874119758605957, 5.172550678253174, 5.470982074737549, 5.769412994384766, 6.067844390869141, 6.366275787353516, 6.664706707000732, 6.963138103485107, 7.261569023132324, 7.560000419616699, 7.858431816101074, 8.15686321258545, 8.455293655395508, 8.753725051879883, 9.052156448364258, 9.350586891174316, 9.649018287658691, 9.947449684143066, 10.245881080627441, 10.544312477111816, 10.842743873596191]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 7.0, 8.0, 12.0, 6.0, 13.0, 18.0, 16.0, 24.0, 22.0, 18.0, 43.0, 19.0, 38.0, 32.0, 25.0, 41.0, 37.0, 40.0, 44.0, 39.0, 30.0, 43.0, 33.0, 33.0, 33.0, 35.0, 26.0, 36.0, 23.0, 19.0, 24.0, 18.0, 22.0, 25.0, 8.0, 15.0, 7.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9709115028381348, -3.8391921520233154, -3.707473039627075, -3.575753688812256, -3.4440345764160156, -3.3123152256011963, -3.180595874786377, -3.0488767623901367, -2.9171574115753174, -2.785438060760498, -2.653718948364258, -2.5219995975494385, -2.390280246734619, -2.258561134338379, -2.1268417835235596, -1.9951225519180298, -1.8634033203125, -1.7316840887069702, -1.5999648571014404, -1.468245506286621, -1.3365262746810913, -1.2048070430755615, -1.0730876922607422, -0.9413684606552124, -0.8096492290496826, -0.6779299974441528, -0.5462107062339783, -0.4144914448261261, -0.2827721834182739, -0.15105295181274414, -0.01933366060256958, 0.11238563060760498, 0.24410486221313477, 0.37582412362098694, 0.5075433850288391, 0.6392626762390137, 0.7709819078445435, 0.9027011394500732, 1.0344204902648926, 1.1661397218704224, 1.2978589534759521, 1.429578185081482, 1.5612974166870117, 1.693016767501831, 1.8247359991073608, 1.9564552307128906, 2.08817458152771, 2.2198939323425293, 2.3516130447387695, 2.483332395553589, 2.615051507949829, 2.7467708587646484, 2.8784899711608887, 3.010209321975708, 3.1419286727905273, 3.2736477851867676, 3.405367136001587, 3.5370864868164062, 3.6688055992126465, 3.800524950027466, 3.932244300842285, 4.063963413238525, 4.195682525634766, 4.327402114868164, 4.459121227264404]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 5.0, 9.0, 7.0, 10.0, 12.0, 20.0, 23.0, 46.0, 61.0, 68.0, 139.0, 159.0, 281.0, 454.0, 678.0, 1048.0, 1851.0, 2975.0, 4947.0, 8522.0, 14791.0, 25915.0, 47929.0, 89841.0, 175287.0, 347675.0, 642379.0, 907245.0, 828155.0, 520793.0, 273099.0, 139445.0, 72378.0, 38121.0, 21033.0, 11995.0, 6807.0, 4018.0, 2342.0, 1363.0, 857.0, 562.0, 321.0, 214.0, 137.0, 93.0, 62.0, 50.0, 27.0, 13.0, 9.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.06640625, -6.84423828125, -6.6220703125, -6.39990234375, -6.177734375, -5.95556640625, -5.7333984375, -5.51123046875, -5.2890625, -5.06689453125, -4.8447265625, -4.62255859375, -4.400390625, -4.17822265625, -3.9560546875, -3.73388671875, -3.51171875, -3.28955078125, -3.0673828125, -2.84521484375, -2.623046875, -2.40087890625, -2.1787109375, -1.95654296875, -1.734375, -1.51220703125, -1.2900390625, -1.06787109375, -0.845703125, -0.62353515625, -0.4013671875, -0.17919921875, 0.04296875, 0.26513671875, 0.4873046875, 0.70947265625, 0.931640625, 1.15380859375, 1.3759765625, 1.59814453125, 1.8203125, 2.04248046875, 2.2646484375, 2.48681640625, 2.708984375, 2.93115234375, 3.1533203125, 3.37548828125, 3.59765625, 3.81982421875, 4.0419921875, 4.26416015625, 4.486328125, 4.70849609375, 4.9306640625, 5.15283203125, 5.375, 5.59716796875, 5.8193359375, 6.04150390625, 6.263671875, 6.48583984375, 6.7080078125, 6.93017578125, 7.15234375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 7.0, 8.0, 12.0, 12.0, 10.0, 24.0, 32.0, 24.0, 31.0, 34.0, 38.0, 45.0, 41.0, 49.0, 59.0, 58.0, 47.0, 35.0, 36.0, 49.0, 36.0, 43.0, 42.0, 43.0, 35.0, 25.0, 31.0, 19.0, 13.0, 7.0, 9.0, 7.0, 9.0, 9.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.822662353515625, -3.67071533203125, -3.518768310546875, -3.3668212890625, -3.214874267578125, -3.06292724609375, -2.910980224609375, -2.759033203125, -2.607086181640625, -2.45513916015625, -2.303192138671875, -2.1512451171875, -1.999298095703125, -1.84735107421875, -1.695404052734375, -1.54345703125, -1.391510009765625, -1.23956298828125, -1.087615966796875, -0.9356689453125, -0.783721923828125, -0.63177490234375, -0.479827880859375, -0.327880859375, -0.175933837890625, -0.02398681640625, 0.127960205078125, 0.2799072265625, 0.431854248046875, 0.58380126953125, 0.735748291015625, 0.8876953125, 1.039642333984375, 1.19158935546875, 1.343536376953125, 1.4954833984375, 1.647430419921875, 1.79937744140625, 1.951324462890625, 2.103271484375, 2.255218505859375, 2.40716552734375, 2.559112548828125, 2.7110595703125, 2.863006591796875, 3.01495361328125, 3.166900634765625, 3.31884765625, 3.470794677734375, 3.62274169921875, 3.774688720703125, 3.9266357421875, 4.078582763671875, 4.23052978515625, 4.382476806640625, 4.534423828125, 4.686370849609375, 4.83831787109375, 4.990264892578125, 5.1422119140625, 5.294158935546875, 5.44610595703125, 5.598052978515625, 5.75]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 12.0, 18.0, 35.0, 49.0, 110.0, 164.0, 253.0, 412.0, 727.0, 1243.0, 2199.0, 3628.0, 6580.0, 11854.0, 22001.0, 40766.0, 78443.0, 152811.0, 294116.0, 539645.0, 824988.0, 872000.0, 615402.0, 346684.0, 180697.0, 93642.0, 48797.0, 25480.0, 13776.0, 7642.0, 4294.0, 2400.0, 1336.0, 845.0, 474.0, 279.0, 186.0, 108.0, 59.0, 45.0, 22.0, 15.0, 19.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.359375, -8.0723876953125, -7.785400390625, -7.4984130859375, -7.21142578125, -6.9244384765625, -6.637451171875, -6.3504638671875, -6.0634765625, -5.7764892578125, -5.489501953125, -5.2025146484375, -4.91552734375, -4.6285400390625, -4.341552734375, -4.0545654296875, -3.767578125, -3.4805908203125, -3.193603515625, -2.9066162109375, -2.61962890625, -2.3326416015625, -2.045654296875, -1.7586669921875, -1.4716796875, -1.1846923828125, -0.897705078125, -0.6107177734375, -0.32373046875, -0.0367431640625, 0.250244140625, 0.5372314453125, 0.82421875, 1.1112060546875, 1.398193359375, 1.6851806640625, 1.97216796875, 2.2591552734375, 2.546142578125, 2.8331298828125, 3.1201171875, 3.4071044921875, 3.694091796875, 3.9810791015625, 4.26806640625, 4.5550537109375, 4.842041015625, 5.1290283203125, 5.416015625, 5.7030029296875, 5.989990234375, 6.2769775390625, 6.56396484375, 6.8509521484375, 7.137939453125, 7.4249267578125, 7.7119140625, 7.9989013671875, 8.285888671875, 8.5728759765625, 8.85986328125, 9.1468505859375, 9.433837890625, 9.7208251953125, 10.0078125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 16.0, 15.0, 15.0, 29.0, 37.0, 37.0, 48.0, 61.0, 77.0, 111.0, 113.0, 143.0, 150.0, 204.0, 238.0, 254.0, 271.0, 257.0, 253.0, 202.0, 246.0, 233.0, 173.0, 152.0, 154.0, 110.0, 102.0, 70.0, 53.0, 43.0, 43.0, 37.0, 30.0, 23.0, 20.0, 9.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.716796875, -2.6339111328125, -2.551025390625, -2.4681396484375, -2.38525390625, -2.3023681640625, -2.219482421875, -2.1365966796875, -2.0537109375, -1.9708251953125, -1.887939453125, -1.8050537109375, -1.72216796875, -1.6392822265625, -1.556396484375, -1.4735107421875, -1.390625, -1.3077392578125, -1.224853515625, -1.1419677734375, -1.05908203125, -0.9761962890625, -0.893310546875, -0.8104248046875, -0.7275390625, -0.6446533203125, -0.561767578125, -0.4788818359375, -0.39599609375, -0.3131103515625, -0.230224609375, -0.1473388671875, -0.064453125, 0.0184326171875, 0.101318359375, 0.1842041015625, 0.26708984375, 0.3499755859375, 0.432861328125, 0.5157470703125, 0.5986328125, 0.6815185546875, 0.764404296875, 0.8472900390625, 0.93017578125, 1.0130615234375, 1.095947265625, 1.1788330078125, 1.26171875, 1.3446044921875, 1.427490234375, 1.5103759765625, 1.59326171875, 1.6761474609375, 1.759033203125, 1.8419189453125, 1.9248046875, 2.0076904296875, 2.090576171875, 2.1734619140625, 2.25634765625, 2.3392333984375, 2.422119140625, 2.5050048828125, 2.587890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 20.0, 23.0, 18.0, 22.0, 32.0, 26.0, 41.0, 41.0, 49.0, 48.0, 57.0, 53.0, 58.0, 72.0, 63.0, 61.0, 39.0, 40.0, 47.0, 37.0, 30.0, 24.0, 22.0, 11.0, 15.0, 3.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.052596092224121, -9.751803398132324, -9.451009750366211, -9.150217056274414, -8.849424362182617, -8.54863166809082, -8.247838020324707, -7.94704532623291, -7.646252155303955, -7.345458984375, -7.044666290283203, -6.743873119354248, -6.443079948425293, -6.142287254333496, -5.841494083404541, -5.540700912475586, -5.239908218383789, -4.939115047454834, -4.638322353363037, -4.337529182434082, -4.036736488342285, -3.73594331741333, -3.435150146484375, -3.134357213973999, -2.833564281463623, -2.532771348953247, -2.231978416442871, -1.931185245513916, -1.63039231300354, -1.329599380493164, -1.0288063287734985, -0.728013277053833, -0.42722129821777344, -0.12642830610275269, 0.17436468601226807, 0.4751576781272888, 0.7759506702423096, 1.0767436027526855, 1.377536654472351, 1.6783297061920166, 1.9791226387023926, 2.2799155712127686, 2.5807085037231445, 2.8815016746520996, 3.1822946071624756, 3.4830875396728516, 3.7838807106018066, 4.084673881530762, 4.385466575622559, 4.686259746551514, 4.9870524406433105, 5.287845611572266, 5.5886383056640625, 5.889431476593018, 6.190224647521973, 6.4910173416137695, 6.791810512542725, 7.09260368347168, 7.393396377563477, 7.694189548492432, 7.994982719421387, 8.295775413513184, 8.59656810760498, 8.897361755371094, 9.19815444946289]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 13.0, 12.0, 16.0, 11.0, 15.0, 10.0, 17.0, 36.0, 24.0, 32.0, 28.0, 21.0, 31.0, 30.0, 42.0, 38.0, 27.0, 43.0, 44.0, 28.0, 53.0, 37.0, 35.0, 40.0, 34.0, 36.0, 26.0, 30.0, 27.0, 26.0, 20.0, 17.0, 24.0, 12.0, 12.0, 8.0, 5.0, 11.0, 6.0, 6.0, 2.0, 7.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.544286251068115, -5.38059663772583, -5.216907024383545, -5.05321741104126, -4.889527797698975, -4.7258381843566895, -4.562148571014404, -4.398458957672119, -4.234769344329834, -4.071079730987549, -3.9073901176452637, -3.7437005043029785, -3.5800108909606934, -3.416321277618408, -3.252631664276123, -3.088942050933838, -2.9252524375915527, -2.7615628242492676, -2.5978732109069824, -2.4341835975646973, -2.270493984222412, -2.106804370880127, -1.9431147575378418, -1.7794251441955566, -1.6157355308532715, -1.4520459175109863, -1.2883563041687012, -1.124666690826416, -0.9609770774841309, -0.7972874641418457, -0.6335978507995605, -0.4699082374572754, -0.30621910095214844, -0.14252948760986328, 0.021160125732421875, 0.18484973907470703, 0.3485393524169922, 0.5122289657592773, 0.6759185791015625, 0.8396081924438477, 1.0032978057861328, 1.166987419128418, 1.3306770324707031, 1.4943666458129883, 1.6580562591552734, 1.8217458724975586, 1.9854354858398438, 2.149125099182129, 2.312814712524414, 2.476504325866699, 2.6401939392089844, 2.8038835525512695, 2.9675731658935547, 3.13126277923584, 3.294952392578125, 3.45864200592041, 3.6223316192626953, 3.7860212326049805, 3.9497108459472656, 4.113400459289551, 4.277090072631836, 4.440779685974121, 4.604469299316406, 4.768158912658691, 4.931848526000977]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 7.0, 11.0, 8.0, 23.0, 17.0, 35.0, 73.0, 93.0, 115.0, 194.0, 324.0, 501.0, 741.0, 1217.0, 2139.0, 3366.0, 5548.0, 9446.0, 16172.0, 27408.0, 47725.0, 81612.0, 132071.0, 183242.0, 187068.0, 139279.0, 87014.0, 51309.0, 29384.0, 17032.0, 10141.0, 5950.0, 3526.0, 2116.0, 1317.0, 812.0, 518.0, 330.0, 228.0, 139.0, 92.0, 66.0, 44.0, 25.0, 23.0, 14.0, 15.0, 12.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6492996215820312, -0.6277008056640625, -0.6061019897460938, -0.584503173828125, -0.5629043579101562, -0.5413055419921875, -0.5197067260742188, -0.49810791015625, -0.47650909423828125, -0.4549102783203125, -0.43331146240234375, -0.411712646484375, -0.39011383056640625, -0.3685150146484375, -0.34691619873046875, -0.3253173828125, -0.30371856689453125, -0.2821197509765625, -0.26052093505859375, -0.238922119140625, -0.21732330322265625, -0.1957244873046875, -0.17412567138671875, -0.15252685546875, -0.13092803955078125, -0.1093292236328125, -0.08773040771484375, -0.066131591796875, -0.04453277587890625, -0.0229339599609375, -0.00133514404296875, 0.020263671875, 0.04186248779296875, 0.0634613037109375, 0.08506011962890625, 0.106658935546875, 0.12825775146484375, 0.1498565673828125, 0.17145538330078125, 0.19305419921875, 0.21465301513671875, 0.2362518310546875, 0.25785064697265625, 0.279449462890625, 0.30104827880859375, 0.3226470947265625, 0.34424591064453125, 0.3658447265625, 0.38744354248046875, 0.4090423583984375, 0.43064117431640625, 0.452239990234375, 0.47383880615234375, 0.4954376220703125, 0.5170364379882812, 0.53863525390625, 0.5602340698242188, 0.5818328857421875, 0.6034317016601562, 0.625030517578125, 0.6466293334960938, 0.6682281494140625, 0.6898269653320312, 0.71142578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 2.0, 3.0, 9.0, 9.0, 11.0, 12.0, 10.0, 7.0, 14.0, 17.0, 30.0, 23.0, 29.0, 29.0, 32.0, 28.0, 35.0, 35.0, 46.0, 42.0, 40.0, 58.0, 44.0, 39.0, 53.0, 29.0, 36.0, 38.0, 34.0, 41.0, 21.0, 26.0, 21.0, 18.0, 20.0, 17.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75775146484375, -5.5623779296875, -5.36700439453125, -5.171630859375, -4.97625732421875, -4.7808837890625, -4.58551025390625, -4.39013671875, -4.19476318359375, -3.9993896484375, -3.80401611328125, -3.608642578125, -3.41326904296875, -3.2178955078125, -3.02252197265625, -2.8271484375, -2.63177490234375, -2.4364013671875, -2.24102783203125, -2.045654296875, -1.85028076171875, -1.6549072265625, -1.45953369140625, -1.26416015625, -1.06878662109375, -0.8734130859375, -0.67803955078125, -0.482666015625, -0.28729248046875, -0.0919189453125, 0.10345458984375, 0.298828125, 0.49420166015625, 0.6895751953125, 0.88494873046875, 1.080322265625, 1.27569580078125, 1.4710693359375, 1.66644287109375, 1.86181640625, 2.05718994140625, 2.2525634765625, 2.44793701171875, 2.643310546875, 2.83868408203125, 3.0340576171875, 3.22943115234375, 3.4248046875, 3.62017822265625, 3.8155517578125, 4.01092529296875, 4.206298828125, 4.40167236328125, 4.5970458984375, 4.79241943359375, 4.98779296875, 5.18316650390625, 5.3785400390625, 5.57391357421875, 5.769287109375, 5.96466064453125, 6.1600341796875, 6.35540771484375, 6.55078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 5.0, 13.0, 13.0, 12.0, 18.0, 29.0, 38.0, 46.0, 56.0, 84.0, 120.0, 146.0, 212.0, 306.0, 506.0, 682.0, 1115.0, 1899.0, 3222.0, 6055.0, 12095.0, 26672.0, 184586.0, 736996.0, 39928.0, 15604.0, 7679.0, 4032.0, 2341.0, 1397.0, 809.0, 515.0, 356.0, 257.0, 196.0, 140.0, 96.0, 60.0, 54.0, 42.0, 21.0, 26.0, 23.0, 7.0, 6.0, 8.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.912109375, -1.8487548828125, -1.785400390625, -1.7220458984375, -1.65869140625, -1.5953369140625, -1.531982421875, -1.4686279296875, -1.4052734375, -1.3419189453125, -1.278564453125, -1.2152099609375, -1.15185546875, -1.0885009765625, -1.025146484375, -0.9617919921875, -0.8984375, -0.8350830078125, -0.771728515625, -0.7083740234375, -0.64501953125, -0.5816650390625, -0.518310546875, -0.4549560546875, -0.3916015625, -0.3282470703125, -0.264892578125, -0.2015380859375, -0.13818359375, -0.0748291015625, -0.011474609375, 0.0518798828125, 0.115234375, 0.1785888671875, 0.241943359375, 0.3052978515625, 0.36865234375, 0.4320068359375, 0.495361328125, 0.5587158203125, 0.6220703125, 0.6854248046875, 0.748779296875, 0.8121337890625, 0.87548828125, 0.9388427734375, 1.002197265625, 1.0655517578125, 1.12890625, 1.1922607421875, 1.255615234375, 1.3189697265625, 1.38232421875, 1.4456787109375, 1.509033203125, 1.5723876953125, 1.6357421875, 1.6990966796875, 1.762451171875, 1.8258056640625, 1.88916015625, 1.9525146484375, 2.015869140625, 2.0792236328125, 2.142578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 7.0, 8.0, 8.0, 13.0, 11.0, 11.0, 19.0, 22.0, 22.0, 20.0, 22.0, 34.0, 33.0, 32.0, 40.0, 31.0, 33.0, 41.0, 40.0, 38.0, 43.0, 38.0, 46.0, 38.0, 32.0, 33.0, 29.0, 31.0, 36.0, 27.0, 30.0, 21.0, 15.0, 14.0, 12.0, 9.0, 10.0, 13.0, 3.0, 4.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.703125, -3.583343505859375, -3.46356201171875, -3.343780517578125, -3.2239990234375, -3.104217529296875, -2.98443603515625, -2.864654541015625, -2.744873046875, -2.625091552734375, -2.50531005859375, -2.385528564453125, -2.2657470703125, -2.145965576171875, -2.02618408203125, -1.906402587890625, -1.78662109375, -1.666839599609375, -1.54705810546875, -1.427276611328125, -1.3074951171875, -1.187713623046875, -1.06793212890625, -0.948150634765625, -0.828369140625, -0.708587646484375, -0.58880615234375, -0.469024658203125, -0.3492431640625, -0.229461669921875, -0.10968017578125, 0.010101318359375, 0.1298828125, 0.249664306640625, 0.36944580078125, 0.489227294921875, 0.6090087890625, 0.728790283203125, 0.84857177734375, 0.968353271484375, 1.088134765625, 1.207916259765625, 1.32769775390625, 1.447479248046875, 1.5672607421875, 1.687042236328125, 1.80682373046875, 1.926605224609375, 2.04638671875, 2.166168212890625, 2.28594970703125, 2.405731201171875, 2.5255126953125, 2.645294189453125, 2.76507568359375, 2.884857177734375, 3.004638671875, 3.124420166015625, 3.24420166015625, 3.363983154296875, 3.4837646484375, 3.603546142578125, 3.72332763671875, 3.843109130859375, 3.962890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 11.0, 12.0, 28.0, 25.0, 56.0, 65.0, 94.0, 115.0, 184.0, 285.0, 421.0, 642.0, 979.0, 1461.0, 2147.0, 3379.0, 5138.0, 8188.0, 13455.0, 23715.0, 108709.0, 799764.0, 34049.0, 17211.0, 10228.0, 6368.0, 3996.0, 2624.0, 1754.0, 1149.0, 754.0, 491.0, 336.0, 220.0, 154.0, 111.0, 72.0, 49.0, 32.0, 30.0, 14.0, 11.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.349609375, -0.33908843994140625, -0.3285675048828125, -0.31804656982421875, -0.307525634765625, -0.29700469970703125, -0.2864837646484375, -0.27596282958984375, -0.26544189453125, -0.25492095947265625, -0.2444000244140625, -0.23387908935546875, -0.223358154296875, -0.21283721923828125, -0.2023162841796875, -0.19179534912109375, -0.1812744140625, -0.17075347900390625, -0.1602325439453125, -0.14971160888671875, -0.139190673828125, -0.12866973876953125, -0.1181488037109375, -0.10762786865234375, -0.09710693359375, -0.08658599853515625, -0.0760650634765625, -0.06554412841796875, -0.055023193359375, -0.04450225830078125, -0.0339813232421875, -0.02346038818359375, -0.012939453125, -0.00241851806640625, 0.0081024169921875, 0.01862335205078125, 0.029144287109375, 0.03966522216796875, 0.0501861572265625, 0.06070709228515625, 0.07122802734375, 0.08174896240234375, 0.0922698974609375, 0.10279083251953125, 0.113311767578125, 0.12383270263671875, 0.1343536376953125, 0.14487457275390625, 0.1553955078125, 0.16591644287109375, 0.1764373779296875, 0.18695831298828125, 0.197479248046875, 0.20800018310546875, 0.2185211181640625, 0.22904205322265625, 0.23956298828125, 0.25008392333984375, 0.2606048583984375, 0.27112579345703125, 0.281646728515625, 0.29216766357421875, 0.3026885986328125, 0.31320953369140625, 0.32373046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 10.0, 19.0, 19.0, 23.0, 26.0, 28.0, 33.0, 29.0, 24.0, 34.0, 30.0, 43.0, 37.0, 38.0, 29.0, 38.0, 44.0, 55.0, 57.0, 24.0, 38.0, 40.0, 34.0, 38.0, 26.0, 19.0, 21.0, 27.0, 9.0, 21.0, 12.0, 8.0, 11.0, 7.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3769214749336243e-05, -2.2921711206436157e-05, -2.2074207663536072e-05, -2.1226704120635986e-05, -2.03792005777359e-05, -1.9531697034835815e-05, -1.868419349193573e-05, -1.7836689949035645e-05, -1.698918640613556e-05, -1.6141682863235474e-05, -1.5294179320335388e-05, -1.4446675777435303e-05, -1.3599172234535217e-05, -1.2751668691635132e-05, -1.1904165148735046e-05, -1.1056661605834961e-05, -1.0209158062934875e-05, -9.36165452003479e-06, -8.514150977134705e-06, -7.666647434234619e-06, -6.819143891334534e-06, -5.971640348434448e-06, -5.124136805534363e-06, -4.276633262634277e-06, -3.429129719734192e-06, -2.5816261768341064e-06, -1.734122633934021e-06, -8.866190910339355e-07, -3.91155481338501e-08, 8.083879947662354e-07, 1.6558915376663208e-06, 2.5033950805664062e-06, 3.3508986234664917e-06, 4.198402166366577e-06, 5.045905709266663e-06, 5.893409252166748e-06, 6.7409127950668335e-06, 7.588416337966919e-06, 8.435919880867004e-06, 9.28342342376709e-06, 1.0130926966667175e-05, 1.097843050956726e-05, 1.1825934052467346e-05, 1.2673437595367432e-05, 1.3520941138267517e-05, 1.4368444681167603e-05, 1.5215948224067688e-05, 1.6063451766967773e-05, 1.691095530986786e-05, 1.7758458852767944e-05, 1.860596239566803e-05, 1.9453465938568115e-05, 2.03009694814682e-05, 2.1148473024368286e-05, 2.199597656726837e-05, 2.2843480110168457e-05, 2.3690983653068542e-05, 2.4538487195968628e-05, 2.5385990738868713e-05, 2.62334942817688e-05, 2.7080997824668884e-05, 2.792850136756897e-05, 2.8776004910469055e-05, 2.962350845336914e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 17.0, 23.0, 28.0, 37.0, 54.0, 89.0, 119.0, 198.0, 294.0, 484.0, 829.0, 1229.0, 1873.0, 2948.0, 4883.0, 7726.0, 12928.0, 21809.0, 36345.0, 61327.0, 100451.0, 150181.0, 184201.0, 165239.0, 115510.0, 71664.0, 42942.0, 25444.0, 15322.0, 9088.0, 5701.0, 3518.0, 2197.0, 1380.0, 905.0, 567.0, 350.0, 222.0, 143.0, 98.0, 66.0, 43.0, 29.0, 17.0, 13.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.18826675415039062, -0.18231964111328125, -0.17637252807617188, -0.1704254150390625, -0.16447830200195312, -0.15853118896484375, -0.15258407592773438, -0.146636962890625, -0.14068984985351562, -0.13474273681640625, -0.12879562377929688, -0.1228485107421875, -0.11690139770507812, -0.11095428466796875, -0.10500717163085938, -0.09906005859375, -0.09311294555664062, -0.08716583251953125, -0.08121871948242188, -0.0752716064453125, -0.06932449340820312, -0.06337738037109375, -0.057430267333984375, -0.051483154296875, -0.045536041259765625, -0.03958892822265625, -0.033641815185546875, -0.0276947021484375, -0.021747589111328125, -0.01580047607421875, -0.009853363037109375, -0.00390625, 0.002040863037109375, 0.00798797607421875, 0.013935089111328125, 0.0198822021484375, 0.025829315185546875, 0.03177642822265625, 0.037723541259765625, 0.043670654296875, 0.049617767333984375, 0.05556488037109375, 0.061511993408203125, 0.0674591064453125, 0.07340621948242188, 0.07935333251953125, 0.08530044555664062, 0.09124755859375, 0.09719467163085938, 0.10314178466796875, 0.10908889770507812, 0.1150360107421875, 0.12098312377929688, 0.12693023681640625, 0.13287734985351562, 0.138824462890625, 0.14477157592773438, 0.15071868896484375, 0.15666580200195312, 0.1626129150390625, 0.16856002807617188, 0.17450714111328125, 0.18045425415039062, 0.1864013671875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 15.0, 14.0, 16.0, 26.0, 34.0, 29.0, 43.0, 39.0, 47.0, 53.0, 44.0, 71.0, 56.0, 69.0, 50.0, 48.0, 54.0, 54.0, 39.0, 25.0, 30.0, 23.0, 19.0, 16.0, 13.0, 8.0, 9.0, 8.0, 9.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.055511474609375, -0.05358457565307617, -0.051657676696777344, -0.049730777740478516, -0.04780387878417969, -0.04587697982788086, -0.04395008087158203, -0.0420231819152832, -0.040096282958984375, -0.03816938400268555, -0.03624248504638672, -0.03431558609008789, -0.03238868713378906, -0.030461788177490234, -0.028534889221191406, -0.026607990264892578, -0.02468109130859375, -0.022754192352294922, -0.020827293395996094, -0.018900394439697266, -0.016973495483398438, -0.01504659652709961, -0.013119697570800781, -0.011192798614501953, -0.009265899658203125, -0.007339000701904297, -0.005412101745605469, -0.0034852027893066406, -0.0015583038330078125, 0.0003685951232910156, 0.0022954940795898438, 0.004222393035888672, 0.0061492919921875, 0.008076190948486328, 0.010003089904785156, 0.011929988861083984, 0.013856887817382812, 0.01578378677368164, 0.01771068572998047, 0.019637584686279297, 0.021564483642578125, 0.023491382598876953, 0.02541828155517578, 0.02734518051147461, 0.029272079467773438, 0.031198978424072266, 0.033125877380371094, 0.03505277633666992, 0.03697967529296875, 0.03890657424926758, 0.040833473205566406, 0.042760372161865234, 0.04468727111816406, 0.04661417007446289, 0.04854106903076172, 0.05046796798706055, 0.052394866943359375, 0.0543217658996582, 0.05624866485595703, 0.05817556381225586, 0.06010246276855469, 0.062029361724853516, 0.06395626068115234, 0.06588315963745117, 0.06781005859375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 6.0, 13.0, 22.0, 18.0, 22.0, 21.0, 37.0, 32.0, 41.0, 47.0, 47.0, 47.0, 58.0, 57.0, 65.0, 70.0, 48.0, 60.0, 41.0, 44.0, 37.0, 34.0, 31.0, 21.0, 18.0, 12.0, 10.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.832262992858887, -9.5341215133667, -9.235980033874512, -8.937837600708008, -8.63969612121582, -8.341554641723633, -8.043413162231445, -7.745271682739258, -7.447129726409912, -7.148988246917725, -6.850846290588379, -6.552704811096191, -6.254563331604004, -5.956421375274658, -5.658279895782471, -5.360137939453125, -5.0619964599609375, -4.76385498046875, -4.465713024139404, -4.167571544647217, -3.86942982673645, -3.5712881088256836, -3.273146629333496, -2.9750049114227295, -2.676863193511963, -2.3787214756011963, -2.0805797576904297, -1.7824382781982422, -1.4842965602874756, -1.186154842376709, -0.8880132436752319, -0.5898716449737549, -0.2917299270629883, 0.006411731243133545, 0.30455338954925537, 0.6026950478553772, 0.900836706161499, 1.1989784240722656, 1.4971200227737427, 1.7952616214752197, 2.0934033393859863, 2.391545057296753, 2.6896867752075195, 2.987828254699707, 3.2859699726104736, 3.5841116905212402, 3.8822531700134277, 4.180395126342773, 4.478536605834961, 4.776678085327148, 5.074820041656494, 5.372961521148682, 5.671103477478027, 5.969244956970215, 6.267386436462402, 6.56552791595459, 6.8636698722839355, 7.161811351776123, 7.459953308105469, 7.758094787597656, 8.056236267089844, 8.354377746582031, 8.652520179748535, 8.950661659240723, 9.24880313873291]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 7.0, 7.0, 15.0, 12.0, 16.0, 9.0, 14.0, 12.0, 17.0, 35.0, 29.0, 30.0, 25.0, 23.0, 31.0, 36.0, 36.0, 37.0, 29.0, 51.0, 36.0, 31.0, 47.0, 45.0, 32.0, 38.0, 34.0, 32.0, 30.0, 30.0, 28.0, 25.0, 19.0, 14.0, 24.0, 12.0, 14.0, 7.0, 5.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.478827476501465, -5.315625190734863, -5.1524224281311035, -4.989220142364502, -4.8260178565979, -4.662815570831299, -4.499612808227539, -4.3364105224609375, -4.173208236694336, -4.010005950927734, -3.8468034267425537, -3.683600902557373, -3.5203986167907715, -3.357196092605591, -3.19399356842041, -3.0307912826538086, -2.867588758468628, -2.7043862342834473, -2.5411839485168457, -2.377981424331665, -2.2147791385650635, -2.051576614379883, -1.8883742094039917, -1.7251718044281006, -1.5619693994522095, -1.3987669944763184, -1.2355645895004272, -1.0723621845245361, -0.9091597199440002, -0.7459573149681091, -0.5827548503875732, -0.41955244541168213, -0.256350040435791, -0.09314762055873871, 0.0700547993183136, 0.2332572340965271, 0.3964596390724182, 0.5596620440483093, 0.7228645086288452, 0.8860669136047363, 1.0492693185806274, 1.2124717235565186, 1.3756741285324097, 1.5388765335083008, 1.7020790576934814, 1.865281343460083, 2.0284838676452637, 2.1916861534118652, 2.354888677597046, 2.5180912017822266, 2.681293487548828, 2.844496011734009, 3.0076982975006104, 3.170900821685791, 3.3341031074523926, 3.4973056316375732, 3.660508155822754, 3.8237106800079346, 3.986912965774536, 4.150115489959717, 4.313317775726318, 4.47652006149292, 4.63972282409668, 4.802925109863281, 4.966127395629883]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 22.0, 21.0, 47.0, 60.0, 94.0, 147.0, 229.0, 325.0, 463.0, 735.0, 1195.0, 1746.0, 2808.0, 4309.0, 6651.0, 9953.0, 14834.0, 22394.0, 32843.0, 46396.0, 63640.0, 82631.0, 99908.0, 110825.0, 112827.0, 104792.0, 89115.0, 70896.0, 53277.0, 37934.0, 25945.0, 17783.0, 11644.0, 7599.0, 5015.0, 3284.0, 2128.0, 1416.0, 900.0, 566.0, 363.0, 285.0, 163.0, 115.0, 72.0, 54.0, 34.0, 20.0, 18.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.8984375, -3.77734375, -3.65625, -3.53515625, -3.4140625, -3.29296875, -3.171875, -3.05078125, -2.9296875, -2.80859375, -2.6875, -2.56640625, -2.4453125, -2.32421875, -2.203125, -2.08203125, -1.9609375, -1.83984375, -1.71875, -1.59765625, -1.4765625, -1.35546875, -1.234375, -1.11328125, -0.9921875, -0.87109375, -0.75, -0.62890625, -0.5078125, -0.38671875, -0.265625, -0.14453125, -0.0234375, 0.09765625, 0.21875, 0.33984375, 0.4609375, 0.58203125, 0.703125, 0.82421875, 0.9453125, 1.06640625, 1.1875, 1.30859375, 1.4296875, 1.55078125, 1.671875, 1.79296875, 1.9140625, 2.03515625, 2.15625, 2.27734375, 2.3984375, 2.51953125, 2.640625, 2.76171875, 2.8828125, 3.00390625, 3.125, 3.24609375, 3.3671875, 3.48828125, 3.609375, 3.73046875, 3.8515625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 14.0, 11.0, 24.0, 17.0, 18.0, 26.0, 37.0, 26.0, 32.0, 18.0, 32.0, 38.0, 46.0, 31.0, 40.0, 48.0, 28.0, 39.0, 47.0, 32.0, 39.0, 41.0, 25.0, 44.0, 30.0, 31.0, 23.0, 22.0, 24.0, 22.0, 7.0, 10.0, 9.0, 7.0, 5.0, 9.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0], "bins": [-6.69140625, -6.51092529296875, -6.3304443359375, -6.14996337890625, -5.969482421875, -5.78900146484375, -5.6085205078125, -5.42803955078125, -5.24755859375, -5.06707763671875, -4.8865966796875, -4.70611572265625, -4.525634765625, -4.34515380859375, -4.1646728515625, -3.98419189453125, -3.8037109375, -3.62322998046875, -3.4427490234375, -3.26226806640625, -3.081787109375, -2.90130615234375, -2.7208251953125, -2.54034423828125, -2.35986328125, -2.17938232421875, -1.9989013671875, -1.81842041015625, -1.637939453125, -1.45745849609375, -1.2769775390625, -1.09649658203125, -0.916015625, -0.73553466796875, -0.5550537109375, -0.37457275390625, -0.194091796875, -0.01361083984375, 0.1668701171875, 0.34735107421875, 0.52783203125, 0.70831298828125, 0.8887939453125, 1.06927490234375, 1.249755859375, 1.43023681640625, 1.6107177734375, 1.79119873046875, 1.9716796875, 2.15216064453125, 2.3326416015625, 2.51312255859375, 2.693603515625, 2.87408447265625, 3.0545654296875, 3.23504638671875, 3.41552734375, 3.59600830078125, 3.7764892578125, 3.95697021484375, 4.137451171875, 4.31793212890625, 4.4984130859375, 4.67889404296875, 4.859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 24.0, 21.0, 34.0, 52.0, 85.0, 112.0, 179.0, 275.0, 445.0, 679.0, 1075.0, 1722.0, 2652.0, 4383.0, 6939.0, 10829.0, 16856.0, 26276.0, 39140.0, 56839.0, 78006.0, 100234.0, 117554.0, 123762.0, 116502.0, 99299.0, 77704.0, 56173.0, 38992.0, 25871.0, 16858.0, 10662.0, 6653.0, 4335.0, 2684.0, 1675.0, 1064.0, 709.0, 397.0, 281.0, 165.0, 107.0, 67.0, 57.0, 39.0, 27.0, 13.0, 10.0, 11.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.40234375, -4.2579345703125, -4.113525390625, -3.9691162109375, -3.82470703125, -3.6802978515625, -3.535888671875, -3.3914794921875, -3.2470703125, -3.1026611328125, -2.958251953125, -2.8138427734375, -2.66943359375, -2.5250244140625, -2.380615234375, -2.2362060546875, -2.091796875, -1.9473876953125, -1.802978515625, -1.6585693359375, -1.51416015625, -1.3697509765625, -1.225341796875, -1.0809326171875, -0.9365234375, -0.7921142578125, -0.647705078125, -0.5032958984375, -0.35888671875, -0.2144775390625, -0.070068359375, 0.0743408203125, 0.21875, 0.3631591796875, 0.507568359375, 0.6519775390625, 0.79638671875, 0.9407958984375, 1.085205078125, 1.2296142578125, 1.3740234375, 1.5184326171875, 1.662841796875, 1.8072509765625, 1.95166015625, 2.0960693359375, 2.240478515625, 2.3848876953125, 2.529296875, 2.6737060546875, 2.818115234375, 2.9625244140625, 3.10693359375, 3.2513427734375, 3.395751953125, 3.5401611328125, 3.6845703125, 3.8289794921875, 3.973388671875, 4.1177978515625, 4.26220703125, 4.4066162109375, 4.551025390625, 4.6954345703125, 4.83984375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 8.0, 6.0, 14.0, 10.0, 11.0, 14.0, 22.0, 30.0, 29.0, 41.0, 30.0, 37.0, 38.0, 33.0, 42.0, 62.0, 44.0, 39.0, 48.0, 60.0, 28.0, 58.0, 34.0, 34.0, 35.0, 29.0, 34.0, 21.0, 31.0, 23.0, 15.0, 9.0, 6.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.12774658203125, -3.9976806640625, -3.86761474609375, -3.737548828125, -3.60748291015625, -3.4774169921875, -3.34735107421875, -3.21728515625, -3.08721923828125, -2.9571533203125, -2.82708740234375, -2.697021484375, -2.56695556640625, -2.4368896484375, -2.30682373046875, -2.1767578125, -2.04669189453125, -1.9166259765625, -1.78656005859375, -1.656494140625, -1.52642822265625, -1.3963623046875, -1.26629638671875, -1.13623046875, -1.00616455078125, -0.8760986328125, -0.74603271484375, -0.615966796875, -0.48590087890625, -0.3558349609375, -0.22576904296875, -0.095703125, 0.03436279296875, 0.1644287109375, 0.29449462890625, 0.424560546875, 0.55462646484375, 0.6846923828125, 0.81475830078125, 0.94482421875, 1.07489013671875, 1.2049560546875, 1.33502197265625, 1.465087890625, 1.59515380859375, 1.7252197265625, 1.85528564453125, 1.9853515625, 2.11541748046875, 2.2454833984375, 2.37554931640625, 2.505615234375, 2.63568115234375, 2.7657470703125, 2.89581298828125, 3.02587890625, 3.15594482421875, 3.2860107421875, 3.41607666015625, 3.546142578125, 3.67620849609375, 3.8062744140625, 3.93634033203125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 3.0, 15.0, 10.0, 19.0, 25.0, 47.0, 63.0, 91.0, 125.0, 194.0, 296.0, 433.0, 720.0, 1195.0, 1816.0, 2996.0, 4833.0, 8690.0, 14858.0, 26382.0, 46171.0, 79822.0, 125716.0, 170667.0, 180963.0, 147400.0, 97897.0, 58227.0, 33236.0, 18851.0, 10844.0, 6154.0, 3639.0, 2275.0, 1386.0, 882.0, 568.0, 342.0, 247.0, 144.0, 93.0, 73.0, 41.0, 29.0, 30.0, 19.0, 3.0, 4.0, 5.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0859375, -3.95501708984375, -3.8240966796875, -3.69317626953125, -3.562255859375, -3.43133544921875, -3.3004150390625, -3.16949462890625, -3.03857421875, -2.90765380859375, -2.7767333984375, -2.64581298828125, -2.514892578125, -2.38397216796875, -2.2530517578125, -2.12213134765625, -1.9912109375, -1.86029052734375, -1.7293701171875, -1.59844970703125, -1.467529296875, -1.33660888671875, -1.2056884765625, -1.07476806640625, -0.94384765625, -0.81292724609375, -0.6820068359375, -0.55108642578125, -0.420166015625, -0.28924560546875, -0.1583251953125, -0.02740478515625, 0.103515625, 0.23443603515625, 0.3653564453125, 0.49627685546875, 0.627197265625, 0.75811767578125, 0.8890380859375, 1.01995849609375, 1.15087890625, 1.28179931640625, 1.4127197265625, 1.54364013671875, 1.674560546875, 1.80548095703125, 1.9364013671875, 2.06732177734375, 2.1982421875, 2.32916259765625, 2.4600830078125, 2.59100341796875, 2.721923828125, 2.85284423828125, 2.9837646484375, 3.11468505859375, 3.24560546875, 3.37652587890625, 3.5074462890625, 3.63836669921875, 3.769287109375, 3.90020751953125, 4.0311279296875, 4.16204833984375, 4.29296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 3.0, 9.0, 13.0, 17.0, 14.0, 19.0, 36.0, 30.0, 47.0, 50.0, 61.0, 71.0, 86.0, 66.0, 60.0, 63.0, 68.0, 44.0, 38.0, 44.0, 21.0, 26.0, 17.0, 16.0, 12.0, 16.0, 8.0, 2.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005102157592773438, -0.0004954151809215546, -0.0004806146025657654, -0.0004658140242099762, -0.000451013445854187, -0.00043621286749839783, -0.00042141228914260864, -0.00040661171078681946, -0.0003918111324310303, -0.0003770105540752411, -0.0003622099757194519, -0.0003474093973636627, -0.00033260881900787354, -0.00031780824065208435, -0.00030300766229629517, -0.000288207083940506, -0.0002734065055847168, -0.0002586059272289276, -0.00024380534887313843, -0.00022900477051734924, -0.00021420419216156006, -0.00019940361380577087, -0.0001846030354499817, -0.0001698024570941925, -0.00015500187873840332, -0.00014020130038261414, -0.00012540072202682495, -0.00011060014367103577, -9.579956531524658e-05, -8.09989869594574e-05, -6.619840860366821e-05, -5.139783024787903e-05, -3.6597251892089844e-05, -2.179667353630066e-05, -6.996095180511475e-06, 7.80448317527771e-06, 2.2605061531066895e-05, 3.740563988685608e-05, 5.2206218242645264e-05, 6.700679659843445e-05, 8.180737495422363e-05, 9.660795331001282e-05, 0.000111408531665802, 0.0001262091100215912, 0.00014100968837738037, 0.00015581026673316956, 0.00017061084508895874, 0.00018541142344474792, 0.0002002120018005371, 0.0002150125801563263, 0.00022981315851211548, 0.00024461373686790466, 0.00025941431522369385, 0.00027421489357948303, 0.0002890154719352722, 0.0003038160502910614, 0.0003186166286468506, 0.00033341720700263977, 0.00034821778535842896, 0.00036301836371421814, 0.0003778189420700073, 0.0003926195204257965, 0.0004074200987815857, 0.0004222206771373749, 0.00043702125549316406]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 10.0, 14.0, 27.0, 50.0, 67.0, 81.0, 117.0, 170.0, 266.0, 431.0, 694.0, 1045.0, 1694.0, 2659.0, 4658.0, 7731.0, 13490.0, 24031.0, 42880.0, 76789.0, 124727.0, 174583.0, 188610.0, 151719.0, 98752.0, 57985.0, 32072.0, 17849.0, 10006.0, 5961.0, 3511.0, 2121.0, 1316.0, 819.0, 523.0, 368.0, 234.0, 142.0, 125.0, 74.0, 51.0, 28.0, 25.0, 16.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.8359375, -4.69049072265625, -4.5450439453125, -4.39959716796875, -4.254150390625, -4.10870361328125, -3.9632568359375, -3.81781005859375, -3.67236328125, -3.52691650390625, -3.3814697265625, -3.23602294921875, -3.090576171875, -2.94512939453125, -2.7996826171875, -2.65423583984375, -2.5087890625, -2.36334228515625, -2.2178955078125, -2.07244873046875, -1.927001953125, -1.78155517578125, -1.6361083984375, -1.49066162109375, -1.34521484375, -1.19976806640625, -1.0543212890625, -0.90887451171875, -0.763427734375, -0.61798095703125, -0.4725341796875, -0.32708740234375, -0.181640625, -0.03619384765625, 0.1092529296875, 0.25469970703125, 0.400146484375, 0.54559326171875, 0.6910400390625, 0.83648681640625, 0.98193359375, 1.12738037109375, 1.2728271484375, 1.41827392578125, 1.563720703125, 1.70916748046875, 1.8546142578125, 2.00006103515625, 2.1455078125, 2.29095458984375, 2.4364013671875, 2.58184814453125, 2.727294921875, 2.87274169921875, 3.0181884765625, 3.16363525390625, 3.30908203125, 3.45452880859375, 3.5999755859375, 3.74542236328125, 3.890869140625, 4.03631591796875, 4.1817626953125, 4.32720947265625, 4.47265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 9.0, 6.0, 4.0, 13.0, 12.0, 14.0, 13.0, 23.0, 26.0, 34.0, 42.0, 55.0, 54.0, 53.0, 68.0, 60.0, 66.0, 60.0, 65.0, 58.0, 56.0, 42.0, 20.0, 30.0, 21.0, 12.0, 15.0, 13.0, 15.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5048828125, -1.4627532958984375, -1.420623779296875, -1.3784942626953125, -1.33636474609375, -1.2942352294921875, -1.252105712890625, -1.2099761962890625, -1.1678466796875, -1.1257171630859375, -1.083587646484375, -1.0414581298828125, -0.99932861328125, -0.9571990966796875, -0.915069580078125, -0.8729400634765625, -0.830810546875, -0.7886810302734375, -0.746551513671875, -0.7044219970703125, -0.66229248046875, -0.6201629638671875, -0.578033447265625, -0.5359039306640625, -0.4937744140625, -0.4516448974609375, -0.409515380859375, -0.3673858642578125, -0.32525634765625, -0.2831268310546875, -0.240997314453125, -0.1988677978515625, -0.15673828125, -0.1146087646484375, -0.072479248046875, -0.0303497314453125, 0.01177978515625, 0.0539093017578125, 0.096038818359375, 0.1381683349609375, 0.1802978515625, 0.2224273681640625, 0.264556884765625, 0.3066864013671875, 0.34881591796875, 0.3909454345703125, 0.433074951171875, 0.4752044677734375, 0.517333984375, 0.5594635009765625, 0.601593017578125, 0.6437225341796875, 0.68585205078125, 0.7279815673828125, 0.770111083984375, 0.8122406005859375, 0.8543701171875, 0.8964996337890625, 0.938629150390625, 0.9807586669921875, 1.02288818359375, 1.0650177001953125, 1.107147216796875, 1.1492767333984375, 1.19140625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 8.0, 6.0, 8.0, 10.0, 12.0, 25.0, 14.0, 24.0, 34.0, 26.0, 36.0, 41.0, 55.0, 48.0, 42.0, 54.0, 55.0, 62.0, 65.0, 49.0, 51.0, 42.0, 46.0, 41.0, 34.0, 15.0, 21.0, 24.0, 12.0, 12.0, 6.0, 9.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.650629043579102, -10.352104187011719, -10.053580284118652, -9.75505542755127, -9.456531524658203, -9.15800666809082, -8.859481811523438, -8.560957908630371, -8.262433052062988, -7.963908672332764, -7.665384292602539, -7.366859436035156, -7.068335056304932, -6.769810676574707, -6.471286296844482, -6.172761917114258, -5.874237537384033, -5.575713157653809, -5.277188777923584, -4.978664398193359, -4.680139541625977, -4.381615161895752, -4.083090782165527, -3.7845661640167236, -3.486041784286499, -3.1875174045562744, -2.8889927864074707, -2.590468406677246, -2.2919440269470215, -1.9934194087982178, -1.6948950290679932, -1.3963704109191895, -1.0978460311889648, -0.7993215322494507, -0.5007970929145813, -0.20227265357971191, 0.09625184535980225, 0.3947763442993164, 0.693300724029541, 0.9918253421783447, 1.2903497219085693, 1.5888742208480835, 1.8873987197875977, 2.1859230995178223, 2.484447479248047, 2.7829720973968506, 3.081496477127075, 3.380021095275879, 3.6785454750061035, 3.977069854736328, 4.275594234466553, 4.574118614196777, 4.87264347076416, 5.171167850494385, 5.469692230224609, 5.768217086791992, 6.066740989685059, 6.365265369415283, 6.663789749145508, 6.962314605712891, 7.260838985443115, 7.55936336517334, 7.8578877449035645, 8.156412124633789, 8.454936981201172]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 13.0, 12.0, 19.0, 19.0, 18.0, 26.0, 20.0, 26.0, 32.0, 34.0, 36.0, 37.0, 31.0, 43.0, 49.0, 50.0, 34.0, 37.0, 42.0, 37.0, 40.0, 30.0, 39.0, 37.0, 27.0, 25.0, 29.0, 23.0, 23.0, 16.0, 18.0, 10.0, 8.0, 13.0, 9.0, 9.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.264275074005127, -6.079763412475586, -5.895252227783203, -5.710740566253662, -5.526229381561279, -5.341717720031738, -5.1572065353393555, -4.9726948738098145, -4.788183689117432, -4.603672027587891, -4.419160842895508, -4.234649181365967, -4.050137996673584, -3.865626573562622, -3.68111515045166, -3.496603488922119, -3.3120920658111572, -3.1275806427001953, -2.9430692195892334, -2.7585577964782715, -2.5740463733673096, -2.3895349502563477, -2.2050232887268066, -2.020512104034424, -1.8360005617141724, -1.6514891386032104, -1.4669777154922485, -1.282466173171997, -1.0979547500610352, -0.913443386554718, -0.7289319038391113, -0.5444204807281494, -0.3599090576171875, -0.1753976196050644, 0.009113818407058716, 0.19362527132034302, 0.37813669443130493, 0.5626481175422668, 0.7471596002578735, 0.9316710233688354, 1.1161824464797974, 1.3006938695907593, 1.4852052927017212, 1.6697168350219727, 1.8542282581329346, 2.0387396812438965, 2.2232511043548584, 2.4077625274658203, 2.5922739505767822, 2.776785373687744, 2.961296796798706, 3.145808219909668, 3.33031964302063, 3.514831066131592, 3.699342727661133, 3.8838539123535156, 4.068365573883057, 4.252877235412598, 4.4373884201049805, 4.6219000816345215, 4.806411266326904, 4.990922927856445, 5.175434112548828, 5.359945774078369, 5.544456958770752]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 19.0, 22.0, 27.0, 37.0, 68.0, 103.0, 165.0, 216.0, 318.0, 554.0, 766.0, 1223.0, 1942.0, 3110.0, 5101.0, 8688.0, 15240.0, 27559.0, 51448.0, 101181.0, 207114.0, 427300.0, 767312.0, 963519.0, 758700.0, 424153.0, 209678.0, 103656.0, 52238.0, 27649.0, 14766.0, 8443.0, 4816.0, 2732.0, 1664.0, 1050.0, 610.0, 431.0, 248.0, 145.0, 83.0, 60.0, 41.0, 27.0, 19.0, 14.0, 9.0, 6.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.0078125, -9.7176513671875, -9.427490234375, -9.1373291015625, -8.84716796875, -8.5570068359375, -8.266845703125, -7.9766845703125, -7.6865234375, -7.3963623046875, -7.106201171875, -6.8160400390625, -6.52587890625, -6.2357177734375, -5.945556640625, -5.6553955078125, -5.365234375, -5.0750732421875, -4.784912109375, -4.4947509765625, -4.20458984375, -3.9144287109375, -3.624267578125, -3.3341064453125, -3.0439453125, -2.7537841796875, -2.463623046875, -2.1734619140625, -1.88330078125, -1.5931396484375, -1.302978515625, -1.0128173828125, -0.72265625, -0.4324951171875, -0.142333984375, 0.1478271484375, 0.43798828125, 0.7281494140625, 1.018310546875, 1.3084716796875, 1.5986328125, 1.8887939453125, 2.178955078125, 2.4691162109375, 2.75927734375, 3.0494384765625, 3.339599609375, 3.6297607421875, 3.919921875, 4.2100830078125, 4.500244140625, 4.7904052734375, 5.08056640625, 5.3707275390625, 5.660888671875, 5.9510498046875, 6.2412109375, 6.5313720703125, 6.821533203125, 7.1116943359375, 7.40185546875, 7.6920166015625, 7.982177734375, 8.2723388671875, 8.5625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 5.0, 7.0, 15.0, 11.0, 24.0, 14.0, 15.0, 22.0, 23.0, 32.0, 26.0, 35.0, 40.0, 41.0, 41.0, 43.0, 46.0, 49.0, 42.0, 35.0, 43.0, 31.0, 25.0, 40.0, 31.0, 35.0, 32.0, 29.0, 27.0, 25.0, 17.0, 15.0, 15.0, 11.0, 12.0, 4.0, 13.0, 4.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.1875, -5.01556396484375, -4.8436279296875, -4.67169189453125, -4.499755859375, -4.32781982421875, -4.1558837890625, -3.98394775390625, -3.81201171875, -3.64007568359375, -3.4681396484375, -3.29620361328125, -3.124267578125, -2.95233154296875, -2.7803955078125, -2.60845947265625, -2.4365234375, -2.26458740234375, -2.0926513671875, -1.92071533203125, -1.748779296875, -1.57684326171875, -1.4049072265625, -1.23297119140625, -1.06103515625, -0.88909912109375, -0.7171630859375, -0.54522705078125, -0.373291015625, -0.20135498046875, -0.0294189453125, 0.14251708984375, 0.314453125, 0.48638916015625, 0.6583251953125, 0.83026123046875, 1.002197265625, 1.17413330078125, 1.3460693359375, 1.51800537109375, 1.68994140625, 1.86187744140625, 2.0338134765625, 2.20574951171875, 2.377685546875, 2.54962158203125, 2.7215576171875, 2.89349365234375, 3.0654296875, 3.23736572265625, 3.4093017578125, 3.58123779296875, 3.753173828125, 3.92510986328125, 4.0970458984375, 4.26898193359375, 4.44091796875, 4.61285400390625, 4.7847900390625, 4.95672607421875, 5.128662109375, 5.30059814453125, 5.4725341796875, 5.64447021484375, 5.81640625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 4.0, 18.0, 19.0, 45.0, 47.0, 90.0, 114.0, 198.0, 253.0, 389.0, 617.0, 973.0, 1584.0, 2613.0, 4212.0, 7009.0, 11938.0, 20688.0, 35840.0, 64739.0, 117119.0, 211301.0, 371836.0, 594448.0, 776310.0, 736693.0, 522398.0, 312973.0, 175267.0, 97050.0, 54132.0, 30011.0, 17441.0, 10175.0, 5935.0, 3721.0, 2251.0, 1371.0, 844.0, 554.0, 383.0, 238.0, 149.0, 93.0, 52.0, 50.0, 29.0, 21.0, 8.0, 11.0, 6.0, 7.0, 0.0, 5.0, 3.0, 2.0, 2.0], "bins": [-10.359375, -10.0340576171875, -9.708740234375, -9.3834228515625, -9.05810546875, -8.7327880859375, -8.407470703125, -8.0821533203125, -7.7568359375, -7.4315185546875, -7.106201171875, -6.7808837890625, -6.45556640625, -6.1302490234375, -5.804931640625, -5.4796142578125, -5.154296875, -4.8289794921875, -4.503662109375, -4.1783447265625, -3.85302734375, -3.5277099609375, -3.202392578125, -2.8770751953125, -2.5517578125, -2.2264404296875, -1.901123046875, -1.5758056640625, -1.25048828125, -0.9251708984375, -0.599853515625, -0.2745361328125, 0.05078125, 0.3760986328125, 0.701416015625, 1.0267333984375, 1.35205078125, 1.6773681640625, 2.002685546875, 2.3280029296875, 2.6533203125, 2.9786376953125, 3.303955078125, 3.6292724609375, 3.95458984375, 4.2799072265625, 4.605224609375, 4.9305419921875, 5.255859375, 5.5811767578125, 5.906494140625, 6.2318115234375, 6.55712890625, 6.8824462890625, 7.207763671875, 7.5330810546875, 7.8583984375, 8.1837158203125, 8.509033203125, 8.8343505859375, 9.15966796875, 9.4849853515625, 9.810302734375, 10.1356201171875, 10.4609375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 27.0, 37.0, 47.0, 50.0, 72.0, 70.0, 111.0, 158.0, 150.0, 181.0, 203.0, 264.0, 296.0, 276.0, 294.0, 287.0, 265.0, 241.0, 214.0, 188.0, 132.0, 105.0, 88.0, 71.0, 58.0, 38.0, 38.0, 28.0, 13.0, 17.0, 11.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.73828125, -4.61676025390625, -4.4952392578125, -4.37371826171875, -4.252197265625, -4.13067626953125, -4.0091552734375, -3.88763427734375, -3.76611328125, -3.64459228515625, -3.5230712890625, -3.40155029296875, -3.280029296875, -3.15850830078125, -3.0369873046875, -2.91546630859375, -2.7939453125, -2.67242431640625, -2.5509033203125, -2.42938232421875, -2.307861328125, -2.18634033203125, -2.0648193359375, -1.94329833984375, -1.82177734375, -1.70025634765625, -1.5787353515625, -1.45721435546875, -1.335693359375, -1.21417236328125, -1.0926513671875, -0.97113037109375, -0.849609375, -0.72808837890625, -0.6065673828125, -0.48504638671875, -0.363525390625, -0.24200439453125, -0.1204833984375, 0.00103759765625, 0.12255859375, 0.24407958984375, 0.3656005859375, 0.48712158203125, 0.608642578125, 0.73016357421875, 0.8516845703125, 0.97320556640625, 1.0947265625, 1.21624755859375, 1.3377685546875, 1.45928955078125, 1.580810546875, 1.70233154296875, 1.8238525390625, 1.94537353515625, 2.06689453125, 2.18841552734375, 2.3099365234375, 2.43145751953125, 2.552978515625, 2.67449951171875, 2.7960205078125, 2.91754150390625, 3.0390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 5.0, 6.0, 10.0, 10.0, 17.0, 14.0, 18.0, 32.0, 32.0, 30.0, 41.0, 42.0, 55.0, 56.0, 61.0, 65.0, 65.0, 50.0, 64.0, 46.0, 38.0, 43.0, 37.0, 31.0, 28.0, 24.0, 20.0, 14.0, 11.0, 9.0, 8.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.759474754333496, -13.364616394042969, -12.969757080078125, -12.574898719787598, -12.18004035949707, -11.785181999206543, -11.390323638916016, -10.995464324951172, -10.600605964660645, -10.205747604370117, -9.810888290405273, -9.416029930114746, -9.021171569824219, -8.626313209533691, -8.231454849243164, -7.83659553527832, -7.441737174987793, -7.046878814697266, -6.65201997756958, -6.2571611404418945, -5.862302780151367, -5.46744441986084, -5.072585582733154, -4.677726745605469, -4.282868385314941, -3.888009786605835, -3.4931511878967285, -3.098292589187622, -2.7034339904785156, -2.308575391769409, -1.9137167930603027, -1.5188581943511963, -1.1240005493164062, -0.7291419506072998, -0.33428335189819336, 0.060575246810913086, 0.45543384552001953, 0.850292444229126, 1.2451510429382324, 1.6400096416473389, 2.0348682403564453, 2.4297268390655518, 2.824585437774658, 3.2194440364837646, 3.614302635192871, 4.009160995483398, 4.404019832611084, 4.7988786697387695, 5.193737030029297, 5.588595390319824, 5.98345422744751, 6.378313064575195, 6.773171424865723, 7.16802978515625, 7.5628886222839355, 7.957747459411621, 8.352605819702148, 8.747464179992676, 9.142322540283203, 9.537181854248047, 9.932040214538574, 10.326898574829102, 10.721757888793945, 11.116616249084473, 11.511474609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 6.0, 10.0, 8.0, 16.0, 16.0, 14.0, 19.0, 20.0, 18.0, 27.0, 28.0, 13.0, 36.0, 34.0, 27.0, 50.0, 34.0, 40.0, 37.0, 38.0, 33.0, 42.0, 50.0, 34.0, 35.0, 33.0, 37.0, 28.0, 35.0, 21.0, 24.0, 23.0, 17.0, 18.0, 18.0, 7.0, 13.0, 13.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.569639205932617, -6.363455295562744, -6.157271385192871, -5.95108699798584, -5.744903087615967, -5.538719177246094, -5.332535266876221, -5.126351356506348, -4.920166969299316, -4.713983058929443, -4.50779914855957, -4.301614761352539, -4.095430850982666, -3.889246940612793, -3.68306303024292, -3.4768788814544678, -3.2706949710845947, -3.0645110607147217, -2.8583269119262695, -2.6521430015563965, -2.4459588527679443, -2.2397749423980713, -2.033590793609619, -1.827406883239746, -1.6212228536605835, -1.415038824081421, -1.2088547945022583, -1.0026707649230957, -0.7964867949485779, -0.5903028249740601, -0.38411879539489746, -0.17793476581573486, 0.028249263763427734, 0.23443327844142914, 0.44061729311943054, 0.6468012928962708, 0.8529853224754333, 1.0591692924499512, 1.2653533220291138, 1.4715373516082764, 1.677721381187439, 1.8839054107666016, 2.0900893211364746, 2.2962734699249268, 2.5024573802948, 2.708641529083252, 2.914825439453125, 3.121009349822998, 3.32719349861145, 3.5333774089813232, 3.7395615577697754, 3.9457454681396484, 4.1519293785095215, 4.3581132888793945, 4.564297676086426, 4.770481586456299, 4.976665496826172, 5.182849407196045, 5.389033317565918, 5.595217704772949, 5.801401615142822, 6.007585525512695, 6.213769435882568, 6.419953346252441, 6.626137733459473]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 9.0, 18.0, 23.0, 32.0, 60.0, 67.0, 128.0, 201.0, 292.0, 444.0, 774.0, 1144.0, 2008.0, 3053.0, 5206.0, 8671.0, 14477.0, 24862.0, 42141.0, 69471.0, 110331.0, 155324.0, 178288.0, 153745.0, 108365.0, 67847.0, 41207.0, 24246.0, 14281.0, 8375.0, 5058.0, 3184.0, 1971.0, 1200.0, 724.0, 485.0, 291.0, 183.0, 138.0, 76.0, 43.0, 33.0, 25.0, 13.0, 17.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.806640625, -0.7818069458007812, -0.7569732666015625, -0.7321395874023438, -0.707305908203125, -0.6824722290039062, -0.6576385498046875, -0.6328048706054688, -0.60797119140625, -0.5831375122070312, -0.5583038330078125, -0.5334701538085938, -0.508636474609375, -0.48380279541015625, -0.4589691162109375, -0.43413543701171875, -0.4093017578125, -0.38446807861328125, -0.3596343994140625, -0.33480072021484375, -0.309967041015625, -0.28513336181640625, -0.2602996826171875, -0.23546600341796875, -0.21063232421875, -0.18579864501953125, -0.1609649658203125, -0.13613128662109375, -0.111297607421875, -0.08646392822265625, -0.0616302490234375, -0.03679656982421875, -0.011962890625, 0.01287078857421875, 0.0377044677734375, 0.06253814697265625, 0.087371826171875, 0.11220550537109375, 0.1370391845703125, 0.16187286376953125, 0.18670654296875, 0.21154022216796875, 0.2363739013671875, 0.26120758056640625, 0.286041259765625, 0.31087493896484375, 0.3357086181640625, 0.36054229736328125, 0.3853759765625, 0.41020965576171875, 0.4350433349609375, 0.45987701416015625, 0.484710693359375, 0.5095443725585938, 0.5343780517578125, 0.5592117309570312, 0.58404541015625, 0.6088790893554688, 0.6337127685546875, 0.6585464477539062, 0.683380126953125, 0.7082138061523438, 0.7330474853515625, 0.7578811645507812, 0.78271484375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 8.0, 12.0, 9.0, 10.0, 13.0, 13.0, 23.0, 21.0, 27.0, 34.0, 23.0, 28.0, 27.0, 34.0, 36.0, 36.0, 38.0, 47.0, 47.0, 47.0, 34.0, 29.0, 37.0, 34.0, 35.0, 33.0, 32.0, 28.0, 31.0, 27.0, 26.0, 26.0, 17.0, 12.0, 12.0, 7.0, 10.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.015625, -6.7830810546875, -6.550537109375, -6.3179931640625, -6.08544921875, -5.8529052734375, -5.620361328125, -5.3878173828125, -5.1552734375, -4.9227294921875, -4.690185546875, -4.4576416015625, -4.22509765625, -3.9925537109375, -3.760009765625, -3.5274658203125, -3.294921875, -3.0623779296875, -2.829833984375, -2.5972900390625, -2.36474609375, -2.1322021484375, -1.899658203125, -1.6671142578125, -1.4345703125, -1.2020263671875, -0.969482421875, -0.7369384765625, -0.50439453125, -0.2718505859375, -0.039306640625, 0.1932373046875, 0.42578125, 0.6583251953125, 0.890869140625, 1.1234130859375, 1.35595703125, 1.5885009765625, 1.821044921875, 2.0535888671875, 2.2861328125, 2.5186767578125, 2.751220703125, 2.9837646484375, 3.21630859375, 3.4488525390625, 3.681396484375, 3.9139404296875, 4.146484375, 4.3790283203125, 4.611572265625, 4.8441162109375, 5.07666015625, 5.3092041015625, 5.541748046875, 5.7742919921875, 6.0068359375, 6.2393798828125, 6.471923828125, 6.7044677734375, 6.93701171875, 7.1695556640625, 7.402099609375, 7.6346435546875, 7.8671875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 8.0, 8.0, 10.0, 18.0, 18.0, 24.0, 36.0, 51.0, 47.0, 99.0, 99.0, 133.0, 210.0, 290.0, 451.0, 741.0, 1117.0, 1722.0, 2954.0, 5358.0, 10455.0, 21488.0, 80016.0, 819859.0, 61323.0, 19788.0, 9534.0, 5093.0, 2824.0, 1635.0, 996.0, 647.0, 431.0, 307.0, 240.0, 135.0, 100.0, 77.0, 66.0, 49.0, 26.0, 19.0, 10.0, 16.0, 10.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.517578125, -2.4375, -2.357421875, -2.27734375, -2.197265625, -2.1171875, -2.037109375, -1.95703125, -1.876953125, -1.796875, -1.716796875, -1.63671875, -1.556640625, -1.4765625, -1.396484375, -1.31640625, -1.236328125, -1.15625, -1.076171875, -0.99609375, -0.916015625, -0.8359375, -0.755859375, -0.67578125, -0.595703125, -0.515625, -0.435546875, -0.35546875, -0.275390625, -0.1953125, -0.115234375, -0.03515625, 0.044921875, 0.125, 0.205078125, 0.28515625, 0.365234375, 0.4453125, 0.525390625, 0.60546875, 0.685546875, 0.765625, 0.845703125, 0.92578125, 1.005859375, 1.0859375, 1.166015625, 1.24609375, 1.326171875, 1.40625, 1.486328125, 1.56640625, 1.646484375, 1.7265625, 1.806640625, 1.88671875, 1.966796875, 2.046875, 2.126953125, 2.20703125, 2.287109375, 2.3671875, 2.447265625, 2.52734375, 2.607421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 11.0, 11.0, 8.0, 14.0, 15.0, 25.0, 14.0, 12.0, 17.0, 24.0, 24.0, 26.0, 28.0, 37.0, 32.0, 36.0, 34.0, 29.0, 36.0, 30.0, 40.0, 34.0, 31.0, 35.0, 36.0, 29.0, 35.0, 31.0, 29.0, 29.0, 26.0, 18.0, 22.0, 17.0, 22.0, 14.0, 19.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.69140625, -4.5523681640625, -4.413330078125, -4.2742919921875, -4.13525390625, -3.9962158203125, -3.857177734375, -3.7181396484375, -3.5791015625, -3.4400634765625, -3.301025390625, -3.1619873046875, -3.02294921875, -2.8839111328125, -2.744873046875, -2.6058349609375, -2.466796875, -2.3277587890625, -2.188720703125, -2.0496826171875, -1.91064453125, -1.7716064453125, -1.632568359375, -1.4935302734375, -1.3544921875, -1.2154541015625, -1.076416015625, -0.9373779296875, -0.79833984375, -0.6593017578125, -0.520263671875, -0.3812255859375, -0.2421875, -0.1031494140625, 0.035888671875, 0.1749267578125, 0.31396484375, 0.4530029296875, 0.592041015625, 0.7310791015625, 0.8701171875, 1.0091552734375, 1.148193359375, 1.2872314453125, 1.42626953125, 1.5653076171875, 1.704345703125, 1.8433837890625, 1.982421875, 2.1214599609375, 2.260498046875, 2.3995361328125, 2.53857421875, 2.6776123046875, 2.816650390625, 2.9556884765625, 3.0947265625, 3.2337646484375, 3.372802734375, 3.5118408203125, 3.65087890625, 3.7899169921875, 3.928955078125, 4.0679931640625, 4.20703125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 16.0, 23.0, 28.0, 37.0, 45.0, 88.0, 101.0, 182.0, 284.0, 445.0, 776.0, 1356.0, 2425.0, 4539.0, 8823.0, 18025.0, 47365.0, 884669.0, 43601.0, 17247.0, 8395.0, 4345.0, 2357.0, 1328.0, 756.0, 460.0, 295.0, 185.0, 105.0, 75.0, 58.0, 33.0, 20.0, 19.0, 6.0, 8.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7001953125, -0.677947998046875, -0.65570068359375, -0.633453369140625, -0.6112060546875, -0.588958740234375, -0.56671142578125, -0.544464111328125, -0.522216796875, -0.499969482421875, -0.47772216796875, -0.455474853515625, -0.4332275390625, -0.410980224609375, -0.38873291015625, -0.366485595703125, -0.34423828125, -0.321990966796875, -0.29974365234375, -0.277496337890625, -0.2552490234375, -0.233001708984375, -0.21075439453125, -0.188507080078125, -0.166259765625, -0.144012451171875, -0.12176513671875, -0.099517822265625, -0.0772705078125, -0.055023193359375, -0.03277587890625, -0.010528564453125, 0.01171875, 0.033966064453125, 0.05621337890625, 0.078460693359375, 0.1007080078125, 0.122955322265625, 0.14520263671875, 0.167449951171875, 0.189697265625, 0.211944580078125, 0.23419189453125, 0.256439208984375, 0.2786865234375, 0.300933837890625, 0.32318115234375, 0.345428466796875, 0.36767578125, 0.389923095703125, 0.41217041015625, 0.434417724609375, 0.4566650390625, 0.478912353515625, 0.50115966796875, 0.523406982421875, 0.545654296875, 0.567901611328125, 0.59014892578125, 0.612396240234375, 0.6346435546875, 0.656890869140625, 0.67913818359375, 0.701385498046875, 0.7236328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 1.0, 7.0, 6.0, 4.0, 6.0, 9.0, 8.0, 12.0, 7.0, 15.0, 20.0, 12.0, 19.0, 22.0, 24.0, 25.0, 36.0, 24.0, 33.0, 34.0, 44.0, 39.0, 40.0, 36.0, 31.0, 40.0, 30.0, 36.0, 29.0, 42.0, 34.0, 29.0, 34.0, 28.0, 25.0, 14.0, 18.0, 17.0, 17.0, 19.0, 14.0, 15.0, 5.0, 6.0, 3.0, 8.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3845583200454712e-05, -2.3074448108673096e-05, -2.230331301689148e-05, -2.1532177925109863e-05, -2.0761042833328247e-05, -1.998990774154663e-05, -1.9218772649765015e-05, -1.84476375579834e-05, -1.7676502466201782e-05, -1.6905367374420166e-05, -1.613423228263855e-05, -1.5363097190856934e-05, -1.4591962099075317e-05, -1.3820827007293701e-05, -1.3049691915512085e-05, -1.2278556823730469e-05, -1.1507421731948853e-05, -1.0736286640167236e-05, -9.96515154838562e-06, -9.194016456604004e-06, -8.422881364822388e-06, -7.651746273040771e-06, -6.880611181259155e-06, -6.109476089477539e-06, -5.338340997695923e-06, -4.567205905914307e-06, -3.7960708141326904e-06, -3.0249357223510742e-06, -2.253800630569458e-06, -1.4826655387878418e-06, -7.115304470062256e-07, 5.960464477539063e-08, 8.307397365570068e-07, 1.601874828338623e-06, 2.3730099201202393e-06, 3.1441450119018555e-06, 3.915280103683472e-06, 4.686415195465088e-06, 5.457550287246704e-06, 6.22868537902832e-06, 6.9998204708099365e-06, 7.770955562591553e-06, 8.542090654373169e-06, 9.313225746154785e-06, 1.0084360837936401e-05, 1.0855495929718018e-05, 1.1626631021499634e-05, 1.239776611328125e-05, 1.3168901205062866e-05, 1.3940036296844482e-05, 1.4711171388626099e-05, 1.5482306480407715e-05, 1.625344157218933e-05, 1.7024576663970947e-05, 1.7795711755752563e-05, 1.856684684753418e-05, 1.9337981939315796e-05, 2.0109117031097412e-05, 2.088025212287903e-05, 2.1651387214660645e-05, 2.242252230644226e-05, 2.3193657398223877e-05, 2.3964792490005493e-05, 2.473592758178711e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 16.0, 14.0, 20.0, 33.0, 40.0, 73.0, 91.0, 162.0, 199.0, 307.0, 508.0, 997.0, 1810.0, 3555.0, 7661.0, 17385.0, 41635.0, 103331.0, 235637.0, 317743.0, 184929.0, 76237.0, 30901.0, 13100.0, 5798.0, 2757.0, 1435.0, 836.0, 427.0, 282.0, 195.0, 112.0, 76.0, 62.0, 46.0, 33.0, 27.0, 22.0, 15.0, 12.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.3826026916503906, -0.36750030517578125, -0.3523979187011719, -0.3372955322265625, -0.3221931457519531, -0.30709075927734375, -0.2919883728027344, -0.276885986328125, -0.2617835998535156, -0.24668121337890625, -0.23157882690429688, -0.2164764404296875, -0.20137405395507812, -0.18627166748046875, -0.17116928100585938, -0.15606689453125, -0.14096450805664062, -0.12586212158203125, -0.11075973510742188, -0.0956573486328125, -0.08055496215820312, -0.06545257568359375, -0.050350189208984375, -0.035247802734375, -0.020145416259765625, -0.00504302978515625, 0.010059356689453125, 0.0251617431640625, 0.040264129638671875, 0.05536651611328125, 0.07046890258789062, 0.0855712890625, 0.10067367553710938, 0.11577606201171875, 0.13087844848632812, 0.1459808349609375, 0.16108322143554688, 0.17618560791015625, 0.19128799438476562, 0.206390380859375, 0.22149276733398438, 0.23659515380859375, 0.2516975402832031, 0.2667999267578125, 0.2819023132324219, 0.29700469970703125, 0.3121070861816406, 0.32720947265625, 0.3423118591308594, 0.35741424560546875, 0.3725166320800781, 0.3876190185546875, 0.4027214050292969, 0.41782379150390625, 0.4329261779785156, 0.448028564453125, 0.4631309509277344, 0.47823333740234375, 0.4933357238769531, 0.5084381103515625, 0.5235404968261719, 0.5386428833007812, 0.5537452697753906, 0.56884765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 8.0, 6.0, 13.0, 17.0, 20.0, 19.0, 23.0, 27.0, 34.0, 35.0, 46.0, 60.0, 53.0, 56.0, 59.0, 48.0, 57.0, 53.0, 55.0, 48.0, 37.0, 27.0, 29.0, 19.0, 31.0, 20.0, 24.0, 15.0, 11.0, 12.0, 9.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.092529296875, -0.08972930908203125, -0.0869293212890625, -0.08412933349609375, -0.081329345703125, -0.07852935791015625, -0.0757293701171875, -0.07292938232421875, -0.07012939453125, -0.06732940673828125, -0.0645294189453125, -0.06172943115234375, -0.058929443359375, -0.05612945556640625, -0.0533294677734375, -0.05052947998046875, -0.0477294921875, -0.04492950439453125, -0.0421295166015625, -0.03932952880859375, -0.036529541015625, -0.03372955322265625, -0.0309295654296875, -0.02812957763671875, -0.02532958984375, -0.02252960205078125, -0.0197296142578125, -0.01692962646484375, -0.014129638671875, -0.01132965087890625, -0.0085296630859375, -0.00572967529296875, -0.0029296875, -0.00012969970703125, 0.0026702880859375, 0.00547027587890625, 0.008270263671875, 0.01107025146484375, 0.0138702392578125, 0.01667022705078125, 0.01947021484375, 0.02227020263671875, 0.0250701904296875, 0.02787017822265625, 0.030670166015625, 0.03347015380859375, 0.0362701416015625, 0.03907012939453125, 0.0418701171875, 0.04467010498046875, 0.0474700927734375, 0.05027008056640625, 0.053070068359375, 0.05587005615234375, 0.0586700439453125, 0.06147003173828125, 0.06427001953125, 0.06707000732421875, 0.0698699951171875, 0.07266998291015625, 0.075469970703125, 0.07826995849609375, 0.0810699462890625, 0.08386993408203125, 0.086669921875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 10.0, 14.0, 15.0, 16.0, 27.0, 30.0, 27.0, 41.0, 40.0, 44.0, 54.0, 55.0, 66.0, 58.0, 64.0, 49.0, 66.0, 43.0, 31.0, 49.0, 28.0, 35.0, 25.0, 25.0, 19.0, 13.0, 6.0, 10.0, 7.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.455452919006348, -13.064770698547363, -12.674088478088379, -12.283407211303711, -11.892724990844727, -11.502042770385742, -11.111360549926758, -10.720678329467773, -10.329996109008789, -9.939313888549805, -9.54863166809082, -9.157949447631836, -8.767268180847168, -8.376585960388184, -7.985903739929199, -7.595221519470215, -7.204539775848389, -6.813857555389404, -6.423175811767578, -6.032493591308594, -5.641811370849609, -5.251129150390625, -4.860447406768799, -4.4697651863098145, -4.079083442687988, -3.688401460647583, -3.2977192401885986, -2.9070372581481934, -2.516355037689209, -2.1256730556488037, -1.7349910736083984, -1.344308853149414, -0.9536266326904297, -0.5629445314407349, -0.17226248979568481, 0.21841955184936523, 0.6091016530990601, 0.9997837543487549, 1.3904657363891602, 1.7811479568481445, 2.17182993888855, 2.562511920928955, 2.9531941413879395, 3.3438761234283447, 3.73455810546875, 4.125240325927734, 4.515922546386719, 4.906604766845703, 5.297286510467529, 5.687968730926514, 6.07865047454834, 6.469332695007324, 6.860014915466309, 7.250697135925293, 7.641378879547119, 8.032060623168945, 8.42274284362793, 8.813425064086914, 9.204107284545898, 9.594789505004883, 9.98547077178955, 10.376152992248535, 10.76683521270752, 11.157517433166504, 11.548199653625488]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 3.0, 13.0, 9.0, 17.0, 14.0, 14.0, 21.0, 18.0, 20.0, 28.0, 23.0, 17.0, 33.0, 36.0, 35.0, 38.0, 39.0, 40.0, 39.0, 36.0, 32.0, 46.0, 51.0, 27.0, 39.0, 32.0, 39.0, 29.0, 32.0, 20.0, 23.0, 25.0, 14.0, 17.0, 19.0, 6.0, 13.0, 13.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.5517683029174805, -6.345795631408691, -6.1398234367370605, -5.9338507652282715, -5.727878093719482, -5.521905899047852, -5.3159332275390625, -5.109960556030273, -4.903987884521484, -4.698015213012695, -4.4920430183410645, -4.286070346832275, -4.080097675323486, -3.8741252422332764, -3.6681528091430664, -3.4621801376342773, -3.2562079429626465, -3.0502355098724365, -2.8442628383636475, -2.6382904052734375, -2.4323177337646484, -2.2263453006744385, -2.0203728675842285, -1.814400315284729, -1.6084277629852295, -1.40245521068573, -1.1964826583862305, -0.9905102252960205, -0.784537672996521, -0.5785651206970215, -0.3725926876068115, -0.166620135307312, 0.0393519401550293, 0.24532446265220642, 0.45129698514938354, 0.6572694778442383, 0.8632420301437378, 1.0692145824432373, 1.2751870155334473, 1.4811595678329468, 1.6871321201324463, 1.8931046724319458, 2.0990772247314453, 2.3050496578216553, 2.5110220909118652, 2.7169947624206543, 2.9229671955108643, 3.128939628601074, 3.3349123001098633, 3.5408847332000732, 3.7468574047088623, 3.9528298377990723, 4.158802509307861, 4.364774703979492, 4.570747375488281, 4.77672004699707, 4.982692718505859, 5.188665390014648, 5.394637584686279, 5.600610256195068, 5.806582927703857, 6.012555122375488, 6.218527793884277, 6.424500465393066, 6.630472660064697]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 15.0, 28.0, 21.0, 30.0, 62.0, 76.0, 105.0, 192.0, 239.0, 348.0, 499.0, 773.0, 1181.0, 1806.0, 2907.0, 4703.0, 8132.0, 14097.0, 26150.0, 47564.0, 83948.0, 134435.0, 177946.0, 182407.0, 144607.0, 93684.0, 53896.0, 29445.0, 16049.0, 9009.0, 5171.0, 3129.0, 1947.0, 1312.0, 834.0, 565.0, 393.0, 263.0, 188.0, 114.0, 87.0, 54.0, 42.0, 20.0, 20.0, 16.0, 12.0, 11.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.8046875, -8.5303955078125, -8.256103515625, -7.9818115234375, -7.70751953125, -7.4332275390625, -7.158935546875, -6.8846435546875, -6.6103515625, -6.3360595703125, -6.061767578125, -5.7874755859375, -5.51318359375, -5.2388916015625, -4.964599609375, -4.6903076171875, -4.416015625, -4.1417236328125, -3.867431640625, -3.5931396484375, -3.31884765625, -3.0445556640625, -2.770263671875, -2.4959716796875, -2.2216796875, -1.9473876953125, -1.673095703125, -1.3988037109375, -1.12451171875, -0.8502197265625, -0.575927734375, -0.3016357421875, -0.02734375, 0.2469482421875, 0.521240234375, 0.7955322265625, 1.06982421875, 1.3441162109375, 1.618408203125, 1.8927001953125, 2.1669921875, 2.4412841796875, 2.715576171875, 2.9898681640625, 3.26416015625, 3.5384521484375, 3.812744140625, 4.0870361328125, 4.361328125, 4.6356201171875, 4.909912109375, 5.1842041015625, 5.45849609375, 5.7327880859375, 6.007080078125, 6.2813720703125, 6.5556640625, 6.8299560546875, 7.104248046875, 7.3785400390625, 7.65283203125, 7.9271240234375, 8.201416015625, 8.4757080078125, 8.75]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 12.0, 9.0, 14.0, 11.0, 14.0, 16.0, 24.0, 20.0, 24.0, 29.0, 29.0, 34.0, 32.0, 27.0, 29.0, 39.0, 41.0, 34.0, 39.0, 39.0, 36.0, 30.0, 34.0, 38.0, 43.0, 35.0, 33.0, 21.0, 29.0, 18.0, 21.0, 25.0, 16.0, 18.0, 21.0, 11.0, 13.0, 11.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.73046875, -6.5091552734375, -6.287841796875, -6.0665283203125, -5.84521484375, -5.6239013671875, -5.402587890625, -5.1812744140625, -4.9599609375, -4.7386474609375, -4.517333984375, -4.2960205078125, -4.07470703125, -3.8533935546875, -3.632080078125, -3.4107666015625, -3.189453125, -2.9681396484375, -2.746826171875, -2.5255126953125, -2.30419921875, -2.0828857421875, -1.861572265625, -1.6402587890625, -1.4189453125, -1.1976318359375, -0.976318359375, -0.7550048828125, -0.53369140625, -0.3123779296875, -0.091064453125, 0.1302490234375, 0.3515625, 0.5728759765625, 0.794189453125, 1.0155029296875, 1.23681640625, 1.4581298828125, 1.679443359375, 1.9007568359375, 2.1220703125, 2.3433837890625, 2.564697265625, 2.7860107421875, 3.00732421875, 3.2286376953125, 3.449951171875, 3.6712646484375, 3.892578125, 4.1138916015625, 4.335205078125, 4.5565185546875, 4.77783203125, 4.9991455078125, 5.220458984375, 5.4417724609375, 5.6630859375, 5.8843994140625, 6.105712890625, 6.3270263671875, 6.54833984375, 6.7696533203125, 6.990966796875, 7.2122802734375, 7.43359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 15.0, 22.0, 28.0, 36.0, 46.0, 67.0, 124.0, 162.0, 210.0, 358.0, 541.0, 844.0, 1308.0, 2122.0, 3337.0, 5762.0, 11154.0, 22845.0, 52159.0, 118479.0, 220413.0, 261365.0, 182233.0, 88098.0, 38327.0, 17188.0, 8820.0, 4715.0, 2860.0, 1749.0, 1069.0, 725.0, 427.0, 305.0, 192.0, 144.0, 99.0, 52.0, 55.0, 25.0, 24.0, 12.0, 10.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.34375, -14.8831787109375, -14.422607421875, -13.9620361328125, -13.50146484375, -13.0408935546875, -12.580322265625, -12.1197509765625, -11.6591796875, -11.1986083984375, -10.738037109375, -10.2774658203125, -9.81689453125, -9.3563232421875, -8.895751953125, -8.4351806640625, -7.974609375, -7.5140380859375, -7.053466796875, -6.5928955078125, -6.13232421875, -5.6717529296875, -5.211181640625, -4.7506103515625, -4.2900390625, -3.8294677734375, -3.368896484375, -2.9083251953125, -2.44775390625, -1.9871826171875, -1.526611328125, -1.0660400390625, -0.60546875, -0.1448974609375, 0.315673828125, 0.7762451171875, 1.23681640625, 1.6973876953125, 2.157958984375, 2.6185302734375, 3.0791015625, 3.5396728515625, 4.000244140625, 4.4608154296875, 4.92138671875, 5.3819580078125, 5.842529296875, 6.3031005859375, 6.763671875, 7.2242431640625, 7.684814453125, 8.1453857421875, 8.60595703125, 9.0665283203125, 9.527099609375, 9.9876708984375, 10.4482421875, 10.9088134765625, 11.369384765625, 11.8299560546875, 12.29052734375, 12.7510986328125, 13.211669921875, 13.6722412109375, 14.1328125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 7.0, 6.0, 10.0, 19.0, 14.0, 23.0, 21.0, 18.0, 19.0, 18.0, 19.0, 26.0, 44.0, 27.0, 35.0, 44.0, 39.0, 41.0, 27.0, 53.0, 37.0, 39.0, 36.0, 37.0, 30.0, 31.0, 41.0, 36.0, 29.0, 24.0, 11.0, 18.0, 13.0, 20.0, 13.0, 12.0, 11.0, 8.0, 9.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.30078125, -5.1474609375, -4.994140625, -4.8408203125, -4.6875, -4.5341796875, -4.380859375, -4.2275390625, -4.07421875, -3.9208984375, -3.767578125, -3.6142578125, -3.4609375, -3.3076171875, -3.154296875, -3.0009765625, -2.84765625, -2.6943359375, -2.541015625, -2.3876953125, -2.234375, -2.0810546875, -1.927734375, -1.7744140625, -1.62109375, -1.4677734375, -1.314453125, -1.1611328125, -1.0078125, -0.8544921875, -0.701171875, -0.5478515625, -0.39453125, -0.2412109375, -0.087890625, 0.0654296875, 0.21875, 0.3720703125, 0.525390625, 0.6787109375, 0.83203125, 0.9853515625, 1.138671875, 1.2919921875, 1.4453125, 1.5986328125, 1.751953125, 1.9052734375, 2.05859375, 2.2119140625, 2.365234375, 2.5185546875, 2.671875, 2.8251953125, 2.978515625, 3.1318359375, 3.28515625, 3.4384765625, 3.591796875, 3.7451171875, 3.8984375, 4.0517578125, 4.205078125, 4.3583984375, 4.51171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 8.0, 6.0, 12.0, 15.0, 18.0, 47.0, 50.0, 92.0, 118.0, 209.0, 291.0, 446.0, 682.0, 964.0, 1487.0, 2279.0, 3673.0, 5540.0, 8893.0, 14221.0, 24116.0, 41475.0, 71925.0, 121726.0, 177615.0, 194099.0, 150739.0, 94222.0, 53590.0, 30876.0, 18253.0, 10935.0, 7003.0, 4451.0, 2928.0, 2001.0, 1236.0, 720.0, 513.0, 361.0, 232.0, 169.0, 113.0, 67.0, 50.0, 29.0, 27.0, 17.0, 6.0, 6.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.6484375, -6.4285888671875, -6.208740234375, -5.9888916015625, -5.76904296875, -5.5491943359375, -5.329345703125, -5.1094970703125, -4.8896484375, -4.6697998046875, -4.449951171875, -4.2301025390625, -4.01025390625, -3.7904052734375, -3.570556640625, -3.3507080078125, -3.130859375, -2.9110107421875, -2.691162109375, -2.4713134765625, -2.25146484375, -2.0316162109375, -1.811767578125, -1.5919189453125, -1.3720703125, -1.1522216796875, -0.932373046875, -0.7125244140625, -0.49267578125, -0.2728271484375, -0.052978515625, 0.1668701171875, 0.38671875, 0.6065673828125, 0.826416015625, 1.0462646484375, 1.26611328125, 1.4859619140625, 1.705810546875, 1.9256591796875, 2.1455078125, 2.3653564453125, 2.585205078125, 2.8050537109375, 3.02490234375, 3.2447509765625, 3.464599609375, 3.6844482421875, 3.904296875, 4.1241455078125, 4.343994140625, 4.5638427734375, 4.78369140625, 5.0035400390625, 5.223388671875, 5.4432373046875, 5.6630859375, 5.8829345703125, 6.102783203125, 6.3226318359375, 6.54248046875, 6.7623291015625, 6.982177734375, 7.2020263671875, 7.421875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 15.0, 9.0, 14.0, 25.0, 30.0, 26.0, 28.0, 43.0, 49.0, 53.0, 64.0, 74.0, 65.0, 63.0, 66.0, 54.0, 41.0, 44.0, 39.0, 32.0, 30.0, 23.0, 18.0, 18.0, 7.0, 9.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0006823539733886719, -0.0006618201732635498, -0.0006412863731384277, -0.0006207525730133057, -0.0006002187728881836, -0.0005796849727630615, -0.0005591511726379395, -0.0005386173725128174, -0.0005180835723876953, -0.0004975497722625732, -0.00047701597213745117, -0.0004564821720123291, -0.00043594837188720703, -0.00041541457176208496, -0.0003948807716369629, -0.0003743469715118408, -0.00035381317138671875, -0.0003332793712615967, -0.0003127455711364746, -0.00029221177101135254, -0.00027167797088623047, -0.0002511441707611084, -0.00023061037063598633, -0.00021007657051086426, -0.0001895427703857422, -0.00016900897026062012, -0.00014847517013549805, -0.00012794137001037598, -0.0001074075698852539, -8.687376976013184e-05, -6.633996963500977e-05, -4.5806169509887695e-05, -2.5272369384765625e-05, -4.738569259643555e-06, 1.5795230865478516e-05, 3.6329030990600586e-05, 5.6862831115722656e-05, 7.739663124084473e-05, 9.79304313659668e-05, 0.00011846423149108887, 0.00013899803161621094, 0.000159531831741333, 0.00018006563186645508, 0.00020059943199157715, 0.00022113323211669922, 0.0002416670322418213, 0.00026220083236694336, 0.00028273463249206543, 0.0003032684326171875, 0.00032380223274230957, 0.00034433603286743164, 0.0003648698329925537, 0.0003854036331176758, 0.00040593743324279785, 0.0004264712333679199, 0.000447005033493042, 0.00046753883361816406, 0.00048807263374328613, 0.0005086064338684082, 0.0005291402339935303, 0.0005496740341186523, 0.0005702078342437744, 0.0005907416343688965, 0.0006112754344940186, 0.0006318092346191406]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 20.0, 23.0, 30.0, 49.0, 80.0, 156.0, 198.0, 323.0, 447.0, 807.0, 1241.0, 1956.0, 3018.0, 5184.0, 8589.0, 14171.0, 24929.0, 43293.0, 76179.0, 129863.0, 188642.0, 197682.0, 144733.0, 87379.0, 50112.0, 28230.0, 16387.0, 9754.0, 5806.0, 3439.0, 2191.0, 1292.0, 810.0, 523.0, 355.0, 222.0, 160.0, 85.0, 64.0, 52.0, 30.0, 17.0, 13.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.7520751953125, -6.511962890625, -6.2718505859375, -6.03173828125, -5.7916259765625, -5.551513671875, -5.3114013671875, -5.0712890625, -4.8311767578125, -4.591064453125, -4.3509521484375, -4.11083984375, -3.8707275390625, -3.630615234375, -3.3905029296875, -3.150390625, -2.9102783203125, -2.670166015625, -2.4300537109375, -2.18994140625, -1.9498291015625, -1.709716796875, -1.4696044921875, -1.2294921875, -0.9893798828125, -0.749267578125, -0.5091552734375, -0.26904296875, -0.0289306640625, 0.211181640625, 0.4512939453125, 0.69140625, 0.9315185546875, 1.171630859375, 1.4117431640625, 1.65185546875, 1.8919677734375, 2.132080078125, 2.3721923828125, 2.6123046875, 2.8524169921875, 3.092529296875, 3.3326416015625, 3.57275390625, 3.8128662109375, 4.052978515625, 4.2930908203125, 4.533203125, 4.7733154296875, 5.013427734375, 5.2535400390625, 5.49365234375, 5.7337646484375, 5.973876953125, 6.2139892578125, 6.4541015625, 6.6942138671875, 6.934326171875, 7.1744384765625, 7.41455078125, 7.6546630859375, 7.894775390625, 8.1348876953125, 8.375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 5.0, 11.0, 13.0, 14.0, 18.0, 28.0, 20.0, 26.0, 27.0, 46.0, 48.0, 53.0, 58.0, 67.0, 65.0, 62.0, 58.0, 54.0, 54.0, 54.0, 38.0, 30.0, 24.0, 17.0, 17.0, 19.0, 8.0, 11.0, 2.0, 9.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.99609375, -1.93450927734375, -1.8729248046875, -1.81134033203125, -1.749755859375, -1.68817138671875, -1.6265869140625, -1.56500244140625, -1.50341796875, -1.44183349609375, -1.3802490234375, -1.31866455078125, -1.257080078125, -1.19549560546875, -1.1339111328125, -1.07232666015625, -1.0107421875, -0.94915771484375, -0.8875732421875, -0.82598876953125, -0.764404296875, -0.70281982421875, -0.6412353515625, -0.57965087890625, -0.51806640625, -0.45648193359375, -0.3948974609375, -0.33331298828125, -0.271728515625, -0.21014404296875, -0.1485595703125, -0.08697509765625, -0.025390625, 0.03619384765625, 0.0977783203125, 0.15936279296875, 0.220947265625, 0.28253173828125, 0.3441162109375, 0.40570068359375, 0.46728515625, 0.52886962890625, 0.5904541015625, 0.65203857421875, 0.713623046875, 0.77520751953125, 0.8367919921875, 0.89837646484375, 0.9599609375, 1.02154541015625, 1.0831298828125, 1.14471435546875, 1.206298828125, 1.26788330078125, 1.3294677734375, 1.39105224609375, 1.45263671875, 1.51422119140625, 1.5758056640625, 1.63739013671875, 1.698974609375, 1.76055908203125, 1.8221435546875, 1.88372802734375, 1.9453125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 15.0, 19.0, 24.0, 21.0, 20.0, 40.0, 27.0, 47.0, 49.0, 39.0, 47.0, 61.0, 49.0, 51.0, 60.0, 73.0, 31.0, 33.0, 48.0, 35.0, 31.0, 25.0, 19.0, 12.0, 11.0, 20.0, 17.0, 8.0, 13.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.122962951660156, -11.743892669677734, -11.364823341369629, -10.985753059387207, -10.606683731079102, -10.22761344909668, -9.848543167114258, -9.469472885131836, -9.09040355682373, -8.711333274841309, -8.332263946533203, -7.953193664550781, -7.574123859405518, -7.195054054260254, -6.815983772277832, -6.436913967132568, -6.057844161987305, -5.678774356842041, -5.299704551696777, -4.9206342697143555, -4.541564464569092, -4.162494659423828, -3.7834246158599854, -3.4043545722961426, -3.025284767150879, -2.6462149620056152, -2.2671449184417725, -1.8880749940872192, -1.509005069732666, -1.1299351453781128, -0.7508652210235596, -0.3717951774597168, 0.007274627685546875, 0.3863445520401001, 0.7654144763946533, 1.1444844007492065, 1.5235543251037598, 1.902624249458313, 2.281694173812866, 2.660764217376709, 3.0398340225219727, 3.4189038276672363, 3.797973871231079, 4.177043914794922, 4.5561137199401855, 4.935183525085449, 5.314253807067871, 5.693323612213135, 6.072393417358398, 6.451463222503662, 6.830533027648926, 7.209603309631348, 7.588673114776611, 7.967742919921875, 8.346813201904297, 8.725883483886719, 9.104952812194824, 9.484023094177246, 9.863092422485352, 10.242162704467773, 10.621232986450195, 11.0003023147583, 11.379372596740723, 11.758441925048828, 12.13751220703125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 13.0, 10.0, 11.0, 14.0, 21.0, 21.0, 13.0, 19.0, 24.0, 21.0, 40.0, 30.0, 38.0, 51.0, 43.0, 30.0, 46.0, 35.0, 39.0, 46.0, 30.0, 42.0, 41.0, 29.0, 22.0, 28.0, 27.0, 29.0, 31.0, 17.0, 20.0, 24.0, 11.0, 16.0, 15.0, 15.0, 8.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.735739707946777, -7.48982572555542, -7.2439117431640625, -6.997997760772705, -6.752083778381348, -6.50616979598999, -6.260255813598633, -6.014341831207275, -5.768427848815918, -5.5225138664245605, -5.276599884033203, -5.030685901641846, -4.784771919250488, -4.538857936859131, -4.292943954467773, -4.047029972076416, -3.8011162281036377, -3.5552022457122803, -3.309288263320923, -3.0633742809295654, -2.817460298538208, -2.5715465545654297, -2.3256325721740723, -2.079718589782715, -1.8338044881820679, -1.5878905057907104, -1.341976523399353, -1.0960626602172852, -0.850148618221283, -0.6042346954345703, -0.3583207130432129, -0.11240673065185547, 0.13350725173950195, 0.3794212341308594, 0.6253352165222168, 0.8712491393089294, 1.1171631813049316, 1.3630770444869995, 1.608991026878357, 1.8549050092697144, 2.1008191108703613, 2.3467330932617188, 2.592647075653076, 2.8385610580444336, 3.084475040435791, 3.3303890228271484, 3.576303005218506, 3.8222169876098633, 4.0681304931640625, 4.31404447555542, 4.559958457946777, 4.805872440338135, 5.051786422729492, 5.29770040512085, 5.543614387512207, 5.7895283699035645, 6.035442352294922, 6.281356334686279, 6.527270317077637, 6.773184299468994, 7.019098281860352, 7.265012264251709, 7.510926246643066, 7.756840229034424, 8.002754211425781]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [5.0, 4.0, 10.0, 7.0, 18.0, 28.0, 36.0, 69.0, 87.0, 150.0, 233.0, 367.0, 582.0, 850.0, 1477.0, 2163.0, 3567.0, 6069.0, 10181.0, 17147.0, 30263.0, 52705.0, 97186.0, 180228.0, 335413.0, 581254.0, 807711.0, 798423.0, 562165.0, 321863.0, 172463.0, 91872.0, 50666.0, 28436.0, 16379.0, 9590.0, 5677.0, 3495.0, 2082.0, 1280.0, 766.0, 446.0, 325.0, 183.0, 135.0, 90.0, 54.0, 45.0, 23.0, 11.0, 10.0, 7.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.73388671875, -8.3974609375, -8.06103515625, -7.724609375, -7.38818359375, -7.0517578125, -6.71533203125, -6.37890625, -6.04248046875, -5.7060546875, -5.36962890625, -5.033203125, -4.69677734375, -4.3603515625, -4.02392578125, -3.6875, -3.35107421875, -3.0146484375, -2.67822265625, -2.341796875, -2.00537109375, -1.6689453125, -1.33251953125, -0.99609375, -0.65966796875, -0.3232421875, 0.01318359375, 0.349609375, 0.68603515625, 1.0224609375, 1.35888671875, 1.6953125, 2.03173828125, 2.3681640625, 2.70458984375, 3.041015625, 3.37744140625, 3.7138671875, 4.05029296875, 4.38671875, 4.72314453125, 5.0595703125, 5.39599609375, 5.732421875, 6.06884765625, 6.4052734375, 6.74169921875, 7.078125, 7.41455078125, 7.7509765625, 8.08740234375, 8.423828125, 8.76025390625, 9.0966796875, 9.43310546875, 9.76953125, 10.10595703125, 10.4423828125, 10.77880859375, 11.115234375, 11.45166015625, 11.7880859375, 12.12451171875, 12.4609375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 11.0, 7.0, 10.0, 21.0, 11.0, 17.0, 21.0, 22.0, 31.0, 45.0, 27.0, 27.0, 30.0, 33.0, 43.0, 44.0, 43.0, 47.0, 36.0, 46.0, 42.0, 51.0, 36.0, 33.0, 34.0, 26.0, 31.0, 22.0, 32.0, 22.0, 16.0, 16.0, 12.0, 7.0, 10.0, 8.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.80462646484375, -8.5389404296875, -8.27325439453125, -8.007568359375, -7.74188232421875, -7.4761962890625, -7.21051025390625, -6.94482421875, -6.67913818359375, -6.4134521484375, -6.14776611328125, -5.882080078125, -5.61639404296875, -5.3507080078125, -5.08502197265625, -4.8193359375, -4.55364990234375, -4.2879638671875, -4.02227783203125, -3.756591796875, -3.49090576171875, -3.2252197265625, -2.95953369140625, -2.69384765625, -2.42816162109375, -2.1624755859375, -1.89678955078125, -1.631103515625, -1.36541748046875, -1.0997314453125, -0.83404541015625, -0.568359375, -0.30267333984375, -0.0369873046875, 0.22869873046875, 0.494384765625, 0.76007080078125, 1.0257568359375, 1.29144287109375, 1.55712890625, 1.82281494140625, 2.0885009765625, 2.35418701171875, 2.619873046875, 2.88555908203125, 3.1512451171875, 3.41693115234375, 3.6826171875, 3.94830322265625, 4.2139892578125, 4.47967529296875, 4.745361328125, 5.01104736328125, 5.2767333984375, 5.54241943359375, 5.80810546875, 6.07379150390625, 6.3394775390625, 6.60516357421875, 6.870849609375, 7.13653564453125, 7.4022216796875, 7.66790771484375, 7.93359375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 18.0, 19.0, 37.0, 34.0, 69.0, 96.0, 145.0, 276.0, 357.0, 558.0, 945.0, 1575.0, 2480.0, 3986.0, 6762.0, 11503.0, 20078.0, 35114.0, 64625.0, 118348.0, 219939.0, 399606.0, 654743.0, 843349.0, 738913.0, 477081.0, 269107.0, 145174.0, 78291.0, 42624.0, 24169.0, 13807.0, 8005.0, 4717.0, 2893.0, 1748.0, 1088.0, 673.0, 434.0, 334.0, 183.0, 145.0, 77.0, 53.0, 34.0, 24.0, 13.0, 11.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-16.125, -15.64599609375, -15.1669921875, -14.68798828125, -14.208984375, -13.72998046875, -13.2509765625, -12.77197265625, -12.29296875, -11.81396484375, -11.3349609375, -10.85595703125, -10.376953125, -9.89794921875, -9.4189453125, -8.93994140625, -8.4609375, -7.98193359375, -7.5029296875, -7.02392578125, -6.544921875, -6.06591796875, -5.5869140625, -5.10791015625, -4.62890625, -4.14990234375, -3.6708984375, -3.19189453125, -2.712890625, -2.23388671875, -1.7548828125, -1.27587890625, -0.796875, -0.31787109375, 0.1611328125, 0.64013671875, 1.119140625, 1.59814453125, 2.0771484375, 2.55615234375, 3.03515625, 3.51416015625, 3.9931640625, 4.47216796875, 4.951171875, 5.43017578125, 5.9091796875, 6.38818359375, 6.8671875, 7.34619140625, 7.8251953125, 8.30419921875, 8.783203125, 9.26220703125, 9.7412109375, 10.22021484375, 10.69921875, 11.17822265625, 11.6572265625, 12.13623046875, 12.615234375, 13.09423828125, 13.5732421875, 14.05224609375, 14.53125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 17.0, 20.0, 20.0, 32.0, 38.0, 52.0, 58.0, 58.0, 72.0, 98.0, 137.0, 182.0, 192.0, 227.0, 251.0, 224.0, 255.0, 273.0, 298.0, 246.0, 199.0, 194.0, 186.0, 144.0, 140.0, 108.0, 81.0, 52.0, 49.0, 40.0, 43.0, 30.0, 13.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.36590576171875, -4.2044677734375, -4.04302978515625, -3.881591796875, -3.72015380859375, -3.5587158203125, -3.39727783203125, -3.23583984375, -3.07440185546875, -2.9129638671875, -2.75152587890625, -2.590087890625, -2.42864990234375, -2.2672119140625, -2.10577392578125, -1.9443359375, -1.78289794921875, -1.6214599609375, -1.46002197265625, -1.298583984375, -1.13714599609375, -0.9757080078125, -0.81427001953125, -0.65283203125, -0.49139404296875, -0.3299560546875, -0.16851806640625, -0.007080078125, 0.15435791015625, 0.3157958984375, 0.47723388671875, 0.638671875, 0.80010986328125, 0.9615478515625, 1.12298583984375, 1.284423828125, 1.44586181640625, 1.6072998046875, 1.76873779296875, 1.93017578125, 2.09161376953125, 2.2530517578125, 2.41448974609375, 2.575927734375, 2.73736572265625, 2.8988037109375, 3.06024169921875, 3.2216796875, 3.38311767578125, 3.5445556640625, 3.70599365234375, 3.867431640625, 4.02886962890625, 4.1903076171875, 4.35174560546875, 4.51318359375, 4.67462158203125, 4.8360595703125, 4.99749755859375, 5.158935546875, 5.32037353515625, 5.4818115234375, 5.64324951171875, 5.8046875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 8.0, 5.0, 14.0, 10.0, 14.0, 20.0, 14.0, 27.0, 26.0, 40.0, 35.0, 35.0, 46.0, 54.0, 50.0, 52.0, 53.0, 54.0, 53.0, 47.0, 47.0, 47.0, 37.0, 23.0, 28.0, 39.0, 25.0, 20.0, 14.0, 12.0, 12.0, 4.0, 5.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.755992889404297, -17.209001541137695, -16.662010192871094, -16.115018844604492, -15.56802749633789, -15.021036148071289, -14.474045753479004, -13.927054405212402, -13.3800630569458, -12.8330717086792, -12.286080360412598, -11.739089012145996, -11.192098617553711, -10.64510726928711, -10.098115921020508, -9.551124572753906, -9.004133224487305, -8.457141876220703, -7.910150527954102, -7.363159656524658, -6.816168308258057, -6.269176959991455, -5.722186088562012, -5.17519474029541, -4.628203392028809, -4.081212043762207, -3.5342209339141846, -2.987229824066162, -2.4402384757995605, -1.893247127532959, -1.3462560176849365, -0.7992649078369141, -0.2522735595703125, 0.2947176694869995, 0.8417088985443115, 1.3887001276016235, 1.9356913566589355, 2.482682704925537, 3.0296738147735596, 3.576664924621582, 4.123656272888184, 4.670647621154785, 5.217638969421387, 5.76462984085083, 6.311621189117432, 6.858612537384033, 7.405603408813477, 7.952594757080078, 8.49958610534668, 9.046577453613281, 9.593568801879883, 10.140560150146484, 10.687551498413086, 11.234542846679688, 11.781533241271973, 12.328524589538574, 12.875515937805176, 13.422507286071777, 13.969498634338379, 14.51648998260498, 15.063480377197266, 15.610471725463867, 16.15746307373047, 16.70445442199707, 17.251445770263672]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 8.0, 5.0, 5.0, 6.0, 11.0, 11.0, 10.0, 14.0, 19.0, 19.0, 19.0, 25.0, 18.0, 25.0, 35.0, 27.0, 28.0, 30.0, 43.0, 33.0, 32.0, 38.0, 27.0, 38.0, 38.0, 34.0, 32.0, 34.0, 25.0, 32.0, 23.0, 30.0, 35.0, 26.0, 19.0, 18.0, 16.0, 17.0, 18.0, 16.0, 19.0, 6.0, 11.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.7020845413208, -9.396124839782715, -9.090165138244629, -8.78420639038086, -8.478246688842773, -8.172286987304688, -7.866327285766602, -7.560368061065674, -7.254408836364746, -6.94844913482666, -6.642489910125732, -6.3365302085876465, -6.030570983886719, -5.724611282348633, -5.418651580810547, -5.112692356109619, -4.806732654571533, -4.500772953033447, -4.1948137283325195, -3.8888540267944336, -3.582894802093506, -3.27693510055542, -2.970975637435913, -2.6650161743164062, -2.3590567111968994, -2.0530972480773926, -1.7471377849578857, -1.4411782026290894, -1.1352187395095825, -0.8292592763900757, -0.5232996940612793, -0.21734023094177246, 0.08861923217773438, 0.3945787250995636, 0.7005382180213928, 1.0064977407455444, 1.3124572038650513, 1.618416666984558, 1.9243762493133545, 2.2303357124328613, 2.536295175552368, 2.842254638671875, 3.148214101791382, 3.4541735649108887, 3.7601332664489746, 4.066092491149902, 4.372052192687988, 4.678011894226074, 4.983971118927002, 5.289930820465088, 5.595890045166016, 5.901849746704102, 6.207808971405029, 6.513768672943115, 6.819727897644043, 7.125687599182129, 7.431647300720215, 7.737607002258301, 8.043566703796387, 8.349525451660156, 8.655485153198242, 8.961444854736328, 9.267404556274414, 9.5733642578125, 9.87932300567627]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 9.0, 11.0, 27.0, 27.0, 69.0, 91.0, 125.0, 232.0, 364.0, 584.0, 996.0, 1530.0, 2577.0, 4309.0, 7073.0, 11893.0, 20196.0, 34496.0, 59493.0, 98685.0, 150991.0, 188987.0, 170730.0, 117805.0, 73009.0, 42597.0, 25169.0, 14509.0, 8687.0, 5158.0, 3199.0, 1912.0, 1131.0, 690.0, 431.0, 269.0, 159.0, 94.0, 79.0, 48.0, 30.0, 20.0, 15.0, 10.0, 4.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-1.4033203125, -1.3603973388671875, -1.317474365234375, -1.2745513916015625, -1.23162841796875, -1.1887054443359375, -1.145782470703125, -1.1028594970703125, -1.0599365234375, -1.0170135498046875, -0.974090576171875, -0.9311676025390625, -0.88824462890625, -0.8453216552734375, -0.802398681640625, -0.7594757080078125, -0.716552734375, -0.6736297607421875, -0.630706787109375, -0.5877838134765625, -0.54486083984375, -0.5019378662109375, -0.459014892578125, -0.4160919189453125, -0.3731689453125, -0.3302459716796875, -0.287322998046875, -0.2444000244140625, -0.20147705078125, -0.1585540771484375, -0.115631103515625, -0.0727081298828125, -0.02978515625, 0.0131378173828125, 0.056060791015625, 0.0989837646484375, 0.14190673828125, 0.1848297119140625, 0.227752685546875, 0.2706756591796875, 0.3135986328125, 0.3565216064453125, 0.399444580078125, 0.4423675537109375, 0.48529052734375, 0.5282135009765625, 0.571136474609375, 0.6140594482421875, 0.656982421875, 0.6999053955078125, 0.742828369140625, 0.7857513427734375, 0.82867431640625, 0.8715972900390625, 0.914520263671875, 0.9574432373046875, 1.0003662109375, 1.0432891845703125, 1.086212158203125, 1.1291351318359375, 1.17205810546875, 1.2149810791015625, 1.257904052734375, 1.3008270263671875, 1.34375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 7.0, 4.0, 7.0, 10.0, 8.0, 15.0, 12.0, 15.0, 17.0, 21.0, 31.0, 27.0, 30.0, 34.0, 27.0, 38.0, 36.0, 35.0, 44.0, 44.0, 49.0, 30.0, 32.0, 37.0, 33.0, 32.0, 38.0, 33.0, 32.0, 26.0, 34.0, 24.0, 18.0, 18.0, 18.0, 18.0, 12.0, 12.0, 9.0, 5.0, 8.0, 4.0, 0.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.4921875, -12.1234130859375, -11.754638671875, -11.3858642578125, -11.01708984375, -10.6483154296875, -10.279541015625, -9.9107666015625, -9.5419921875, -9.1732177734375, -8.804443359375, -8.4356689453125, -8.06689453125, -7.6981201171875, -7.329345703125, -6.9605712890625, -6.591796875, -6.2230224609375, -5.854248046875, -5.4854736328125, -5.11669921875, -4.7479248046875, -4.379150390625, -4.0103759765625, -3.6416015625, -3.2728271484375, -2.904052734375, -2.5352783203125, -2.16650390625, -1.7977294921875, -1.428955078125, -1.0601806640625, -0.69140625, -0.3226318359375, 0.046142578125, 0.4149169921875, 0.78369140625, 1.1524658203125, 1.521240234375, 1.8900146484375, 2.2587890625, 2.6275634765625, 2.996337890625, 3.3651123046875, 3.73388671875, 4.1026611328125, 4.471435546875, 4.8402099609375, 5.208984375, 5.5777587890625, 5.946533203125, 6.3153076171875, 6.68408203125, 7.0528564453125, 7.421630859375, 7.7904052734375, 8.1591796875, 8.5279541015625, 8.896728515625, 9.2655029296875, 9.63427734375, 10.0030517578125, 10.371826171875, 10.7406005859375, 11.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 11.0, 20.0, 35.0, 33.0, 46.0, 78.0, 104.0, 118.0, 214.0, 298.0, 435.0, 776.0, 1276.0, 2116.0, 3972.0, 7776.0, 16320.0, 42024.0, 786443.0, 137701.0, 24650.0, 11268.0, 5604.0, 2917.0, 1628.0, 981.0, 580.0, 362.0, 221.0, 175.0, 114.0, 80.0, 43.0, 41.0, 21.0, 16.0, 12.0, 11.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.849609375, -3.715728759765625, -3.58184814453125, -3.447967529296875, -3.3140869140625, -3.180206298828125, -3.04632568359375, -2.912445068359375, -2.778564453125, -2.644683837890625, -2.51080322265625, -2.376922607421875, -2.2430419921875, -2.109161376953125, -1.97528076171875, -1.841400146484375, -1.70751953125, -1.573638916015625, -1.43975830078125, -1.305877685546875, -1.1719970703125, -1.038116455078125, -0.90423583984375, -0.770355224609375, -0.636474609375, -0.502593994140625, -0.36871337890625, -0.234832763671875, -0.1009521484375, 0.032928466796875, 0.16680908203125, 0.300689697265625, 0.4345703125, 0.568450927734375, 0.70233154296875, 0.836212158203125, 0.9700927734375, 1.103973388671875, 1.23785400390625, 1.371734619140625, 1.505615234375, 1.639495849609375, 1.77337646484375, 1.907257080078125, 2.0411376953125, 2.175018310546875, 2.30889892578125, 2.442779541015625, 2.57666015625, 2.710540771484375, 2.84442138671875, 2.978302001953125, 3.1121826171875, 3.246063232421875, 3.37994384765625, 3.513824462890625, 3.647705078125, 3.781585693359375, 3.91546630859375, 4.049346923828125, 4.1832275390625, 4.317108154296875, 4.45098876953125, 4.584869384765625, 4.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 7.0, 5.0, 12.0, 15.0, 16.0, 20.0, 23.0, 18.0, 27.0, 25.0, 28.0, 26.0, 30.0, 37.0, 38.0, 36.0, 40.0, 33.0, 38.0, 41.0, 41.0, 45.0, 37.0, 40.0, 39.0, 48.0, 28.0, 29.0, 22.0, 29.0, 24.0, 20.0, 20.0, 16.0, 6.0, 7.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.7265625, -7.4775390625, -7.228515625, -6.9794921875, -6.73046875, -6.4814453125, -6.232421875, -5.9833984375, -5.734375, -5.4853515625, -5.236328125, -4.9873046875, -4.73828125, -4.4892578125, -4.240234375, -3.9912109375, -3.7421875, -3.4931640625, -3.244140625, -2.9951171875, -2.74609375, -2.4970703125, -2.248046875, -1.9990234375, -1.75, -1.5009765625, -1.251953125, -1.0029296875, -0.75390625, -0.5048828125, -0.255859375, -0.0068359375, 0.2421875, 0.4912109375, 0.740234375, 0.9892578125, 1.23828125, 1.4873046875, 1.736328125, 1.9853515625, 2.234375, 2.4833984375, 2.732421875, 2.9814453125, 3.23046875, 3.4794921875, 3.728515625, 3.9775390625, 4.2265625, 4.4755859375, 4.724609375, 4.9736328125, 5.22265625, 5.4716796875, 5.720703125, 5.9697265625, 6.21875, 6.4677734375, 6.716796875, 6.9658203125, 7.21484375, 7.4638671875, 7.712890625, 7.9619140625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 9.0, 5.0, 17.0, 15.0, 25.0, 30.0, 49.0, 57.0, 96.0, 129.0, 170.0, 254.0, 382.0, 517.0, 836.0, 1167.0, 1884.0, 2714.0, 4381.0, 7050.0, 11797.0, 22009.0, 73907.0, 841025.0, 36589.0, 17271.0, 9673.0, 5833.0, 3620.0, 2292.0, 1498.0, 989.0, 617.0, 484.0, 378.0, 243.0, 170.0, 101.0, 81.0, 63.0, 32.0, 30.0, 23.0, 14.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8271484375, -0.79986572265625, -0.7725830078125, -0.74530029296875, -0.718017578125, -0.69073486328125, -0.6634521484375, -0.63616943359375, -0.60888671875, -0.58160400390625, -0.5543212890625, -0.52703857421875, -0.499755859375, -0.47247314453125, -0.4451904296875, -0.41790771484375, -0.390625, -0.36334228515625, -0.3360595703125, -0.30877685546875, -0.281494140625, -0.25421142578125, -0.2269287109375, -0.19964599609375, -0.17236328125, -0.14508056640625, -0.1177978515625, -0.09051513671875, -0.063232421875, -0.03594970703125, -0.0086669921875, 0.01861572265625, 0.0458984375, 0.07318115234375, 0.1004638671875, 0.12774658203125, 0.155029296875, 0.18231201171875, 0.2095947265625, 0.23687744140625, 0.26416015625, 0.29144287109375, 0.3187255859375, 0.34600830078125, 0.373291015625, 0.40057373046875, 0.4278564453125, 0.45513916015625, 0.482421875, 0.50970458984375, 0.5369873046875, 0.56427001953125, 0.591552734375, 0.61883544921875, 0.6461181640625, 0.67340087890625, 0.70068359375, 0.72796630859375, 0.7552490234375, 0.78253173828125, 0.809814453125, 0.83709716796875, 0.8643798828125, 0.89166259765625, 0.9189453125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 5.0, 1.0, 8.0, 8.0, 7.0, 5.0, 19.0, 20.0, 12.0, 11.0, 18.0, 24.0, 21.0, 26.0, 37.0, 34.0, 36.0, 41.0, 58.0, 48.0, 30.0, 54.0, 54.0, 47.0, 36.0, 39.0, 36.0, 40.0, 27.0, 32.0, 35.0, 27.0, 21.0, 9.0, 11.0, 18.0, 11.0, 8.0, 8.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5762786865234375e-05, -3.473460674285889e-05, -3.37064266204834e-05, -3.267824649810791e-05, -3.165006637573242e-05, -3.0621886253356934e-05, -2.9593706130981445e-05, -2.8565526008605957e-05, -2.753734588623047e-05, -2.650916576385498e-05, -2.5480985641479492e-05, -2.4452805519104004e-05, -2.3424625396728516e-05, -2.2396445274353027e-05, -2.136826515197754e-05, -2.034008502960205e-05, -1.9311904907226562e-05, -1.8283724784851074e-05, -1.7255544662475586e-05, -1.6227364540100098e-05, -1.519918441772461e-05, -1.4171004295349121e-05, -1.3142824172973633e-05, -1.2114644050598145e-05, -1.1086463928222656e-05, -1.0058283805847168e-05, -9.03010368347168e-06, -8.001923561096191e-06, -6.973743438720703e-06, -5.945563316345215e-06, -4.9173831939697266e-06, -3.889203071594238e-06, -2.86102294921875e-06, -1.8328428268432617e-06, -8.046627044677734e-07, 2.2351741790771484e-07, 1.2516975402832031e-06, 2.2798776626586914e-06, 3.3080577850341797e-06, 4.336237907409668e-06, 5.364418029785156e-06, 6.3925981521606445e-06, 7.420778274536133e-06, 8.448958396911621e-06, 9.47713851928711e-06, 1.0505318641662598e-05, 1.1533498764038086e-05, 1.2561678886413574e-05, 1.3589859008789062e-05, 1.461803913116455e-05, 1.564621925354004e-05, 1.6674399375915527e-05, 1.7702579498291016e-05, 1.8730759620666504e-05, 1.9758939743041992e-05, 2.078711986541748e-05, 2.181529998779297e-05, 2.2843480110168457e-05, 2.3871660232543945e-05, 2.4899840354919434e-05, 2.5928020477294922e-05, 2.695620059967041e-05, 2.79843807220459e-05, 2.9012560844421387e-05, 3.0040740966796875e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 10.0, 5.0, 14.0, 21.0, 30.0, 30.0, 61.0, 102.0, 148.0, 265.0, 351.0, 525.0, 790.0, 1276.0, 2000.0, 3231.0, 5389.0, 8569.0, 14668.0, 25077.0, 42856.0, 73323.0, 121559.0, 179500.0, 195575.0, 147362.0, 92709.0, 54384.0, 31865.0, 18355.0, 10925.0, 6657.0, 4012.0, 2469.0, 1560.0, 1006.0, 661.0, 404.0, 287.0, 200.0, 119.0, 76.0, 46.0, 31.0, 21.0, 20.0, 8.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5256805419921875, -0.509857177734375, -0.4940338134765625, -0.47821044921875, -0.4623870849609375, -0.446563720703125, -0.4307403564453125, -0.4149169921875, -0.3990936279296875, -0.383270263671875, -0.3674468994140625, -0.35162353515625, -0.3358001708984375, -0.319976806640625, -0.3041534423828125, -0.288330078125, -0.2725067138671875, -0.256683349609375, -0.2408599853515625, -0.22503662109375, -0.2092132568359375, -0.193389892578125, -0.1775665283203125, -0.1617431640625, -0.1459197998046875, -0.130096435546875, -0.1142730712890625, -0.09844970703125, -0.0826263427734375, -0.066802978515625, -0.0509796142578125, -0.03515625, -0.0193328857421875, -0.003509521484375, 0.0123138427734375, 0.02813720703125, 0.0439605712890625, 0.059783935546875, 0.0756072998046875, 0.0914306640625, 0.1072540283203125, 0.123077392578125, 0.1389007568359375, 0.15472412109375, 0.1705474853515625, 0.186370849609375, 0.2021942138671875, 0.218017578125, 0.2338409423828125, 0.249664306640625, 0.2654876708984375, 0.28131103515625, 0.2971343994140625, 0.312957763671875, 0.3287811279296875, 0.3446044921875, 0.3604278564453125, 0.376251220703125, 0.3920745849609375, 0.40789794921875, 0.4237213134765625, 0.439544677734375, 0.4553680419921875, 0.47119140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 14.0, 13.0, 8.0, 18.0, 16.0, 15.0, 19.0, 39.0, 39.0, 47.0, 55.0, 55.0, 64.0, 68.0, 64.0, 72.0, 55.0, 65.0, 52.0, 41.0, 21.0, 23.0, 29.0, 19.0, 19.0, 13.0, 9.0, 4.0, 6.0, 9.0, 6.0, 2.0, 1.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18789291381835938, -0.18267059326171875, -0.17744827270507812, -0.1722259521484375, -0.16700363159179688, -0.16178131103515625, -0.15655899047851562, -0.151336669921875, -0.14611434936523438, -0.14089202880859375, -0.13566970825195312, -0.1304473876953125, -0.12522506713867188, -0.12000274658203125, -0.11478042602539062, -0.10955810546875, -0.10433578491210938, -0.09911346435546875, -0.09389114379882812, -0.0886688232421875, -0.08344650268554688, -0.07822418212890625, -0.07300186157226562, -0.067779541015625, -0.06255722045898438, -0.05733489990234375, -0.052112579345703125, -0.0468902587890625, -0.041667938232421875, -0.03644561767578125, -0.031223297119140625, -0.0260009765625, -0.020778656005859375, -0.01555633544921875, -0.010334014892578125, -0.0051116943359375, 0.000110626220703125, 0.00533294677734375, 0.010555267333984375, 0.015777587890625, 0.020999908447265625, 0.02622222900390625, 0.031444549560546875, 0.0366668701171875, 0.041889190673828125, 0.04711151123046875, 0.052333831787109375, 0.05755615234375, 0.06277847290039062, 0.06800079345703125, 0.07322311401367188, 0.0784454345703125, 0.08366775512695312, 0.08889007568359375, 0.09411239624023438, 0.099334716796875, 0.10455703735351562, 0.10977935791015625, 0.11500167846679688, 0.1202239990234375, 0.12544631958007812, 0.13066864013671875, 0.13589096069335938, 0.14111328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 6.0, 14.0, 11.0, 13.0, 20.0, 15.0, 19.0, 26.0, 37.0, 37.0, 36.0, 44.0, 47.0, 55.0, 50.0, 54.0, 48.0, 47.0, 54.0, 41.0, 49.0, 42.0, 30.0, 26.0, 35.0, 30.0, 19.0, 18.0, 16.0, 8.0, 7.0, 7.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.071125030517578, -16.5330867767334, -15.995046615600586, -15.457008361816406, -14.91896915435791, -14.380929946899414, -13.842891693115234, -13.304852485656738, -12.766813278198242, -12.228774070739746, -11.69073486328125, -11.15269660949707, -10.614657402038574, -10.076618194580078, -9.538579940795898, -9.000540733337402, -8.462501525878906, -7.92446231842041, -7.386423587799072, -6.848384857177734, -6.310345649719238, -5.772306442260742, -5.234267711639404, -4.696228981018066, -4.15818977355957, -3.6201508045196533, -3.0821118354797363, -2.5440728664398193, -2.0060338973999023, -1.4679949283599854, -0.9299559593200684, -0.39191699028015137, 0.14612388610839844, 0.6841628551483154, 1.2222018241882324, 1.7602407932281494, 2.2982797622680664, 2.8363187313079834, 3.3743577003479004, 3.9123966693878174, 4.450435638427734, 4.9884748458862305, 5.526513576507568, 6.064552307128906, 6.602591514587402, 7.140630722045898, 7.678669452667236, 8.216708183288574, 8.75474739074707, 9.292786598205566, 9.830825805664062, 10.368864059448242, 10.906903266906738, 11.444942474365234, 11.982980728149414, 12.52101993560791, 13.059059143066406, 13.597098350524902, 14.135137557983398, 14.673175811767578, 15.211215019226074, 15.74925422668457, 16.28729248046875, 16.825332641601562, 17.363370895385742]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 7.0, 4.0, 6.0, 5.0, 6.0, 13.0, 10.0, 10.0, 13.0, 19.0, 18.0, 18.0, 27.0, 18.0, 25.0, 32.0, 31.0, 27.0, 29.0, 46.0, 32.0, 31.0, 37.0, 35.0, 33.0, 37.0, 36.0, 28.0, 37.0, 24.0, 34.0, 25.0, 28.0, 34.0, 26.0, 19.0, 16.0, 18.0, 18.0, 16.0, 15.0, 19.0, 7.0, 11.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.865306854248047, -9.556503295898438, -9.247699737548828, -8.938896179199219, -8.63009262084961, -8.321290016174316, -8.012486457824707, -7.703682899475098, -7.394879341125488, -7.086075782775879, -6.7772722244262695, -6.468469142913818, -6.159665584564209, -5.8508620262146, -5.542058944702148, -5.233255386352539, -4.92445182800293, -4.61564826965332, -4.306844711303711, -3.9980416297912598, -3.6892380714416504, -3.380434513092041, -3.0716311931610107, -2.7628278732299805, -2.454024314880371, -2.1452207565307617, -1.8364174365997314, -1.5276139974594116, -1.2188105583190918, -0.910007119178772, -0.6012036800384521, -0.2924003601074219, 0.016402244567871094, 0.3252056837081909, 0.6340091228485107, 0.9428125619888306, 1.2516160011291504, 1.5604194402694702, 1.86922287940979, 2.1780261993408203, 2.4868297576904297, 2.795633316040039, 3.1044366359710693, 3.4132399559020996, 3.722043514251709, 4.030847072601318, 4.3396501541137695, 4.648453712463379, 4.957257270812988, 5.266060829162598, 5.574864387512207, 5.883667469024658, 6.192471027374268, 6.501274585723877, 6.810077667236328, 7.1188812255859375, 7.427684783935547, 7.736488342285156, 8.045291900634766, 8.354095458984375, 8.662899017333984, 8.971701622009277, 9.280505180358887, 9.589308738708496, 9.898112297058105]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 16.0, 15.0, 24.0, 33.0, 70.0, 83.0, 162.0, 247.0, 390.0, 630.0, 1089.0, 1913.0, 3379.0, 6409.0, 11348.0, 21308.0, 38771.0, 68895.0, 113305.0, 161112.0, 184051.0, 162827.0, 114693.0, 70139.0, 39483.0, 21756.0, 11647.0, 6384.0, 3496.0, 1967.0, 1159.0, 662.0, 416.0, 230.0, 162.0, 92.0, 59.0, 36.0, 28.0, 18.0, 8.0, 15.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-12.015625, -11.6461181640625, -11.276611328125, -10.9071044921875, -10.53759765625, -10.1680908203125, -9.798583984375, -9.4290771484375, -9.0595703125, -8.6900634765625, -8.320556640625, -7.9510498046875, -7.58154296875, -7.2120361328125, -6.842529296875, -6.4730224609375, -6.103515625, -5.7340087890625, -5.364501953125, -4.9949951171875, -4.62548828125, -4.2559814453125, -3.886474609375, -3.5169677734375, -3.1474609375, -2.7779541015625, -2.408447265625, -2.0389404296875, -1.66943359375, -1.2999267578125, -0.930419921875, -0.5609130859375, -0.19140625, 0.1781005859375, 0.547607421875, 0.9171142578125, 1.28662109375, 1.6561279296875, 2.025634765625, 2.3951416015625, 2.7646484375, 3.1341552734375, 3.503662109375, 3.8731689453125, 4.24267578125, 4.6121826171875, 4.981689453125, 5.3511962890625, 5.720703125, 6.0902099609375, 6.459716796875, 6.8292236328125, 7.19873046875, 7.5682373046875, 7.937744140625, 8.3072509765625, 8.6767578125, 9.0462646484375, 9.415771484375, 9.7852783203125, 10.15478515625, 10.5242919921875, 10.893798828125, 11.2633056640625, 11.6328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 9.0, 10.0, 16.0, 9.0, 18.0, 23.0, 27.0, 23.0, 36.0, 24.0, 25.0, 40.0, 43.0, 39.0, 38.0, 45.0, 47.0, 46.0, 46.0, 40.0, 44.0, 34.0, 37.0, 43.0, 26.0, 28.0, 36.0, 28.0, 14.0, 23.0, 17.0, 12.0, 13.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.0390625, -12.6461181640625, -12.253173828125, -11.8602294921875, -11.46728515625, -11.0743408203125, -10.681396484375, -10.2884521484375, -9.8955078125, -9.5025634765625, -9.109619140625, -8.7166748046875, -8.32373046875, -7.9307861328125, -7.537841796875, -7.1448974609375, -6.751953125, -6.3590087890625, -5.966064453125, -5.5731201171875, -5.18017578125, -4.7872314453125, -4.394287109375, -4.0013427734375, -3.6083984375, -3.2154541015625, -2.822509765625, -2.4295654296875, -2.03662109375, -1.6436767578125, -1.250732421875, -0.8577880859375, -0.46484375, -0.0718994140625, 0.321044921875, 0.7139892578125, 1.10693359375, 1.4998779296875, 1.892822265625, 2.2857666015625, 2.6787109375, 3.0716552734375, 3.464599609375, 3.8575439453125, 4.25048828125, 4.6434326171875, 5.036376953125, 5.4293212890625, 5.822265625, 6.2152099609375, 6.608154296875, 7.0010986328125, 7.39404296875, 7.7869873046875, 8.179931640625, 8.5728759765625, 8.9658203125, 9.3587646484375, 9.751708984375, 10.1446533203125, 10.53759765625, 10.9305419921875, 11.323486328125, 11.7164306640625, 12.109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 7.0, 19.0, 21.0, 37.0, 48.0, 74.0, 107.0, 169.0, 247.0, 374.0, 612.0, 1005.0, 1660.0, 2869.0, 4783.0, 8542.0, 15858.0, 29247.0, 56062.0, 103252.0, 172553.0, 217229.0, 183935.0, 114379.0, 62566.0, 32618.0, 17423.0, 9641.0, 5345.0, 3053.0, 1798.0, 1060.0, 679.0, 458.0, 270.0, 174.0, 108.0, 83.0, 55.0, 43.0, 31.0, 17.0, 15.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-19.125, -18.5380859375, -17.951171875, -17.3642578125, -16.77734375, -16.1904296875, -15.603515625, -15.0166015625, -14.4296875, -13.8427734375, -13.255859375, -12.6689453125, -12.08203125, -11.4951171875, -10.908203125, -10.3212890625, -9.734375, -9.1474609375, -8.560546875, -7.9736328125, -7.38671875, -6.7998046875, -6.212890625, -5.6259765625, -5.0390625, -4.4521484375, -3.865234375, -3.2783203125, -2.69140625, -2.1044921875, -1.517578125, -0.9306640625, -0.34375, 0.2431640625, 0.830078125, 1.4169921875, 2.00390625, 2.5908203125, 3.177734375, 3.7646484375, 4.3515625, 4.9384765625, 5.525390625, 6.1123046875, 6.69921875, 7.2861328125, 7.873046875, 8.4599609375, 9.046875, 9.6337890625, 10.220703125, 10.8076171875, 11.39453125, 11.9814453125, 12.568359375, 13.1552734375, 13.7421875, 14.3291015625, 14.916015625, 15.5029296875, 16.08984375, 16.6767578125, 17.263671875, 17.8505859375, 18.4375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 13.0, 12.0, 10.0, 16.0, 18.0, 17.0, 13.0, 20.0, 33.0, 21.0, 30.0, 38.0, 42.0, 44.0, 44.0, 48.0, 43.0, 37.0, 47.0, 48.0, 44.0, 47.0, 35.0, 33.0, 24.0, 32.0, 15.0, 33.0, 21.0, 27.0, 18.0, 10.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9375, -6.701904296875, -6.46630859375, -6.230712890625, -5.9951171875, -5.759521484375, -5.52392578125, -5.288330078125, -5.052734375, -4.817138671875, -4.58154296875, -4.345947265625, -4.1103515625, -3.874755859375, -3.63916015625, -3.403564453125, -3.16796875, -2.932373046875, -2.69677734375, -2.461181640625, -2.2255859375, -1.989990234375, -1.75439453125, -1.518798828125, -1.283203125, -1.047607421875, -0.81201171875, -0.576416015625, -0.3408203125, -0.105224609375, 0.13037109375, 0.365966796875, 0.6015625, 0.837158203125, 1.07275390625, 1.308349609375, 1.5439453125, 1.779541015625, 2.01513671875, 2.250732421875, 2.486328125, 2.721923828125, 2.95751953125, 3.193115234375, 3.4287109375, 3.664306640625, 3.89990234375, 4.135498046875, 4.37109375, 4.606689453125, 4.84228515625, 5.077880859375, 5.3134765625, 5.549072265625, 5.78466796875, 6.020263671875, 6.255859375, 6.491455078125, 6.72705078125, 6.962646484375, 7.1982421875, 7.433837890625, 7.66943359375, 7.905029296875, 8.140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 9.0, 11.0, 26.0, 31.0, 45.0, 53.0, 89.0, 134.0, 175.0, 230.0, 340.0, 515.0, 681.0, 947.0, 1463.0, 2214.0, 3277.0, 5222.0, 8441.0, 13862.0, 23301.0, 39998.0, 68952.0, 112389.0, 161351.0, 182344.0, 156916.0, 106713.0, 64578.0, 37127.0, 21955.0, 12818.0, 7762.0, 4865.0, 3041.0, 2000.0, 1394.0, 954.0, 705.0, 477.0, 336.0, 221.0, 168.0, 104.0, 79.0, 77.0, 46.0, 34.0, 22.0, 25.0, 8.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0], "bins": [-9.578125, -9.2828369140625, -8.987548828125, -8.6922607421875, -8.39697265625, -8.1016845703125, -7.806396484375, -7.5111083984375, -7.2158203125, -6.9205322265625, -6.625244140625, -6.3299560546875, -6.03466796875, -5.7393798828125, -5.444091796875, -5.1488037109375, -4.853515625, -4.5582275390625, -4.262939453125, -3.9676513671875, -3.67236328125, -3.3770751953125, -3.081787109375, -2.7864990234375, -2.4912109375, -2.1959228515625, -1.900634765625, -1.6053466796875, -1.31005859375, -1.0147705078125, -0.719482421875, -0.4241943359375, -0.12890625, 0.1663818359375, 0.461669921875, 0.7569580078125, 1.05224609375, 1.3475341796875, 1.642822265625, 1.9381103515625, 2.2333984375, 2.5286865234375, 2.823974609375, 3.1192626953125, 3.41455078125, 3.7098388671875, 4.005126953125, 4.3004150390625, 4.595703125, 4.8909912109375, 5.186279296875, 5.4815673828125, 5.77685546875, 6.0721435546875, 6.367431640625, 6.6627197265625, 6.9580078125, 7.2532958984375, 7.548583984375, 7.8438720703125, 8.13916015625, 8.4344482421875, 8.729736328125, 9.0250244140625, 9.3203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 10.0, 13.0, 22.0, 16.0, 22.0, 38.0, 52.0, 55.0, 46.0, 69.0, 80.0, 81.0, 66.0, 69.0, 71.0, 43.0, 48.0, 38.0, 27.0, 24.0, 17.0, 13.0, 13.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.0016374588012695312, -0.0015962719917297363, -0.0015550851821899414, -0.0015138983726501465, -0.0014727115631103516, -0.0014315247535705566, -0.0013903379440307617, -0.0013491511344909668, -0.0013079643249511719, -0.001266777515411377, -0.001225590705871582, -0.0011844038963317871, -0.0011432170867919922, -0.0011020302772521973, -0.0010608434677124023, -0.0010196566581726074, -0.0009784698486328125, -0.0009372830390930176, -0.0008960962295532227, -0.0008549094200134277, -0.0008137226104736328, -0.0007725358009338379, -0.000731348991394043, -0.000690162181854248, -0.0006489753723144531, -0.0006077885627746582, -0.0005666017532348633, -0.0005254149436950684, -0.00048422813415527344, -0.0004430413246154785, -0.0004018545150756836, -0.00036066770553588867, -0.00031948089599609375, -0.00027829408645629883, -0.0002371072769165039, -0.00019592046737670898, -0.00015473365783691406, -0.00011354684829711914, -7.236003875732422e-05, -3.11732292175293e-05, 1.0013580322265625e-05, 5.120038986206055e-05, 9.238719940185547e-05, 0.0001335740089416504, 0.0001747608184814453, 0.00021594762802124023, 0.00025713443756103516, 0.0002983212471008301, 0.000339508056640625, 0.0003806948661804199, 0.00042188167572021484, 0.00046306848526000977, 0.0005042552947998047, 0.0005454421043395996, 0.0005866289138793945, 0.0006278157234191895, 0.0006690025329589844, 0.0007101893424987793, 0.0007513761520385742, 0.0007925629615783691, 0.0008337497711181641, 0.000874936580657959, 0.0009161233901977539, 0.0009573101997375488, 0.0009984970092773438]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 10.0, 22.0, 27.0, 36.0, 61.0, 76.0, 107.0, 143.0, 228.0, 354.0, 479.0, 786.0, 1113.0, 1630.0, 2717.0, 4018.0, 6463.0, 10238.0, 17417.0, 29917.0, 51659.0, 87266.0, 137393.0, 178373.0, 176341.0, 133329.0, 84709.0, 49992.0, 28935.0, 16909.0, 10116.0, 6105.0, 4069.0, 2532.0, 1671.0, 1074.0, 738.0, 482.0, 311.0, 214.0, 141.0, 119.0, 72.0, 47.0, 31.0, 36.0, 15.0, 6.0, 4.0, 10.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.578125, -9.296142578125, -9.01416015625, -8.732177734375, -8.4501953125, -8.168212890625, -7.88623046875, -7.604248046875, -7.322265625, -7.040283203125, -6.75830078125, -6.476318359375, -6.1943359375, -5.912353515625, -5.63037109375, -5.348388671875, -5.06640625, -4.784423828125, -4.50244140625, -4.220458984375, -3.9384765625, -3.656494140625, -3.37451171875, -3.092529296875, -2.810546875, -2.528564453125, -2.24658203125, -1.964599609375, -1.6826171875, -1.400634765625, -1.11865234375, -0.836669921875, -0.5546875, -0.272705078125, 0.00927734375, 0.291259765625, 0.5732421875, 0.855224609375, 1.13720703125, 1.419189453125, 1.701171875, 1.983154296875, 2.26513671875, 2.547119140625, 2.8291015625, 3.111083984375, 3.39306640625, 3.675048828125, 3.95703125, 4.239013671875, 4.52099609375, 4.802978515625, 5.0849609375, 5.366943359375, 5.64892578125, 5.930908203125, 6.212890625, 6.494873046875, 6.77685546875, 7.058837890625, 7.3408203125, 7.622802734375, 7.90478515625, 8.186767578125, 8.46875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 7.0, 6.0, 6.0, 8.0, 11.0, 20.0, 21.0, 24.0, 24.0, 38.0, 36.0, 52.0, 61.0, 71.0, 65.0, 72.0, 51.0, 55.0, 56.0, 48.0, 41.0, 45.0, 28.0, 25.0, 16.0, 16.0, 12.0, 15.0, 15.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.455078125, -2.377197265625, -2.29931640625, -2.221435546875, -2.1435546875, -2.065673828125, -1.98779296875, -1.909912109375, -1.83203125, -1.754150390625, -1.67626953125, -1.598388671875, -1.5205078125, -1.442626953125, -1.36474609375, -1.286865234375, -1.208984375, -1.131103515625, -1.05322265625, -0.975341796875, -0.8974609375, -0.819580078125, -0.74169921875, -0.663818359375, -0.5859375, -0.508056640625, -0.43017578125, -0.352294921875, -0.2744140625, -0.196533203125, -0.11865234375, -0.040771484375, 0.037109375, 0.114990234375, 0.19287109375, 0.270751953125, 0.3486328125, 0.426513671875, 0.50439453125, 0.582275390625, 0.66015625, 0.738037109375, 0.81591796875, 0.893798828125, 0.9716796875, 1.049560546875, 1.12744140625, 1.205322265625, 1.283203125, 1.361083984375, 1.43896484375, 1.516845703125, 1.5947265625, 1.672607421875, 1.75048828125, 1.828369140625, 1.90625, 1.984130859375, 2.06201171875, 2.139892578125, 2.2177734375, 2.295654296875, 2.37353515625, 2.451416015625, 2.529296875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 3.0, 3.0, 8.0, 8.0, 8.0, 17.0, 16.0, 21.0, 23.0, 23.0, 26.0, 36.0, 42.0, 41.0, 31.0, 52.0, 52.0, 53.0, 67.0, 49.0, 54.0, 49.0, 52.0, 37.0, 36.0, 31.0, 30.0, 28.0, 19.0, 17.0, 13.0, 11.0, 11.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.077926635742188, -20.463621139526367, -19.849315643310547, -19.235010147094727, -18.620704650878906, -18.006399154663086, -17.392093658447266, -16.777786254882812, -16.163482666015625, -15.549177169799805, -14.934871673583984, -14.320566177368164, -13.706260681152344, -13.091955184936523, -12.477648735046387, -11.863343238830566, -11.24903678894043, -10.63473129272461, -10.020425796508789, -9.406120300292969, -8.791814804077148, -8.177509307861328, -7.563202857971191, -6.948897361755371, -6.334591865539551, -5.7202863693237305, -5.10598087310791, -4.491674900054932, -3.8773694038391113, -3.263063907623291, -2.6487581729888916, -2.034452438354492, -1.4201488494873047, -0.8058432340621948, -0.19153761863708496, 0.4227679967880249, 1.0370736122131348, 1.651379108428955, 2.2656848430633545, 2.879990577697754, 3.494296073913574, 4.1086015701293945, 4.722907066345215, 5.337213039398193, 5.951518535614014, 6.565824031829834, 7.1801300048828125, 7.794435501098633, 8.408740997314453, 9.023046493530273, 9.637351989746094, 10.251657485961914, 10.865962982177734, 11.480268478393555, 12.094574928283691, 12.708880424499512, 13.323185920715332, 13.937491416931152, 14.551796913146973, 15.166102409362793, 15.78040885925293, 16.39471435546875, 17.00901985168457, 17.62332534790039, 18.23763084411621]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 7.0, 10.0, 15.0, 17.0, 12.0, 10.0, 15.0, 21.0, 19.0, 33.0, 29.0, 26.0, 34.0, 33.0, 37.0, 47.0, 34.0, 38.0, 39.0, 40.0, 55.0, 27.0, 31.0, 34.0, 27.0, 36.0, 36.0, 27.0, 29.0, 23.0, 27.0, 12.0, 13.0, 13.0, 7.0, 18.0, 7.0, 7.0, 5.0, 7.0, 5.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.295456886291504, -12.856975555419922, -12.41849422454834, -11.980012893676758, -11.541531562805176, -11.103050231933594, -10.664569854736328, -10.22608757019043, -9.787607192993164, -9.349125862121582, -8.91064453125, -8.472163200378418, -8.033681869506836, -7.595200538635254, -7.15671968460083, -6.718238353729248, -6.279756546020508, -5.841275215148926, -5.402793884277344, -4.964312553405762, -4.52583122253418, -4.087349891662598, -3.648869037628174, -3.210387706756592, -2.7719063758850098, -2.3334250450134277, -1.8949438333511353, -1.4564626216888428, -1.0179812908172607, -0.5794999599456787, -0.14101886749267578, 0.29746246337890625, 0.7359437942504883, 1.1744251251220703, 1.6129063367843628, 2.0513875484466553, 2.4898688793182373, 2.9283502101898193, 3.3668313026428223, 3.8053126335144043, 4.243793964385986, 4.682275295257568, 5.12075662612915, 5.559237480163574, 5.997718811035156, 6.436200141906738, 6.87468147277832, 7.313162803649902, 7.751644134521484, 8.190125465393066, 8.628606796264648, 9.06708812713623, 9.505569458007812, 9.944050788879395, 10.382532119750977, 10.821012496948242, 11.25949478149414, 11.697976112365723, 12.136457443237305, 12.574938774108887, 13.013420104980469, 13.45190143585205, 13.890382766723633, 14.328863143920898, 14.76734447479248]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 4.0, 6.0, 13.0, 8.0, 23.0, 24.0, 29.0, 42.0, 49.0, 74.0, 90.0, 130.0, 185.0, 258.0, 410.0, 593.0, 1104.0, 1882.0, 4602.0, 496139.0, 10543.0, 3664.0, 1690.0, 909.0, 598.0, 325.0, 210.0, 174.0, 121.0, 111.0, 64.0, 33.0, 30.0, 28.0, 22.0, 25.0, 16.0, 9.0, 5.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.6606140136719, -263.2204895019531, -253.78036499023438, -244.34024047851562, -234.90011596679688, -225.45999145507812, -216.0198516845703, -206.57972717285156, -197.1396026611328, -187.69947814941406, -178.2593536376953, -168.81922912597656, -159.37908935546875, -149.93896484375, -140.49884033203125, -131.0587158203125, -121.61859130859375, -112.178466796875, -102.73834228515625, -93.29821014404297, -83.85808563232422, -74.41796112060547, -64.97782897949219, -55.53770446777344, -46.09757995605469, -36.65745544433594, -27.217327117919922, -17.77720069885254, -8.337074279785156, 1.1030502319335938, 10.54317855834961, 19.983306884765625, 29.423431396484375, 38.863555908203125, 48.30368423461914, 57.743812561035156, 67.1839370727539, 76.62406158447266, 86.06419372558594, 95.50431823730469, 104.94444274902344, 114.38456726074219, 123.82469177246094, 133.2648162841797, 142.7049560546875, 152.14508056640625, 161.585205078125, 171.02532958984375, 180.4654541015625, 189.90557861328125, 199.345703125, 208.78582763671875, 218.2259521484375, 227.66607666015625, 237.10621643066406, 246.5463409423828, 255.98646545410156, 265.4266052246094, 274.8667297363281, 284.3068542480469, 293.7469787597656, 303.1871032714844, 312.6272277832031, 322.0673522949219, 331.5074768066406]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 10.0, 12.0, 14.0, 18.0, 14.0, 6.0, 19.0, 18.0, 22.0, 30.0, 31.0, 27.0, 39.0, 31.0, 39.0, 40.0, 33.0, 32.0, 43.0, 1076.0, 44.0, 31.0, 28.0, 37.0, 26.0, 37.0, 30.0, 33.0, 21.0, 29.0, 19.0, 20.0, 9.0, 17.0, 10.0, 15.0, 4.0, 8.0, 4.0, 7.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-412.3919372558594, -398.66351318359375, -384.93511962890625, -371.20672607421875, -357.4783020019531, -343.7498779296875, -330.021484375, -316.2930908203125, -302.5646667480469, -288.83624267578125, -275.10784912109375, -261.37945556640625, -247.65103149414062, -233.92262268066406, -220.1942138671875, -206.46580505371094, -192.73739624023438, -179.0089874267578, -165.28057861328125, -151.5521697998047, -137.82376098632812, -124.09535217285156, -110.366943359375, -96.63853454589844, -82.91012573242188, -69.18171691894531, -55.45330810546875, -41.72489929199219, -27.996490478515625, -14.268081665039062, -0.5396728515625, 13.188735961914062, 26.917144775390625, 40.64555358886719, 54.37396240234375, 68.10237121582031, 81.83078002929688, 95.55918884277344, 109.28759765625, 123.01600646972656, 136.74441528320312, 150.4728240966797, 164.20123291015625, 177.9296417236328, 191.65805053710938, 205.38645935058594, 219.1148681640625, 232.84327697753906, 246.57168579101562, 260.30010986328125, 274.02850341796875, 287.75689697265625, 301.4853210449219, 315.2137451171875, 328.942138671875, 342.6705322265625, 356.3989562988281, 370.12738037109375, 383.85577392578125, 397.58416748046875, 411.3125915527344, 425.041015625, 438.7694091796875, 452.497802734375, 466.2262268066406]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 6.0, 4.0, 9.0, 12.0, 6.0, 11.0, 10.0, 15.0, 26.0, 31.0, 28.0, 35.0, 50.0, 83.0, 110.0, 157.0, 258.0, 328.0, 512.0, 690.0, 926.0, 1171.0, 1581.0, 2182.0, 3398.0, 4810.0, 11404.0, 31146528.0, 52135.0, 10468.0, 7266.0, 6639.0, 1471.0, 632.0, 417.0, 279.0, 247.0, 168.0, 126.0, 108.0, 85.0, 41.0, 22.0, 8.0, 7.0, 0.0, 0.0, 1.0], "bins": [-690.6199951171875, -674.8472900390625, -659.0745849609375, -643.3018798828125, -627.5291137695312, -611.7564086914062, -595.9837036132812, -580.2109985351562, -564.4382934570312, -548.6655883789062, -532.8928833007812, -517.1201171875, -501.3474426269531, -485.57470703125, -469.802001953125, -454.029296875, -438.2565612792969, -422.4838562011719, -406.71112060546875, -390.93841552734375, -375.16571044921875, -359.39300537109375, -343.6202697753906, -327.8475646972656, -312.0748291015625, -296.3021240234375, -280.5293884277344, -264.7566833496094, -248.98397827148438, -233.2112579345703, -217.43853759765625, -201.66583251953125, -185.89309692382812, -170.12037658691406, -154.34767150878906, -138.574951171875, -122.80223846435547, -107.02952575683594, -91.25680541992188, -75.48409271240234, -59.71138000488281, -43.93866729736328, -28.165950775146484, -12.393234252929688, 3.3794784545898438, 19.152191162109375, 34.92491149902344, 50.69762420654297, 66.4703369140625, 82.24304962158203, 98.01576232910156, 113.78848266601562, 129.56118774414062, 145.3339080810547, 161.10662841796875, 176.87933349609375, 192.6520538330078, 208.42477416992188, 224.19747924804688, 239.97019958496094, 255.742919921875, 271.515625, 287.288330078125, 303.0610656738281, 318.8337707519531]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 20.0, 23.0, 20.0, 40.0, 43.0, 57.0, 62.0, 93.0, 99.0, 88.0, 80.0, 83.0, 54.0, 51.0, 33.0, 34.0, 17.0, 20.0, 17.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-550.7784423828125, -535.5905151367188, -520.402587890625, -505.21466064453125, -490.0267028808594, -474.8387756347656, -459.6508483886719, -444.4629211425781, -429.27496337890625, -414.0870361328125, -398.89910888671875, -383.711181640625, -368.5232238769531, -353.3352966308594, -338.1473693847656, -322.9594421386719, -307.7715148925781, -292.5835876464844, -277.3956604003906, -262.20770263671875, -247.019775390625, -231.83184814453125, -216.6439208984375, -201.45599365234375, -186.26805114746094, -171.0801239013672, -155.89218139648438, -140.70425415039062, -125.51631927490234, -110.32838439941406, -95.14045715332031, -79.95252227783203, -64.76458740234375, -49.57665252685547, -34.38872146606445, -19.200790405273438, -4.012855529785156, 11.175079345703125, 26.363006591796875, 41.550941467285156, 56.73887634277344, 71.92681121826172, 87.11474609375, 102.30267333984375, 117.49060821533203, 132.6785430908203, 147.86647033691406, 163.05441284179688, 178.24234008789062, 193.43026733398438, 208.6182098388672, 223.80613708496094, 238.99407958984375, 254.1820068359375, 269.36993408203125, 284.557861328125, 299.74578857421875, 314.9337158203125, 330.12164306640625, 345.3095703125, 360.4975280761719, 375.6854553222656, 390.8733825683594, 406.0613098144531, 421.249267578125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 7.0, 4.0, 13.0, 11.0, 12.0, 16.0, 15.0, 7.0, 23.0, 21.0, 30.0, 30.0, 35.0, 49.0, 58.0, 71.0, 85.0, 69.0, 77.0, 55.0, 37.0, 36.0, 31.0, 28.0, 22.0, 28.0, 15.0, 13.0, 13.0, 9.0, 9.0, 20.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-474.1795654296875, -460.4901428222656, -446.80072021484375, -433.111328125, -419.4219055175781, -405.73248291015625, -392.0430908203125, -378.3536682128906, -364.66424560546875, -350.9748229980469, -337.285400390625, -323.59600830078125, -309.9065856933594, -296.2171630859375, -282.52777099609375, -268.8383483886719, -255.14892578125, -241.45950317382812, -227.7700958251953, -214.0806884765625, -200.39126586914062, -186.70184326171875, -173.01243591308594, -159.32302856445312, -145.63360595703125, -131.94418334960938, -118.25477600097656, -104.56536102294922, -90.87594604492188, -77.18653106689453, -63.49711608886719, -49.807701110839844, -36.118255615234375, -22.42884063720703, -8.739425659179688, 4.949989318847656, 18.639404296875, 32.328819274902344, 46.01823425292969, 59.70764923095703, 73.39706420898438, 87.08647918701172, 100.77589416503906, 114.4653091430664, 128.15472412109375, 141.84414672851562, 155.53355407714844, 169.22296142578125, 182.91238403320312, 196.601806640625, 210.2912139892578, 223.98062133789062, 237.6700439453125, 251.35946655273438, 265.04888916015625, 278.73828125, 292.4277038574219, 306.11712646484375, 319.8065185546875, 333.4959411621094, 347.18536376953125, 360.8747863769531, 374.564208984375, 388.25360107421875, 401.9430236816406]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 12.0, 12.0, 27.0, 39.0, 63.0, 91.0, 125.0, 198.0, 280.0, 422.0, 666.0, 972.0, 1409.0, 2289.0, 3595.0, 5950.0, 9764.0, 17205.0, 31923.0, 61449.0, 123836.0, 264246.0, 607553.0, 1620773.0, 789513.0, 336472.0, 153290.0, 74528.0, 38695.0, 20849.0, 11672.0, 6685.0, 3998.0, 2374.0, 1374.0, 784.0, 444.0, 283.0, 178.0, 91.0, 51.0, 47.0, 26.0, 13.0, 8.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.313232421875, -9.00927734375, -8.705322265625, -8.4013671875, -8.097412109375, -7.79345703125, -7.489501953125, -7.185546875, -6.881591796875, -6.57763671875, -6.273681640625, -5.9697265625, -5.665771484375, -5.36181640625, -5.057861328125, -4.75390625, -4.449951171875, -4.14599609375, -3.842041015625, -3.5380859375, -3.234130859375, -2.93017578125, -2.626220703125, -2.322265625, -2.018310546875, -1.71435546875, -1.410400390625, -1.1064453125, -0.802490234375, -0.49853515625, -0.194580078125, 0.109375, 0.413330078125, 0.71728515625, 1.021240234375, 1.3251953125, 1.629150390625, 1.93310546875, 2.237060546875, 2.541015625, 2.844970703125, 3.14892578125, 3.452880859375, 3.7568359375, 4.060791015625, 4.36474609375, 4.668701171875, 4.97265625, 5.276611328125, 5.58056640625, 5.884521484375, 6.1884765625, 6.492431640625, 6.79638671875, 7.100341796875, 7.404296875, 7.708251953125, 8.01220703125, 8.316162109375, 8.6201171875, 8.924072265625, 9.22802734375, 9.531982421875, 9.8359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 3.0, 13.0, 18.0, 7.0, 19.0, 13.0, 20.0, 26.0, 40.0, 54.0, 44.0, 41.0, 59.0, 62.0, 64.0, 62.0, 65.0, 60.0, 62.0, 38.0, 46.0, 25.0, 24.0, 24.0, 19.0, 16.0, 8.0, 9.0, 6.0, 6.0, 7.0, 2.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8542861938476562, -0.8282012939453125, -0.8021163940429688, -0.776031494140625, -0.7499465942382812, -0.7238616943359375, -0.6977767944335938, -0.67169189453125, -0.6456069946289062, -0.6195220947265625, -0.5934371948242188, -0.567352294921875, -0.5412673950195312, -0.5151824951171875, -0.48909759521484375, -0.4630126953125, -0.43692779541015625, -0.4108428955078125, -0.38475799560546875, -0.358673095703125, -0.33258819580078125, -0.3065032958984375, -0.28041839599609375, -0.25433349609375, -0.22824859619140625, -0.2021636962890625, -0.17607879638671875, -0.149993896484375, -0.12390899658203125, -0.0978240966796875, -0.07173919677734375, -0.045654296875, -0.01956939697265625, 0.0065155029296875, 0.03260040283203125, 0.058685302734375, 0.08477020263671875, 0.1108551025390625, 0.13694000244140625, 0.16302490234375, 0.18910980224609375, 0.2151947021484375, 0.24127960205078125, 0.267364501953125, 0.29344940185546875, 0.3195343017578125, 0.34561920166015625, 0.3717041015625, 0.39778900146484375, 0.4238739013671875, 0.44995880126953125, 0.476043701171875, 0.5021286010742188, 0.5282135009765625, 0.5542984008789062, 0.58038330078125, 0.6064682006835938, 0.6325531005859375, 0.6586380004882812, 0.684722900390625, 0.7108078002929688, 0.7368927001953125, 0.7629776000976562, 0.7890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 1.0, 5.0, 15.0, 19.0, 19.0, 27.0, 48.0, 47.0, 92.0, 133.0, 199.0, 337.0, 635.0, 1200.0, 2583.0, 6389.0, 17607.0, 55745.0, 199260.0, 735735.0, 1958032.0, 877025.0, 239232.0, 66075.0, 20448.0, 7354.0, 2967.0, 1358.0, 690.0, 371.0, 217.0, 124.0, 93.0, 55.0, 37.0, 24.0, 10.0, 13.0, 11.0, 10.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.7890625, -10.4857177734375, -10.182373046875, -9.8790283203125, -9.57568359375, -9.2723388671875, -8.968994140625, -8.6656494140625, -8.3623046875, -8.0589599609375, -7.755615234375, -7.4522705078125, -7.14892578125, -6.8455810546875, -6.542236328125, -6.2388916015625, -5.935546875, -5.6322021484375, -5.328857421875, -5.0255126953125, -4.72216796875, -4.4188232421875, -4.115478515625, -3.8121337890625, -3.5087890625, -3.2054443359375, -2.902099609375, -2.5987548828125, -2.29541015625, -1.9920654296875, -1.688720703125, -1.3853759765625, -1.08203125, -0.7786865234375, -0.475341796875, -0.1719970703125, 0.13134765625, 0.4346923828125, 0.738037109375, 1.0413818359375, 1.3447265625, 1.6480712890625, 1.951416015625, 2.2547607421875, 2.55810546875, 2.8614501953125, 3.164794921875, 3.4681396484375, 3.771484375, 4.0748291015625, 4.378173828125, 4.6815185546875, 4.98486328125, 5.2882080078125, 5.591552734375, 5.8948974609375, 6.1982421875, 6.5015869140625, 6.804931640625, 7.1082763671875, 7.41162109375, 7.7149658203125, 8.018310546875, 8.3216552734375, 8.625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 17.0, 34.0, 46.0, 45.0, 81.0, 91.0, 104.0, 115.0, 180.0, 194.0, 282.0, 289.0, 417.0, 485.0, 322.0, 266.0, 235.0, 189.0, 144.0, 114.0, 86.0, 83.0, 61.0, 33.0, 42.0, 16.0, 15.0, 19.0, 10.0, 7.0, 5.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.408966064453125, -2.31988525390625, -2.230804443359375, -2.1417236328125, -2.052642822265625, -1.96356201171875, -1.874481201171875, -1.785400390625, -1.696319580078125, -1.60723876953125, -1.518157958984375, -1.4290771484375, -1.339996337890625, -1.25091552734375, -1.161834716796875, -1.07275390625, -0.983673095703125, -0.89459228515625, -0.805511474609375, -0.7164306640625, -0.627349853515625, -0.53826904296875, -0.449188232421875, -0.360107421875, -0.271026611328125, -0.18194580078125, -0.092864990234375, -0.0037841796875, 0.085296630859375, 0.17437744140625, 0.263458251953125, 0.3525390625, 0.441619873046875, 0.53070068359375, 0.619781494140625, 0.7088623046875, 0.797943115234375, 0.88702392578125, 0.976104736328125, 1.065185546875, 1.154266357421875, 1.24334716796875, 1.332427978515625, 1.4215087890625, 1.510589599609375, 1.59967041015625, 1.688751220703125, 1.77783203125, 1.866912841796875, 1.95599365234375, 2.045074462890625, 2.1341552734375, 2.223236083984375, 2.31231689453125, 2.401397705078125, 2.490478515625, 2.579559326171875, 2.66864013671875, 2.757720947265625, 2.8468017578125, 2.935882568359375, 3.02496337890625, 3.114044189453125, 3.203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 5.0, 11.0, 9.0, 12.0, 19.0, 22.0, 35.0, 40.0, 53.0, 65.0, 64.0, 65.0, 67.0, 87.0, 65.0, 80.0, 62.0, 60.0, 41.0, 37.0, 16.0, 15.0, 13.0, 9.0, 9.0, 6.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.275325775146484, -27.48114585876465, -26.686967849731445, -25.89278793334961, -25.098608016967773, -24.30443000793457, -23.510250091552734, -22.71607208251953, -21.921892166137695, -21.12771224975586, -20.333534240722656, -19.53935432434082, -18.745174407958984, -17.95099639892578, -17.156816482543945, -16.36263656616211, -15.56845760345459, -14.77427864074707, -13.980098724365234, -13.185919761657715, -12.391740798950195, -11.59756088256836, -10.80338191986084, -10.00920295715332, -9.215023040771484, -8.420844078063965, -7.626664638519287, -6.832485198974609, -6.03830623626709, -5.244126796722412, -4.449947357177734, -3.655768394470215, -2.8615894317626953, -2.0674102306365967, -1.2732309103012085, -0.4790515899658203, 0.3151276111602783, 1.109306812286377, 1.9034862518310547, 2.697665214538574, 3.491844654083252, 4.28602409362793, 5.080203056335449, 5.874382495880127, 6.668561935424805, 7.462740898132324, 8.256919860839844, 9.05109977722168, 9.8452787399292, 10.639457702636719, 11.433637619018555, 12.227816581726074, 13.021995544433594, 13.81617546081543, 14.61035442352295, 15.404533386230469, 16.198713302612305, 16.99289321899414, 17.787071228027344, 18.58125114440918, 19.375431060791016, 20.16960906982422, 20.963788986206055, 21.75796890258789, 22.552146911621094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 5.0, 8.0, 14.0, 12.0, 7.0, 20.0, 16.0, 13.0, 22.0, 30.0, 37.0, 33.0, 40.0, 36.0, 40.0, 40.0, 44.0, 54.0, 40.0, 39.0, 33.0, 28.0, 35.0, 46.0, 39.0, 39.0, 32.0, 15.0, 22.0, 34.0, 13.0, 18.0, 14.0, 5.0, 10.0, 7.0, 5.0, 12.0, 5.0, 3.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-16.215167999267578, -15.719022750854492, -15.222877502441406, -14.72673225402832, -14.230587005615234, -13.734441757202148, -13.238296508789062, -12.742151260375977, -12.24600601196289, -11.749860763549805, -11.253715515136719, -10.757570266723633, -10.261425018310547, -9.765279769897461, -9.269134521484375, -8.772989273071289, -8.276844024658203, -7.780698776245117, -7.284553527832031, -6.788408279418945, -6.292263031005859, -5.796117782592773, -5.2999725341796875, -4.803827285766602, -4.307682037353516, -3.8115367889404297, -3.3153915405273438, -2.819246292114258, -2.323101043701172, -1.826955795288086, -1.330810546875, -0.8346652984619141, -0.3385200500488281, 0.1576251983642578, 0.6537704467773438, 1.1499156951904297, 1.6460609436035156, 2.1422061920166016, 2.6383514404296875, 3.1344966888427734, 3.6306419372558594, 4.126787185668945, 4.622932434082031, 5.119077682495117, 5.615222930908203, 6.111368179321289, 6.607513427734375, 7.103658676147461, 7.599803924560547, 8.095949172973633, 8.592094421386719, 9.088239669799805, 9.58438491821289, 10.080530166625977, 10.576675415039062, 11.072820663452148, 11.568965911865234, 12.06511116027832, 12.561256408691406, 13.057401657104492, 13.553546905517578, 14.049692153930664, 14.54583740234375, 15.041982650756836, 15.538127899169922]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 7.0, 2.0, 4.0, 8.0, 9.0, 9.0, 22.0, 32.0, 33.0, 53.0, 73.0, 127.0, 150.0, 233.0, 371.0, 507.0, 845.0, 1300.0, 2082.0, 3552.0, 6047.0, 10742.0, 20464.0, 40791.0, 86796.0, 187705.0, 304868.0, 198050.0, 91642.0, 42811.0, 21433.0, 11550.0, 6435.0, 3712.0, 2208.0, 1355.0, 886.0, 554.0, 363.0, 205.0, 155.0, 112.0, 70.0, 49.0, 33.0, 27.0, 25.0, 17.0, 11.0, 4.0, 9.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-5.91796875, -5.736083984375, -5.55419921875, -5.372314453125, -5.1904296875, -5.008544921875, -4.82666015625, -4.644775390625, -4.462890625, -4.281005859375, -4.09912109375, -3.917236328125, -3.7353515625, -3.553466796875, -3.37158203125, -3.189697265625, -3.0078125, -2.825927734375, -2.64404296875, -2.462158203125, -2.2802734375, -2.098388671875, -1.91650390625, -1.734619140625, -1.552734375, -1.370849609375, -1.18896484375, -1.007080078125, -0.8251953125, -0.643310546875, -0.46142578125, -0.279541015625, -0.09765625, 0.084228515625, 0.26611328125, 0.447998046875, 0.6298828125, 0.811767578125, 0.99365234375, 1.175537109375, 1.357421875, 1.539306640625, 1.72119140625, 1.903076171875, 2.0849609375, 2.266845703125, 2.44873046875, 2.630615234375, 2.8125, 2.994384765625, 3.17626953125, 3.358154296875, 3.5400390625, 3.721923828125, 3.90380859375, 4.085693359375, 4.267578125, 4.449462890625, 4.63134765625, 4.813232421875, 4.9951171875, 5.177001953125, 5.35888671875, 5.540771484375, 5.72265625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 0.0, 2.0, 4.0, 3.0, 7.0, 3.0, 10.0, 8.0, 10.0, 22.0, 18.0, 18.0, 26.0, 36.0, 31.0, 36.0, 64.0, 55.0, 53.0, 47.0, 55.0, 61.0, 57.0, 59.0, 44.0, 32.0, 37.0, 48.0, 26.0, 21.0, 19.0, 19.0, 15.0, 13.0, 8.0, 4.0, 9.0, 6.0, 4.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0234375, -0.9931640625, -0.962890625, -0.9326171875, -0.90234375, -0.8720703125, -0.841796875, -0.8115234375, -0.78125, -0.7509765625, -0.720703125, -0.6904296875, -0.66015625, -0.6298828125, -0.599609375, -0.5693359375, -0.5390625, -0.5087890625, -0.478515625, -0.4482421875, -0.41796875, -0.3876953125, -0.357421875, -0.3271484375, -0.296875, -0.2666015625, -0.236328125, -0.2060546875, -0.17578125, -0.1455078125, -0.115234375, -0.0849609375, -0.0546875, -0.0244140625, 0.005859375, 0.0361328125, 0.06640625, 0.0966796875, 0.126953125, 0.1572265625, 0.1875, 0.2177734375, 0.248046875, 0.2783203125, 0.30859375, 0.3388671875, 0.369140625, 0.3994140625, 0.4296875, 0.4599609375, 0.490234375, 0.5205078125, 0.55078125, 0.5810546875, 0.611328125, 0.6416015625, 0.671875, 0.7021484375, 0.732421875, 0.7626953125, 0.79296875, 0.8232421875, 0.853515625, 0.8837890625, 0.9140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 12.0, 8.0, 8.0, 16.0, 25.0, 24.0, 44.0, 69.0, 100.0, 200.0, 357.0, 641.0, 1296.0, 2770.0, 6974.0, 20730.0, 84097.0, 496751.0, 348553.0, 59587.0, 15989.0, 5595.0, 2295.0, 1076.0, 544.0, 300.0, 176.0, 108.0, 66.0, 35.0, 23.0, 21.0, 9.0, 6.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.99609375, -7.73724365234375, -7.4783935546875, -7.21954345703125, -6.960693359375, -6.70184326171875, -6.4429931640625, -6.18414306640625, -5.92529296875, -5.66644287109375, -5.4075927734375, -5.14874267578125, -4.889892578125, -4.63104248046875, -4.3721923828125, -4.11334228515625, -3.8544921875, -3.59564208984375, -3.3367919921875, -3.07794189453125, -2.819091796875, -2.56024169921875, -2.3013916015625, -2.04254150390625, -1.78369140625, -1.52484130859375, -1.2659912109375, -1.00714111328125, -0.748291015625, -0.48944091796875, -0.2305908203125, 0.02825927734375, 0.287109375, 0.54595947265625, 0.8048095703125, 1.06365966796875, 1.322509765625, 1.58135986328125, 1.8402099609375, 2.09906005859375, 2.35791015625, 2.61676025390625, 2.8756103515625, 3.13446044921875, 3.393310546875, 3.65216064453125, 3.9110107421875, 4.16986083984375, 4.4287109375, 4.68756103515625, 4.9464111328125, 5.20526123046875, 5.464111328125, 5.72296142578125, 5.9818115234375, 6.24066162109375, 6.49951171875, 6.75836181640625, 7.0172119140625, 7.27606201171875, 7.534912109375, 7.79376220703125, 8.0526123046875, 8.31146240234375, 8.5703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0, 10.0, 10.0, 14.0, 19.0, 13.0, 11.0, 15.0, 21.0, 30.0, 21.0, 36.0, 28.0, 27.0, 36.0, 28.0, 38.0, 38.0, 39.0, 32.0, 41.0, 35.0, 32.0, 43.0, 27.0, 29.0, 41.0, 38.0, 27.0, 20.0, 27.0, 22.0, 23.0, 17.0, 17.0, 8.0, 6.0, 7.0, 7.0, 7.0, 6.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.763671875, -3.645416259765625, -3.52716064453125, -3.408905029296875, -3.2906494140625, -3.172393798828125, -3.05413818359375, -2.935882568359375, -2.817626953125, -2.699371337890625, -2.58111572265625, -2.462860107421875, -2.3446044921875, -2.226348876953125, -2.10809326171875, -1.989837646484375, -1.87158203125, -1.753326416015625, -1.63507080078125, -1.516815185546875, -1.3985595703125, -1.280303955078125, -1.16204833984375, -1.043792724609375, -0.925537109375, -0.807281494140625, -0.68902587890625, -0.570770263671875, -0.4525146484375, -0.334259033203125, -0.21600341796875, -0.097747802734375, 0.0205078125, 0.138763427734375, 0.25701904296875, 0.375274658203125, 0.4935302734375, 0.611785888671875, 0.73004150390625, 0.848297119140625, 0.966552734375, 1.084808349609375, 1.20306396484375, 1.321319580078125, 1.4395751953125, 1.557830810546875, 1.67608642578125, 1.794342041015625, 1.91259765625, 2.030853271484375, 2.14910888671875, 2.267364501953125, 2.3856201171875, 2.503875732421875, 2.62213134765625, 2.740386962890625, 2.858642578125, 2.976898193359375, 3.09515380859375, 3.213409423828125, 3.3316650390625, 3.449920654296875, 3.56817626953125, 3.686431884765625, 3.8046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 7.0, 7.0, 15.0, 38.0, 73.0, 133.0, 322.0, 1689.0, 38011.0, 1000172.0, 6875.0, 762.0, 252.0, 89.0, 36.0, 24.0, 12.0, 12.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3125, -63.69140625, -62.0703125, -60.44921875, -58.828125, -57.20703125, -55.5859375, -53.96484375, -52.34375, -50.72265625, -49.1015625, -47.48046875, -45.859375, -44.23828125, -42.6171875, -40.99609375, -39.375, -37.75390625, -36.1328125, -34.51171875, -32.890625, -31.26953125, -29.6484375, -28.02734375, -26.40625, -24.78515625, -23.1640625, -21.54296875, -19.921875, -18.30078125, -16.6796875, -15.05859375, -13.4375, -11.81640625, -10.1953125, -8.57421875, -6.953125, -5.33203125, -3.7109375, -2.08984375, -0.46875, 1.15234375, 2.7734375, 4.39453125, 6.015625, 7.63671875, 9.2578125, 10.87890625, 12.5, 14.12109375, 15.7421875, 17.36328125, 18.984375, 20.60546875, 22.2265625, 23.84765625, 25.46875, 27.08984375, 28.7109375, 30.33203125, 31.953125, 33.57421875, 35.1953125, 36.81640625, 38.4375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 15.0, 20.0, 30.0, 51.0, 50.0, 58.0, 78.0, 91.0, 89.0, 96.0, 95.0, 74.0, 49.0, 34.0, 29.0, 34.0, 13.0, 18.0, 10.0, 10.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042724609375, -0.0004123672842979431, -0.00039748847484588623, -0.00038260966539382935, -0.00036773085594177246, -0.0003528520464897156, -0.0003379732370376587, -0.0003230944275856018, -0.0003082156181335449, -0.00029333680868148804, -0.00027845799922943115, -0.00026357918977737427, -0.0002487003803253174, -0.0002338215708732605, -0.0002189427614212036, -0.00020406395196914673, -0.00018918514251708984, -0.00017430633306503296, -0.00015942752361297607, -0.0001445487141609192, -0.0001296699047088623, -0.00011479109525680542, -9.991228580474854e-05, -8.503347635269165e-05, -7.015466690063477e-05, -5.527585744857788e-05, -4.0397047996520996e-05, -2.551823854446411e-05, -1.0639429092407227e-05, 4.239380359649658e-06, 1.9118189811706543e-05, 3.399699926376343e-05, 4.887580871582031e-05, 6.37546181678772e-05, 7.863342761993408e-05, 9.351223707199097e-05, 0.00010839104652404785, 0.00012326985597610474, 0.00013814866542816162, 0.0001530274748802185, 0.0001679062843322754, 0.00018278509378433228, 0.00019766390323638916, 0.00021254271268844604, 0.00022742152214050293, 0.00024230033159255981, 0.0002571791410446167, 0.0002720579504966736, 0.00028693675994873047, 0.00030181556940078735, 0.00031669437885284424, 0.0003315731883049011, 0.000346451997756958, 0.0003613308072090149, 0.0003762096166610718, 0.00039108842611312866, 0.00040596723556518555, 0.00042084604501724243, 0.0004357248544692993, 0.0004506036639213562, 0.0004654824733734131, 0.00048036128282546997, 0.0004952400922775269, 0.0005101189017295837, 0.0005249977111816406]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 5.0, 13.0, 21.0, 14.0, 23.0, 41.0, 46.0, 68.0, 108.0, 143.0, 223.0, 422.0, 706.0, 1335.0, 2847.0, 6937.0, 21371.0, 101802.0, 614353.0, 241318.0, 37880.0, 10630.0, 4083.0, 1885.0, 871.0, 512.0, 284.0, 182.0, 125.0, 84.0, 47.0, 40.0, 34.0, 26.0, 13.0, 15.0, 6.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.03125, -8.7166748046875, -8.402099609375, -8.0875244140625, -7.77294921875, -7.4583740234375, -7.143798828125, -6.8292236328125, -6.5146484375, -6.2000732421875, -5.885498046875, -5.5709228515625, -5.25634765625, -4.9417724609375, -4.627197265625, -4.3126220703125, -3.998046875, -3.6834716796875, -3.368896484375, -3.0543212890625, -2.73974609375, -2.4251708984375, -2.110595703125, -1.7960205078125, -1.4814453125, -1.1668701171875, -0.852294921875, -0.5377197265625, -0.22314453125, 0.0914306640625, 0.406005859375, 0.7205810546875, 1.03515625, 1.3497314453125, 1.664306640625, 1.9788818359375, 2.29345703125, 2.6080322265625, 2.922607421875, 3.2371826171875, 3.5517578125, 3.8663330078125, 4.180908203125, 4.4954833984375, 4.81005859375, 5.1246337890625, 5.439208984375, 5.7537841796875, 6.068359375, 6.3829345703125, 6.697509765625, 7.0120849609375, 7.32666015625, 7.6412353515625, 7.955810546875, 8.2703857421875, 8.5849609375, 8.8995361328125, 9.214111328125, 9.5286865234375, 9.84326171875, 10.1578369140625, 10.472412109375, 10.7869873046875, 11.1015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 18.0, 28.0, 37.0, 52.0, 112.0, 154.0, 184.0, 166.0, 98.0, 44.0, 30.0, 21.0, 7.0, 6.0, 7.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.46875, -9.20721435546875, -8.9456787109375, -8.68414306640625, -8.422607421875, -8.16107177734375, -7.8995361328125, -7.63800048828125, -7.37646484375, -7.11492919921875, -6.8533935546875, -6.59185791015625, -6.330322265625, -6.06878662109375, -5.8072509765625, -5.54571533203125, -5.2841796875, -5.02264404296875, -4.7611083984375, -4.49957275390625, -4.238037109375, -3.97650146484375, -3.7149658203125, -3.45343017578125, -3.19189453125, -2.93035888671875, -2.6688232421875, -2.40728759765625, -2.145751953125, -1.88421630859375, -1.6226806640625, -1.36114501953125, -1.099609375, -0.83807373046875, -0.5765380859375, -0.31500244140625, -0.053466796875, 0.20806884765625, 0.4696044921875, 0.73114013671875, 0.99267578125, 1.25421142578125, 1.5157470703125, 1.77728271484375, 2.038818359375, 2.30035400390625, 2.5618896484375, 2.82342529296875, 3.0849609375, 3.34649658203125, 3.6080322265625, 3.86956787109375, 4.131103515625, 4.39263916015625, 4.6541748046875, 4.91571044921875, 5.17724609375, 5.43878173828125, 5.7003173828125, 5.96185302734375, 6.223388671875, 6.48492431640625, 6.7464599609375, 7.00799560546875, 7.26953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 14.0, 18.0, 62.0, 248.0, 390.0, 163.0, 63.0, 18.0, 7.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.04808807373047, -68.29481506347656, -63.54153823852539, -58.788265228271484, -54.03498840332031, -49.281715393066406, -44.5284423828125, -39.77516555786133, -35.02189254760742, -30.268617630004883, -25.515342712402344, -20.762069702148438, -16.0087947845459, -11.25551986694336, -6.502246856689453, -1.7489700317382812, 3.004302978515625, 7.757577419281006, 12.510851860046387, 17.26412582397461, 22.01740074157715, 26.770675659179688, 31.523948669433594, 36.277225494384766, 41.03049850463867, 45.78377151489258, 50.53704833984375, 55.290321350097656, 60.04359436035156, 64.796875, 69.55014038085938, 74.30342102050781, 79.05668640136719, 83.8099594116211, 88.563232421875, 93.31651306152344, 98.06978607177734, 102.82305908203125, 107.57633209228516, 112.32960510253906, 117.0828857421875, 121.8361587524414, 126.58943176269531, 131.34271240234375, 136.09597778320312, 140.84925842285156, 145.6025390625, 150.35580444335938, 155.10906982421875, 159.8623504638672, 164.61561584472656, 169.368896484375, 174.12216186523438, 178.8754425048828, 183.62872314453125, 188.38198852539062, 193.13526916503906, 197.8885498046875, 202.64181518554688, 207.3950958251953, 212.1483612060547, 216.90164184570312, 221.6549072265625, 226.40818786621094, 231.16146850585938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 6.0, 10.0, 15.0, 24.0, 27.0, 45.0, 64.0, 102.0, 134.0, 141.0, 132.0, 94.0, 74.0, 42.0, 28.0, 8.0, 13.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.29398345947266, -88.3702392578125, -85.44650268554688, -82.52275848388672, -79.59901428222656, -76.67527770996094, -73.75153350830078, -70.82778930664062, -67.904052734375, -64.98030853271484, -62.05657196044922, -59.13282775878906, -56.20908737182617, -53.28534698486328, -50.361602783203125, -47.437862396240234, -44.514122009277344, -41.59038162231445, -38.66664123535156, -35.742897033691406, -32.819156646728516, -29.895416259765625, -26.9716739654541, -24.047931671142578, -21.124191284179688, -18.200450897216797, -15.276708602905273, -12.352967262268066, -9.42922592163086, -6.505484580993652, -3.5817432403564453, -0.6580009460449219, 2.2657318115234375, 5.1894731521606445, 8.113214492797852, 11.036955833435059, 13.960697174072266, 16.884437561035156, 19.80817985534668, 22.731922149658203, 25.655662536621094, 28.579402923583984, 31.503145217895508, 34.42688751220703, 37.35062789916992, 40.27436828613281, 43.19811248779297, 46.12185287475586, 49.04559326171875, 51.96933364868164, 54.89307403564453, 57.81681823730469, 60.74055862426758, 63.66429901123047, 66.58804321289062, 69.51177978515625, 72.4355239868164, 75.35926818847656, 78.28300476074219, 81.20674896240234, 84.1304931640625, 87.05422973632812, 89.97797393798828, 92.90171813964844, 95.82545471191406]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 12.0, 9.0, 12.0, 17.0, 31.0, 47.0, 76.0, 105.0, 214.0, 358.0, 579.0, 1131.0, 2268.0, 4944.0, 11589.0, 30242.0, 94326.0, 424416.0, 3273166.0, 244358.0, 66140.0, 22919.0, 9320.0, 4120.0, 1868.0, 890.0, 490.0, 219.0, 168.0, 83.0, 48.0, 39.0, 25.0, 21.0, 12.0, 7.0, 8.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.5625, -22.810791015625, -22.05908203125, -21.307373046875, -20.5556640625, -19.803955078125, -19.05224609375, -18.300537109375, -17.548828125, -16.797119140625, -16.04541015625, -15.293701171875, -14.5419921875, -13.790283203125, -13.03857421875, -12.286865234375, -11.53515625, -10.783447265625, -10.03173828125, -9.280029296875, -8.5283203125, -7.776611328125, -7.02490234375, -6.273193359375, -5.521484375, -4.769775390625, -4.01806640625, -3.266357421875, -2.5146484375, -1.762939453125, -1.01123046875, -0.259521484375, 0.4921875, 1.243896484375, 1.99560546875, 2.747314453125, 3.4990234375, 4.250732421875, 5.00244140625, 5.754150390625, 6.505859375, 7.257568359375, 8.00927734375, 8.760986328125, 9.5126953125, 10.264404296875, 11.01611328125, 11.767822265625, 12.51953125, 13.271240234375, 14.02294921875, 14.774658203125, 15.5263671875, 16.278076171875, 17.02978515625, 17.781494140625, 18.533203125, 19.284912109375, 20.03662109375, 20.788330078125, 21.5400390625, 22.291748046875, 23.04345703125, 23.795166015625, 24.546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 8.0, 11.0, 19.0, 17.0, 27.0, 30.0, 28.0, 45.0, 54.0, 67.0, 55.0, 74.0, 70.0, 66.0, 56.0, 57.0, 66.0, 44.0, 39.0, 37.0, 26.0, 22.0, 14.0, 13.0, 7.0, 10.0, 5.0, 8.0, 8.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9886627197265625, -0.949005126953125, -0.9093475341796875, -0.86968994140625, -0.8300323486328125, -0.790374755859375, -0.7507171630859375, -0.7110595703125, -0.6714019775390625, -0.631744384765625, -0.5920867919921875, -0.55242919921875, -0.5127716064453125, -0.473114013671875, -0.4334564208984375, -0.393798828125, -0.3541412353515625, -0.314483642578125, -0.2748260498046875, -0.23516845703125, -0.1955108642578125, -0.155853271484375, -0.1161956787109375, -0.0765380859375, -0.0368804931640625, 0.002777099609375, 0.0424346923828125, 0.08209228515625, 0.1217498779296875, 0.161407470703125, 0.2010650634765625, 0.24072265625, 0.2803802490234375, 0.320037841796875, 0.3596954345703125, 0.39935302734375, 0.4390106201171875, 0.478668212890625, 0.5183258056640625, 0.5579833984375, 0.5976409912109375, 0.637298583984375, 0.6769561767578125, 0.71661376953125, 0.7562713623046875, 0.795928955078125, 0.8355865478515625, 0.875244140625, 0.9149017333984375, 0.954559326171875, 0.9942169189453125, 1.03387451171875, 1.0735321044921875, 1.113189697265625, 1.1528472900390625, 1.1925048828125, 1.2321624755859375, 1.271820068359375, 1.3114776611328125, 1.35113525390625, 1.3907928466796875, 1.430450439453125, 1.4701080322265625, 1.509765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 13.0, 24.0, 27.0, 48.0, 57.0, 80.0, 135.0, 201.0, 305.0, 535.0, 891.0, 1513.0, 2807.0, 5225.0, 10036.0, 20916.0, 44031.0, 100203.0, 256582.0, 1094945.0, 2180721.0, 278093.0, 106710.0, 46070.0, 21353.0, 10510.0, 5333.0, 2782.0, 1620.0, 930.0, 574.0, 370.0, 235.0, 132.0, 88.0, 54.0, 27.0, 23.0, 17.0, 17.0, 17.0, 12.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.8828125, -14.432373046875, -13.98193359375, -13.531494140625, -13.0810546875, -12.630615234375, -12.18017578125, -11.729736328125, -11.279296875, -10.828857421875, -10.37841796875, -9.927978515625, -9.4775390625, -9.027099609375, -8.57666015625, -8.126220703125, -7.67578125, -7.225341796875, -6.77490234375, -6.324462890625, -5.8740234375, -5.423583984375, -4.97314453125, -4.522705078125, -4.072265625, -3.621826171875, -3.17138671875, -2.720947265625, -2.2705078125, -1.820068359375, -1.36962890625, -0.919189453125, -0.46875, -0.018310546875, 0.43212890625, 0.882568359375, 1.3330078125, 1.783447265625, 2.23388671875, 2.684326171875, 3.134765625, 3.585205078125, 4.03564453125, 4.486083984375, 4.9365234375, 5.386962890625, 5.83740234375, 6.287841796875, 6.73828125, 7.188720703125, 7.63916015625, 8.089599609375, 8.5400390625, 8.990478515625, 9.44091796875, 9.891357421875, 10.341796875, 10.792236328125, 11.24267578125, 11.693115234375, 12.1435546875, 12.593994140625, 13.04443359375, 13.494873046875, 13.9453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 6.0, 7.0, 19.0, 22.0, 28.0, 30.0, 45.0, 57.0, 65.0, 66.0, 107.0, 119.0, 153.0, 267.0, 557.0, 1416.0, 326.0, 184.0, 156.0, 107.0, 67.0, 64.0, 44.0, 46.0, 29.0, 23.0, 16.0, 12.0, 6.0, 1.0, 6.0, 1.0, 7.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.12109375, -3.026947021484375, -2.93280029296875, -2.838653564453125, -2.7445068359375, -2.650360107421875, -2.55621337890625, -2.462066650390625, -2.367919921875, -2.273773193359375, -2.17962646484375, -2.085479736328125, -1.9913330078125, -1.897186279296875, -1.80303955078125, -1.708892822265625, -1.61474609375, -1.520599365234375, -1.42645263671875, -1.332305908203125, -1.2381591796875, -1.144012451171875, -1.04986572265625, -0.955718994140625, -0.861572265625, -0.767425537109375, -0.67327880859375, -0.579132080078125, -0.4849853515625, -0.390838623046875, -0.29669189453125, -0.202545166015625, -0.1083984375, -0.014251708984375, 0.07989501953125, 0.174041748046875, 0.2681884765625, 0.362335205078125, 0.45648193359375, 0.550628662109375, 0.644775390625, 0.738922119140625, 0.83306884765625, 0.927215576171875, 1.0213623046875, 1.115509033203125, 1.20965576171875, 1.303802490234375, 1.39794921875, 1.492095947265625, 1.58624267578125, 1.680389404296875, 1.7745361328125, 1.868682861328125, 1.96282958984375, 2.056976318359375, 2.151123046875, 2.245269775390625, 2.33941650390625, 2.433563232421875, 2.5277099609375, 2.621856689453125, 2.71600341796875, 2.810150146484375, 2.904296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 3.0, 6.0, 10.0, 10.0, 6.0, 25.0, 21.0, 47.0, 67.0, 96.0, 120.0, 139.0, 113.0, 95.0, 78.0, 46.0, 39.0, 24.0, 11.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.469757080078125, -22.664220809936523, -21.858684539794922, -21.05314826965332, -20.24761199951172, -19.442075729370117, -18.636539459228516, -17.831003189086914, -17.025466918945312, -16.21993064880371, -15.41439437866211, -14.608858108520508, -13.803321838378906, -12.997785568237305, -12.192249298095703, -11.386713027954102, -10.581177711486816, -9.775641441345215, -8.970105171203613, -8.164568901062012, -7.35903263092041, -6.553496837615967, -5.747960567474365, -4.942424297332764, -4.136888027191162, -3.3313517570495605, -2.525815486907959, -1.7202794551849365, -0.914743185043335, -0.1092071533203125, 0.6963291168212891, 1.5018653869628906, 2.307401657104492, 3.1129379272460938, 3.9184741973876953, 4.724010467529297, 5.529546737670898, 6.335082530975342, 7.140618801116943, 7.946155071258545, 8.751691818237305, 9.557228088378906, 10.362764358520508, 11.16830062866211, 11.973836898803711, 12.779373168945312, 13.584909439086914, 14.390445709228516, 15.1959810256958, 16.001516342163086, 16.807052612304688, 17.61258888244629, 18.41812515258789, 19.223661422729492, 20.029197692871094, 20.834733963012695, 21.640270233154297, 22.4458065032959, 23.2513427734375, 24.0568790435791, 24.862415313720703, 25.667951583862305, 26.473487854003906, 27.279024124145508, 28.08456039428711]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 11.0, 10.0, 22.0, 26.0, 28.0, 20.0, 33.0, 26.0, 45.0, 45.0, 52.0, 43.0, 67.0, 47.0, 52.0, 68.0, 52.0, 49.0, 41.0, 46.0, 33.0, 23.0, 29.0, 29.0, 16.0, 11.0, 9.0, 7.0, 11.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.70572566986084, -13.225020408630371, -12.744315147399902, -12.263609886169434, -11.782905578613281, -11.302200317382812, -10.821495056152344, -10.340789794921875, -9.860084533691406, -9.379379272460938, -8.898674011230469, -8.41796875, -7.9372639656066895, -7.456558704376221, -6.97585391998291, -6.495148658752441, -6.014443397521973, -5.533738136291504, -5.053032875061035, -4.572328090667725, -4.091622829437256, -3.610917568206787, -3.1302125453948975, -2.649507522583008, -2.168802261352539, -1.6880971193313599, -1.2073919773101807, -0.7266868352890015, -0.24598169326782227, 0.23472356796264648, 0.7154285907745361, 1.1961336135864258, 1.6768379211425781, 2.157543182373047, 2.6382482051849365, 3.118953227996826, 3.599658489227295, 4.080363750457764, 4.561068534851074, 5.041773796081543, 5.522479057312012, 6.0031843185424805, 6.483889579772949, 6.96459436416626, 7.4452996253967285, 7.926004886627197, 8.406709671020508, 8.887414932250977, 9.368120193481445, 9.848825454711914, 10.329530715942383, 10.810235977172852, 11.29094123840332, 11.771646499633789, 12.252350807189941, 12.73305606842041, 13.213761329650879, 13.694466590881348, 14.175171852111816, 14.655877113342285, 15.136581420898438, 15.617286682128906, 16.097991943359375, 16.578697204589844, 17.059402465820312]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 6.0, 9.0, 6.0, 8.0, 30.0, 37.0, 49.0, 94.0, 120.0, 229.0, 383.0, 678.0, 1350.0, 2630.0, 5040.0, 11658.0, 30493.0, 110833.0, 552842.0, 246600.0, 52898.0, 17690.0, 7391.0, 3464.0, 1811.0, 928.0, 521.0, 282.0, 177.0, 100.0, 56.0, 53.0, 19.0, 17.0, 12.0, 10.0, 5.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.734375, -21.090087890625, -20.44580078125, -19.801513671875, -19.1572265625, -18.512939453125, -17.86865234375, -17.224365234375, -16.580078125, -15.935791015625, -15.29150390625, -14.647216796875, -14.0029296875, -13.358642578125, -12.71435546875, -12.070068359375, -11.42578125, -10.781494140625, -10.13720703125, -9.492919921875, -8.8486328125, -8.204345703125, -7.56005859375, -6.915771484375, -6.271484375, -5.627197265625, -4.98291015625, -4.338623046875, -3.6943359375, -3.050048828125, -2.40576171875, -1.761474609375, -1.1171875, -0.472900390625, 0.17138671875, 0.815673828125, 1.4599609375, 2.104248046875, 2.74853515625, 3.392822265625, 4.037109375, 4.681396484375, 5.32568359375, 5.969970703125, 6.6142578125, 7.258544921875, 7.90283203125, 8.547119140625, 9.19140625, 9.835693359375, 10.47998046875, 11.124267578125, 11.7685546875, 12.412841796875, 13.05712890625, 13.701416015625, 14.345703125, 14.989990234375, 15.63427734375, 16.278564453125, 16.9228515625, 17.567138671875, 18.21142578125, 18.855712890625, 19.5]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 9.0, 14.0, 13.0, 25.0, 25.0, 23.0, 40.0, 35.0, 51.0, 51.0, 45.0, 51.0, 61.0, 39.0, 53.0, 59.0, 59.0, 52.0, 39.0, 40.0, 44.0, 25.0, 23.0, 19.0, 14.0, 10.0, 15.0, 13.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2275390625, -1.1898345947265625, -1.152130126953125, -1.1144256591796875, -1.07672119140625, -1.0390167236328125, -1.001312255859375, -0.9636077880859375, -0.9259033203125, -0.8881988525390625, -0.850494384765625, -0.8127899169921875, -0.77508544921875, -0.7373809814453125, -0.699676513671875, -0.6619720458984375, -0.624267578125, -0.5865631103515625, -0.548858642578125, -0.5111541748046875, -0.47344970703125, -0.4357452392578125, -0.398040771484375, -0.3603363037109375, -0.3226318359375, -0.2849273681640625, -0.247222900390625, -0.2095184326171875, -0.17181396484375, -0.1341094970703125, -0.096405029296875, -0.0587005615234375, -0.02099609375, 0.0167083740234375, 0.054412841796875, 0.0921173095703125, 0.12982177734375, 0.1675262451171875, 0.205230712890625, 0.2429351806640625, 0.2806396484375, 0.3183441162109375, 0.356048583984375, 0.3937530517578125, 0.43145751953125, 0.4691619873046875, 0.506866455078125, 0.5445709228515625, 0.582275390625, 0.6199798583984375, 0.657684326171875, 0.6953887939453125, 0.73309326171875, 0.7707977294921875, 0.808502197265625, 0.8462066650390625, 0.8839111328125, 0.9216156005859375, 0.959320068359375, 0.9970245361328125, 1.03472900390625, 1.0724334716796875, 1.110137939453125, 1.1478424072265625, 1.185546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 9.0, 4.0, 11.0, 26.0, 47.0, 290.0, 3531.0, 504185.0, 536521.0, 3451.0, 281.0, 44.0, 15.0, 14.0, 10.0, 13.0, 7.0, 5.0, 6.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.3125, -59.123046875, -56.93359375, -54.744140625, -52.5546875, -50.365234375, -48.17578125, -45.986328125, -43.796875, -41.607421875, -39.41796875, -37.228515625, -35.0390625, -32.849609375, -30.66015625, -28.470703125, -26.28125, -24.091796875, -21.90234375, -19.712890625, -17.5234375, -15.333984375, -13.14453125, -10.955078125, -8.765625, -6.576171875, -4.38671875, -2.197265625, -0.0078125, 2.181640625, 4.37109375, 6.560546875, 8.75, 10.939453125, 13.12890625, 15.318359375, 17.5078125, 19.697265625, 21.88671875, 24.076171875, 26.265625, 28.455078125, 30.64453125, 32.833984375, 35.0234375, 37.212890625, 39.40234375, 41.591796875, 43.78125, 45.970703125, 48.16015625, 50.349609375, 52.5390625, 54.728515625, 56.91796875, 59.107421875, 61.296875, 63.486328125, 65.67578125, 67.865234375, 70.0546875, 72.244140625, 74.43359375, 76.623046875, 78.8125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 5.0, 10.0, 2.0, 9.0, 7.0, 17.0, 13.0, 18.0, 20.0, 23.0, 23.0, 24.0, 31.0, 46.0, 38.0, 31.0, 47.0, 32.0, 40.0, 36.0, 48.0, 45.0, 48.0, 44.0, 38.0, 43.0, 37.0, 29.0, 27.0, 34.0, 18.0, 22.0, 10.0, 13.0, 14.0, 12.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.28094482421875, -5.1165771484375, -4.95220947265625, -4.787841796875, -4.62347412109375, -4.4591064453125, -4.29473876953125, -4.13037109375, -3.96600341796875, -3.8016357421875, -3.63726806640625, -3.472900390625, -3.30853271484375, -3.1441650390625, -2.97979736328125, -2.8154296875, -2.65106201171875, -2.4866943359375, -2.32232666015625, -2.157958984375, -1.99359130859375, -1.8292236328125, -1.66485595703125, -1.50048828125, -1.33612060546875, -1.1717529296875, -1.00738525390625, -0.843017578125, -0.67864990234375, -0.5142822265625, -0.34991455078125, -0.185546875, -0.02117919921875, 0.1431884765625, 0.30755615234375, 0.471923828125, 0.63629150390625, 0.8006591796875, 0.96502685546875, 1.12939453125, 1.29376220703125, 1.4581298828125, 1.62249755859375, 1.786865234375, 1.95123291015625, 2.1156005859375, 2.27996826171875, 2.4443359375, 2.60870361328125, 2.7730712890625, 2.93743896484375, 3.101806640625, 3.26617431640625, 3.4305419921875, 3.59490966796875, 3.75927734375, 3.92364501953125, 4.0880126953125, 4.25238037109375, 4.416748046875, 4.58111572265625, 4.7454833984375, 4.90985107421875, 5.07421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 4.0, 4.0, 0.0, 5.0, 11.0, 7.0, 11.0, 10.0, 13.0, 37.0, 122.0, 514.0, 14516.0, 1029814.0, 3027.0, 286.0, 74.0, 22.0, 20.0, 12.0, 5.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.4873046875, -100.287109375, -97.0869140625, -93.88671875, -90.6865234375, -87.486328125, -84.2861328125, -81.0859375, -77.8857421875, -74.685546875, -71.4853515625, -68.28515625, -65.0849609375, -61.884765625, -58.6845703125, -55.484375, -52.2841796875, -49.083984375, -45.8837890625, -42.68359375, -39.4833984375, -36.283203125, -33.0830078125, -29.8828125, -26.6826171875, -23.482421875, -20.2822265625, -17.08203125, -13.8818359375, -10.681640625, -7.4814453125, -4.28125, -1.0810546875, 2.119140625, 5.3193359375, 8.51953125, 11.7197265625, 14.919921875, 18.1201171875, 21.3203125, 24.5205078125, 27.720703125, 30.9208984375, 34.12109375, 37.3212890625, 40.521484375, 43.7216796875, 46.921875, 50.1220703125, 53.322265625, 56.5224609375, 59.72265625, 62.9228515625, 66.123046875, 69.3232421875, 72.5234375, 75.7236328125, 78.923828125, 82.1240234375, 85.32421875, 88.5244140625, 91.724609375, 94.9248046875, 98.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 10.0, 14.0, 33.0, 34.0, 64.0, 105.0, 172.0, 173.0, 145.0, 81.0, 55.0, 36.0, 19.0, 8.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010538101196289062, -0.0010282471776008606, -0.001002684235572815, -0.0009771212935447693, -0.0009515583515167236, -0.000925995409488678, -0.0009004324674606323, -0.0008748695254325867, -0.000849306583404541, -0.0008237436413764954, -0.0007981806993484497, -0.000772617757320404, -0.0007470548152923584, -0.0007214918732643127, -0.0006959289312362671, -0.0006703659892082214, -0.0006448030471801758, -0.0006192401051521301, -0.0005936771631240845, -0.0005681142210960388, -0.0005425512790679932, -0.0005169883370399475, -0.0004914253950119019, -0.0004658624529838562, -0.00044029951095581055, -0.0004147365689277649, -0.00038917362689971924, -0.0003636106848716736, -0.00033804774284362793, -0.0003124848008155823, -0.0002869218587875366, -0.00026135891675949097, -0.0002357959747314453, -0.00021023303270339966, -0.000184670090675354, -0.00015910714864730835, -0.0001335442066192627, -0.00010798126459121704, -8.241832256317139e-05, -5.685538053512573e-05, -3.129243850708008e-05, -5.729496479034424e-06, 1.983344554901123e-05, 4.5396387577056885e-05, 7.095932960510254e-05, 9.65222716331482e-05, 0.00012208521366119385, 0.0001476481556892395, 0.00017321109771728516, 0.0001987740397453308, 0.00022433698177337646, 0.0002498999238014221, 0.0002754628658294678, 0.00030102580785751343, 0.0003265887498855591, 0.00035215169191360474, 0.0003777146339416504, 0.00040327757596969604, 0.0004288405179977417, 0.00045440346002578735, 0.000479966402053833, 0.0005055293440818787, 0.0005310922861099243, 0.00055665522813797, 0.0005822181701660156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 2.0, 3.0, 6.0, 13.0, 9.0, 22.0, 36.0, 62.0, 83.0, 111.0, 196.0, 349.0, 557.0, 1004.0, 2134.0, 5179.0, 16617.0, 143552.0, 807262.0, 54095.0, 10036.0, 3595.0, 1627.0, 833.0, 455.0, 276.0, 150.0, 100.0, 63.0, 43.0, 33.0, 16.0, 12.0, 10.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34375, -34.21533203125, -33.0869140625, -31.95849609375, -30.830078125, -29.70166015625, -28.5732421875, -27.44482421875, -26.31640625, -25.18798828125, -24.0595703125, -22.93115234375, -21.802734375, -20.67431640625, -19.5458984375, -18.41748046875, -17.2890625, -16.16064453125, -15.0322265625, -13.90380859375, -12.775390625, -11.64697265625, -10.5185546875, -9.39013671875, -8.26171875, -7.13330078125, -6.0048828125, -4.87646484375, -3.748046875, -2.61962890625, -1.4912109375, -0.36279296875, 0.765625, 1.89404296875, 3.0224609375, 4.15087890625, 5.279296875, 6.40771484375, 7.5361328125, 8.66455078125, 9.79296875, 10.92138671875, 12.0498046875, 13.17822265625, 14.306640625, 15.43505859375, 16.5634765625, 17.69189453125, 18.8203125, 19.94873046875, 21.0771484375, 22.20556640625, 23.333984375, 24.46240234375, 25.5908203125, 26.71923828125, 27.84765625, 28.97607421875, 30.1044921875, 31.23291015625, 32.361328125, 33.48974609375, 34.6181640625, 35.74658203125, 36.875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 10.0, 9.0, 11.0, 9.0, 22.0, 27.0, 28.0, 29.0, 56.0, 72.0, 92.0, 142.0, 89.0, 92.0, 64.0, 62.0, 46.0, 33.0, 24.0, 17.0, 13.0, 16.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.47772216796875, -9.2210693359375, -8.96441650390625, -8.707763671875, -8.45111083984375, -8.1944580078125, -7.93780517578125, -7.68115234375, -7.42449951171875, -7.1678466796875, -6.91119384765625, -6.654541015625, -6.39788818359375, -6.1412353515625, -5.88458251953125, -5.6279296875, -5.37127685546875, -5.1146240234375, -4.85797119140625, -4.601318359375, -4.34466552734375, -4.0880126953125, -3.83135986328125, -3.57470703125, -3.31805419921875, -3.0614013671875, -2.80474853515625, -2.548095703125, -2.29144287109375, -2.0347900390625, -1.77813720703125, -1.521484375, -1.26483154296875, -1.0081787109375, -0.75152587890625, -0.494873046875, -0.23822021484375, 0.0184326171875, 0.27508544921875, 0.53173828125, 0.78839111328125, 1.0450439453125, 1.30169677734375, 1.558349609375, 1.81500244140625, 2.0716552734375, 2.32830810546875, 2.5849609375, 2.84161376953125, 3.0982666015625, 3.35491943359375, 3.611572265625, 3.86822509765625, 4.1248779296875, 4.38153076171875, 4.63818359375, 4.89483642578125, 5.1514892578125, 5.40814208984375, 5.664794921875, 5.92144775390625, 6.1781005859375, 6.43475341796875, 6.69140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 20.0, 36.0, 62.0, 119.0, 166.0, 172.0, 178.0, 94.0, 61.0, 30.0, 18.0, 13.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.8785400390625, -99.69815063476562, -96.51775360107422, -93.33736419677734, -90.15696716308594, -86.97657775878906, -83.79618835449219, -80.61579895019531, -77.4354019165039, -74.25501251220703, -71.07461547851562, -67.89422607421875, -64.71383666992188, -61.53343963623047, -58.353050231933594, -55.17265701293945, -51.99226379394531, -48.81187057495117, -45.63147735595703, -42.451087951660156, -39.270694732666016, -36.090301513671875, -32.909912109375, -29.72951889038086, -26.54912567138672, -23.368732452392578, -20.18834114074707, -17.007949829101562, -13.827556610107422, -10.647164344787598, -7.466772079467773, -4.286380767822266, -1.105987548828125, 2.074404716491699, 5.254796981811523, 8.435189247131348, 11.615581512451172, 14.795973777770996, 17.97636604309082, 21.156757354736328, 24.33715057373047, 27.51754379272461, 30.697935104370117, 33.878326416015625, 37.058719635009766, 40.239112854003906, 43.41950225830078, 46.59989547729492, 49.78028869628906, 52.9606819152832, 56.141075134277344, 59.32146453857422, 62.50185775756836, 65.6822509765625, 68.86264038085938, 72.04302978515625, 75.22342681884766, 78.40381622314453, 81.58421325683594, 84.76460266113281, 87.94499206542969, 91.1253890991211, 94.30577850341797, 97.48617553710938, 100.66656494140625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 6.0, 4.0, 8.0, 10.0, 18.0, 10.0, 8.0, 16.0, 20.0, 20.0, 30.0, 35.0, 42.0, 45.0, 41.0, 52.0, 49.0, 62.0, 60.0, 58.0, 60.0, 40.0, 34.0, 32.0, 41.0, 30.0, 26.0, 27.0, 22.0, 21.0, 11.0, 13.0, 8.0, 9.0, 4.0, 10.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.935176849365234, -40.591121673583984, -39.247066497802734, -37.903011322021484, -36.558956146240234, -35.21490478515625, -33.870849609375, -32.52679443359375, -31.1827392578125, -29.83868408203125, -28.49462890625, -27.15057373046875, -25.806520462036133, -24.462465286254883, -23.118410110473633, -21.774356842041016, -20.430299758911133, -19.086244583129883, -17.742189407348633, -16.398136138916016, -15.054080963134766, -13.710025787353516, -12.365970611572266, -11.021916389465332, -9.677861213684082, -8.333806037902832, -6.989751815795898, -5.645696640014648, -4.301641941070557, -2.957587242126465, -1.6135320663452148, -0.26947784423828125, 1.0745773315429688, 2.4186320304870605, 3.7626869678497314, 5.106741905212402, 6.450796604156494, 7.794851303100586, 9.138906478881836, 10.48296070098877, 11.82701587677002, 13.17107105255127, 14.515125274658203, 15.859180450439453, 17.203235626220703, 18.547290802001953, 19.891345977783203, 21.23539924621582, 22.57945442199707, 23.92350959777832, 25.26756477355957, 26.611618041992188, 27.955673217773438, 29.299728393554688, 30.643783569335938, 31.987838745117188, 33.33189392089844, 34.67594909667969, 36.02000427246094, 37.36405944824219, 38.70811462402344, 40.05216979980469, 41.39622497558594, 42.74027633666992, 44.08433151245117]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 9.0, 11.0, 14.0, 15.0, 25.0, 44.0, 52.0, 77.0, 134.0, 182.0, 280.0, 472.0, 870.0, 1637.0, 3189.0, 7330.0, 18273.0, 60448.0, 408501.0, 3539880.0, 105648.0, 28027.0, 10079.0, 4295.0, 2085.0, 1125.0, 647.0, 372.0, 198.0, 141.0, 67.0, 38.0, 27.0, 21.0, 16.0, 11.0, 7.0, 0.0, 2.0, 5.0], "bins": [-48.3125, -47.19384765625, -46.0751953125, -44.95654296875, -43.837890625, -42.71923828125, -41.6005859375, -40.48193359375, -39.36328125, -38.24462890625, -37.1259765625, -36.00732421875, -34.888671875, -33.77001953125, -32.6513671875, -31.53271484375, -30.4140625, -29.29541015625, -28.1767578125, -27.05810546875, -25.939453125, -24.82080078125, -23.7021484375, -22.58349609375, -21.46484375, -20.34619140625, -19.2275390625, -18.10888671875, -16.990234375, -15.87158203125, -14.7529296875, -13.63427734375, -12.515625, -11.39697265625, -10.2783203125, -9.15966796875, -8.041015625, -6.92236328125, -5.8037109375, -4.68505859375, -3.56640625, -2.44775390625, -1.3291015625, -0.21044921875, 0.908203125, 2.02685546875, 3.1455078125, 4.26416015625, 5.3828125, 6.50146484375, 7.6201171875, 8.73876953125, 9.857421875, 10.97607421875, 12.0947265625, 13.21337890625, 14.33203125, 15.45068359375, 16.5693359375, 17.68798828125, 18.806640625, 19.92529296875, 21.0439453125, 22.16259765625, 23.28125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 13.0, 10.0, 14.0, 18.0, 24.0, 30.0, 43.0, 42.0, 34.0, 39.0, 41.0, 44.0, 44.0, 37.0, 48.0, 53.0, 55.0, 53.0, 53.0, 43.0, 26.0, 29.0, 29.0, 31.0, 16.0, 22.0, 19.0, 13.0, 8.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.04296875, -1.0087890625, -0.974609375, -0.9404296875, -0.90625, -0.8720703125, -0.837890625, -0.8037109375, -0.76953125, -0.7353515625, -0.701171875, -0.6669921875, -0.6328125, -0.5986328125, -0.564453125, -0.5302734375, -0.49609375, -0.4619140625, -0.427734375, -0.3935546875, -0.359375, -0.3251953125, -0.291015625, -0.2568359375, -0.22265625, -0.1884765625, -0.154296875, -0.1201171875, -0.0859375, -0.0517578125, -0.017578125, 0.0166015625, 0.05078125, 0.0849609375, 0.119140625, 0.1533203125, 0.1875, 0.2216796875, 0.255859375, 0.2900390625, 0.32421875, 0.3583984375, 0.392578125, 0.4267578125, 0.4609375, 0.4951171875, 0.529296875, 0.5634765625, 0.59765625, 0.6318359375, 0.666015625, 0.7001953125, 0.734375, 0.7685546875, 0.802734375, 0.8369140625, 0.87109375, 0.9052734375, 0.939453125, 0.9736328125, 1.0078125, 1.0419921875, 1.076171875, 1.1103515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 19.0, 15.0, 32.0, 38.0, 55.0, 94.0, 197.0, 1091.0, 27140.0, 4054593.0, 108060.0, 2324.0, 302.0, 107.0, 55.0, 46.0, 27.0, 21.0, 25.0, 12.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.625, -141.5400390625, -137.455078125, -133.3701171875, -129.28515625, -125.2001953125, -121.115234375, -117.0302734375, -112.9453125, -108.8603515625, -104.775390625, -100.6904296875, -96.60546875, -92.5205078125, -88.435546875, -84.3505859375, -80.265625, -76.1806640625, -72.095703125, -68.0107421875, -63.92578125, -59.8408203125, -55.755859375, -51.6708984375, -47.5859375, -43.5009765625, -39.416015625, -35.3310546875, -31.24609375, -27.1611328125, -23.076171875, -18.9912109375, -14.90625, -10.8212890625, -6.736328125, -2.6513671875, 1.43359375, 5.5185546875, 9.603515625, 13.6884765625, 17.7734375, 21.8583984375, 25.943359375, 30.0283203125, 34.11328125, 38.1982421875, 42.283203125, 46.3681640625, 50.453125, 54.5380859375, 58.623046875, 62.7080078125, 66.79296875, 70.8779296875, 74.962890625, 79.0478515625, 83.1328125, 87.2177734375, 91.302734375, 95.3876953125, 99.47265625, 103.5576171875, 107.642578125, 111.7275390625, 115.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 16.0, 15.0, 12.0, 12.0, 27.0, 43.0, 40.0, 55.0, 68.0, 107.0, 152.0, 297.0, 1835.0, 572.0, 225.0, 149.0, 104.0, 75.0, 56.0, 35.0, 38.0, 28.0, 25.0, 15.0, 11.0, 6.0, 5.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.919677734375, -3.80029296875, -3.680908203125, -3.5615234375, -3.442138671875, -3.32275390625, -3.203369140625, -3.083984375, -2.964599609375, -2.84521484375, -2.725830078125, -2.6064453125, -2.487060546875, -2.36767578125, -2.248291015625, -2.12890625, -2.009521484375, -1.89013671875, -1.770751953125, -1.6513671875, -1.531982421875, -1.41259765625, -1.293212890625, -1.173828125, -1.054443359375, -0.93505859375, -0.815673828125, -0.6962890625, -0.576904296875, -0.45751953125, -0.338134765625, -0.21875, -0.099365234375, 0.02001953125, 0.139404296875, 0.2587890625, 0.378173828125, 0.49755859375, 0.616943359375, 0.736328125, 0.855712890625, 0.97509765625, 1.094482421875, 1.2138671875, 1.333251953125, 1.45263671875, 1.572021484375, 1.69140625, 1.810791015625, 1.93017578125, 2.049560546875, 2.1689453125, 2.288330078125, 2.40771484375, 2.527099609375, 2.646484375, 2.765869140625, 2.88525390625, 3.004638671875, 3.1240234375, 3.243408203125, 3.36279296875, 3.482177734375, 3.6015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 33.0, 94.0, 219.0, 252.0, 230.0, 97.0, 39.0, 19.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.35034942626953, -114.00067901611328, -111.65100860595703, -109.30133819580078, -106.95167541503906, -104.60200500488281, -102.25233459472656, -99.90266418457031, -97.55299377441406, -95.20332336425781, -92.85365295410156, -90.50398254394531, -88.15431213378906, -85.80464935302734, -83.4549789428711, -81.10530853271484, -78.7556381225586, -76.40596771240234, -74.0562973022461, -71.70662689208984, -69.35696411132812, -67.00729370117188, -64.65762329101562, -62.307952880859375, -59.958282470703125, -57.608612060546875, -55.258941650390625, -52.90927505493164, -50.55960464477539, -48.20993423461914, -45.860267639160156, -43.510597229003906, -41.16092300415039, -38.81125259399414, -36.461585998535156, -34.111915588378906, -31.762245178222656, -29.412574768066406, -27.06290626525879, -24.713237762451172, -22.363567352294922, -20.013896942138672, -17.664228439331055, -15.314558982849121, -12.964889526367188, -10.615220069885254, -8.26555061340332, -5.915882110595703, -3.566211700439453, -1.2165422439575195, 1.133127212524414, 3.4827966690063477, 5.832466125488281, 8.182135581970215, 10.531805038452148, 12.881473541259766, 15.231143951416016, 17.580814361572266, 19.930482864379883, 22.2801513671875, 24.62982177734375, 26.9794921875, 29.329160690307617, 31.678829193115234, 34.028499603271484]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 9.0, 7.0, 6.0, 13.0, 12.0, 18.0, 14.0, 20.0, 26.0, 20.0, 39.0, 40.0, 41.0, 46.0, 47.0, 59.0, 48.0, 59.0, 48.0, 56.0, 49.0, 49.0, 35.0, 44.0, 34.0, 33.0, 34.0, 13.0, 21.0, 12.0, 17.0, 6.0, 6.0, 4.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.313941955566406, -19.796260833740234, -19.278579711914062, -18.76089859008789, -18.24321746826172, -17.72553825378418, -17.207857131958008, -16.690176010131836, -16.172494888305664, -15.654813766479492, -15.13713264465332, -14.619452476501465, -14.101771354675293, -13.584090232849121, -13.066410064697266, -12.548728942871094, -12.031047821044922, -11.51336669921875, -10.995685577392578, -10.478005409240723, -9.96032428741455, -9.442643165588379, -8.924962997436523, -8.407281875610352, -7.88960075378418, -7.371919631958008, -6.854238986968994, -6.3365583419799805, -5.818877220153809, -5.301196098327637, -4.783515453338623, -4.265834808349609, -3.7481517791748047, -3.230470895767212, -2.712790012359619, -2.1951091289520264, -1.6774282455444336, -1.1597473621368408, -0.642066478729248, -0.12438559532165527, 0.3932952880859375, 0.9109761714935303, 1.428657054901123, 1.9463379383087158, 2.4640188217163086, 2.9816997051239014, 3.499380588531494, 4.017061233520508, 4.53474235534668, 5.052423477172852, 5.570104122161865, 6.087784767150879, 6.605465888977051, 7.123147010803223, 7.640827655792236, 8.15850830078125, 8.676189422607422, 9.193870544433594, 9.711551666259766, 10.229231834411621, 10.746912956237793, 11.264594078063965, 11.78227424621582, 12.299955368041992, 12.817636489868164]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 9.0, 6.0, 12.0, 15.0, 27.0, 36.0, 45.0, 74.0, 122.0, 201.0, 399.0, 772.0, 1826.0, 4183.0, 10409.0, 27349.0, 72314.0, 181080.0, 328241.0, 247460.0, 106891.0, 40813.0, 15424.0, 5996.0, 2545.0, 1136.0, 510.0, 260.0, 136.0, 81.0, 51.0, 31.0, 18.0, 24.0, 18.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.9954833984375, -15.490966796875, -14.9864501953125, -14.48193359375, -13.9774169921875, -13.472900390625, -12.9683837890625, -12.4638671875, -11.9593505859375, -11.454833984375, -10.9503173828125, -10.44580078125, -9.9412841796875, -9.436767578125, -8.9322509765625, -8.427734375, -7.9232177734375, -7.418701171875, -6.9141845703125, -6.40966796875, -5.9051513671875, -5.400634765625, -4.8961181640625, -4.3916015625, -3.8870849609375, -3.382568359375, -2.8780517578125, -2.37353515625, -1.8690185546875, -1.364501953125, -0.8599853515625, -0.35546875, 0.1490478515625, 0.653564453125, 1.1580810546875, 1.66259765625, 2.1671142578125, 2.671630859375, 3.1761474609375, 3.6806640625, 4.1851806640625, 4.689697265625, 5.1942138671875, 5.69873046875, 6.2032470703125, 6.707763671875, 7.2122802734375, 7.716796875, 8.2213134765625, 8.725830078125, 9.2303466796875, 9.73486328125, 10.2393798828125, 10.743896484375, 11.2484130859375, 11.7529296875, 12.2574462890625, 12.761962890625, 13.2664794921875, 13.77099609375, 14.2755126953125, 14.780029296875, 15.2845458984375, 15.7890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 19.0, 22.0, 26.0, 34.0, 42.0, 40.0, 47.0, 60.0, 58.0, 78.0, 72.0, 64.0, 66.0, 70.0, 50.0, 43.0, 36.0, 33.0, 28.0, 24.0, 20.0, 8.0, 13.0, 6.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9848175048828125, -0.937408447265625, -0.8899993896484375, -0.84259033203125, -0.7951812744140625, -0.747772216796875, -0.7003631591796875, -0.6529541015625, -0.6055450439453125, -0.558135986328125, -0.5107269287109375, -0.46331787109375, -0.4159088134765625, -0.368499755859375, -0.3210906982421875, -0.273681640625, -0.2262725830078125, -0.178863525390625, -0.1314544677734375, -0.08404541015625, -0.0366363525390625, 0.010772705078125, 0.0581817626953125, 0.1055908203125, 0.1529998779296875, 0.200408935546875, 0.2478179931640625, 0.29522705078125, 0.3426361083984375, 0.390045166015625, 0.4374542236328125, 0.48486328125, 0.5322723388671875, 0.579681396484375, 0.6270904541015625, 0.67449951171875, 0.7219085693359375, 0.769317626953125, 0.8167266845703125, 0.8641357421875, 0.9115447998046875, 0.958953857421875, 1.0063629150390625, 1.05377197265625, 1.1011810302734375, 1.148590087890625, 1.1959991455078125, 1.243408203125, 1.2908172607421875, 1.338226318359375, 1.3856353759765625, 1.43304443359375, 1.4804534912109375, 1.527862548828125, 1.5752716064453125, 1.6226806640625, 1.6700897216796875, 1.717498779296875, 1.7649078369140625, 1.81231689453125, 1.8597259521484375, 1.907135009765625, 1.9545440673828125, 2.001953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 7.0, 7.0, 11.0, 23.0, 22.0, 34.0, 47.0, 66.0, 99.0, 121.0, 176.0, 223.0, 294.0, 465.0, 695.0, 1155.0, 1915.0, 2974.0, 5253.0, 10005.0, 19032.0, 37685.0, 76001.0, 145713.0, 234711.0, 227561.0, 137425.0, 71082.0, 35463.0, 17946.0, 9463.0, 5082.0, 2887.0, 1702.0, 1052.0, 655.0, 459.0, 268.0, 191.0, 150.0, 116.0, 71.0, 73.0, 43.0, 46.0, 22.0, 13.0, 11.0, 13.0, 11.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.703125, -11.3369140625, -10.970703125, -10.6044921875, -10.23828125, -9.8720703125, -9.505859375, -9.1396484375, -8.7734375, -8.4072265625, -8.041015625, -7.6748046875, -7.30859375, -6.9423828125, -6.576171875, -6.2099609375, -5.84375, -5.4775390625, -5.111328125, -4.7451171875, -4.37890625, -4.0126953125, -3.646484375, -3.2802734375, -2.9140625, -2.5478515625, -2.181640625, -1.8154296875, -1.44921875, -1.0830078125, -0.716796875, -0.3505859375, 0.015625, 0.3818359375, 0.748046875, 1.1142578125, 1.48046875, 1.8466796875, 2.212890625, 2.5791015625, 2.9453125, 3.3115234375, 3.677734375, 4.0439453125, 4.41015625, 4.7763671875, 5.142578125, 5.5087890625, 5.875, 6.2412109375, 6.607421875, 6.9736328125, 7.33984375, 7.7060546875, 8.072265625, 8.4384765625, 8.8046875, 9.1708984375, 9.537109375, 9.9033203125, 10.26953125, 10.6357421875, 11.001953125, 11.3681640625, 11.734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 3.0, 10.0, 15.0, 14.0, 16.0, 19.0, 18.0, 17.0, 20.0, 25.0, 34.0, 30.0, 38.0, 28.0, 47.0, 50.0, 44.0, 38.0, 38.0, 38.0, 47.0, 38.0, 39.0, 39.0, 42.0, 31.0, 33.0, 29.0, 19.0, 25.0, 31.0, 14.0, 11.0, 3.0, 11.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.23046875, -7.01580810546875, -6.8011474609375, -6.58648681640625, -6.371826171875, -6.15716552734375, -5.9425048828125, -5.72784423828125, -5.51318359375, -5.29852294921875, -5.0838623046875, -4.86920166015625, -4.654541015625, -4.43988037109375, -4.2252197265625, -4.01055908203125, -3.7958984375, -3.58123779296875, -3.3665771484375, -3.15191650390625, -2.937255859375, -2.72259521484375, -2.5079345703125, -2.29327392578125, -2.07861328125, -1.86395263671875, -1.6492919921875, -1.43463134765625, -1.219970703125, -1.00531005859375, -0.7906494140625, -0.57598876953125, -0.361328125, -0.14666748046875, 0.0679931640625, 0.28265380859375, 0.497314453125, 0.71197509765625, 0.9266357421875, 1.14129638671875, 1.35595703125, 1.57061767578125, 1.7852783203125, 1.99993896484375, 2.214599609375, 2.42926025390625, 2.6439208984375, 2.85858154296875, 3.0732421875, 3.28790283203125, 3.5025634765625, 3.71722412109375, 3.931884765625, 4.14654541015625, 4.3612060546875, 4.57586669921875, 4.79052734375, 5.00518798828125, 5.2198486328125, 5.43450927734375, 5.649169921875, 5.86383056640625, 6.0784912109375, 6.29315185546875, 6.5078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 20.0, 17.0, 41.0, 33.0, 50.0, 101.0, 124.0, 190.0, 265.0, 431.0, 685.0, 1198.0, 2165.0, 4552.0, 9781.0, 23252.0, 64868.0, 184044.0, 358032.0, 249316.0, 91650.0, 32524.0, 12905.0, 5672.0, 2761.0, 1455.0, 886.0, 524.0, 307.0, 197.0, 126.0, 92.0, 71.0, 58.0, 34.0, 26.0, 18.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.140625, -9.8302001953125, -9.519775390625, -9.2093505859375, -8.89892578125, -8.5885009765625, -8.278076171875, -7.9676513671875, -7.6572265625, -7.3468017578125, -7.036376953125, -6.7259521484375, -6.41552734375, -6.1051025390625, -5.794677734375, -5.4842529296875, -5.173828125, -4.8634033203125, -4.552978515625, -4.2425537109375, -3.93212890625, -3.6217041015625, -3.311279296875, -3.0008544921875, -2.6904296875, -2.3800048828125, -2.069580078125, -1.7591552734375, -1.44873046875, -1.1383056640625, -0.827880859375, -0.5174560546875, -0.20703125, 0.1033935546875, 0.413818359375, 0.7242431640625, 1.03466796875, 1.3450927734375, 1.655517578125, 1.9659423828125, 2.2763671875, 2.5867919921875, 2.897216796875, 3.2076416015625, 3.51806640625, 3.8284912109375, 4.138916015625, 4.4493408203125, 4.759765625, 5.0701904296875, 5.380615234375, 5.6910400390625, 6.00146484375, 6.3118896484375, 6.622314453125, 6.9327392578125, 7.2431640625, 7.5535888671875, 7.864013671875, 8.1744384765625, 8.48486328125, 8.7952880859375, 9.105712890625, 9.4161376953125, 9.7265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 8.0, 15.0, 14.0, 16.0, 25.0, 36.0, 41.0, 49.0, 53.0, 64.0, 68.0, 65.0, 80.0, 79.0, 75.0, 45.0, 65.0, 42.0, 28.0, 25.0, 24.0, 13.0, 11.0, 12.0, 6.0, 4.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00141143798828125, -0.0013714134693145752, -0.0013313889503479004, -0.0012913644313812256, -0.0012513399124145508, -0.001211315393447876, -0.0011712908744812012, -0.0011312663555145264, -0.0010912418365478516, -0.0010512173175811768, -0.001011192798614502, -0.0009711682796478271, -0.0009311437606811523, -0.0008911192417144775, -0.0008510947227478027, -0.0008110702037811279, -0.0007710456848144531, -0.0007310211658477783, -0.0006909966468811035, -0.0006509721279144287, -0.0006109476089477539, -0.0005709230899810791, -0.0005308985710144043, -0.0004908740520477295, -0.0004508495330810547, -0.0004108250141143799, -0.0003708004951477051, -0.0003307759761810303, -0.00029075145721435547, -0.00025072693824768066, -0.00021070241928100586, -0.00017067790031433105, -0.00013065338134765625, -9.062886238098145e-05, -5.060434341430664e-05, -1.0579824447631836e-05, 2.944469451904297e-05, 6.946921348571777e-05, 0.00010949373245239258, 0.00014951825141906738, 0.0001895427703857422, 0.000229567289352417, 0.0002695918083190918, 0.0003096163272857666, 0.0003496408462524414, 0.0003896653652191162, 0.000429689884185791, 0.0004697144031524658, 0.0005097389221191406, 0.0005497634410858154, 0.0005897879600524902, 0.000629812479019165, 0.0006698369979858398, 0.0007098615169525146, 0.0007498860359191895, 0.0007899105548858643, 0.0008299350738525391, 0.0008699595928192139, 0.0009099841117858887, 0.0009500086307525635, 0.0009900331497192383, 0.001030057668685913, 0.0010700821876525879, 0.0011101067066192627, 0.0011501312255859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 1.0, 4.0, 7.0, 8.0, 13.0, 15.0, 27.0, 34.0, 45.0, 64.0, 96.0, 155.0, 249.0, 422.0, 665.0, 1121.0, 2201.0, 4000.0, 8237.0, 19262.0, 52741.0, 161113.0, 378570.0, 272310.0, 90992.0, 30996.0, 12442.0, 5902.0, 2900.0, 1625.0, 866.0, 528.0, 329.0, 202.0, 120.0, 103.0, 55.0, 43.0, 21.0, 20.0, 9.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-11.078125, -10.7398681640625, -10.401611328125, -10.0633544921875, -9.72509765625, -9.3868408203125, -9.048583984375, -8.7103271484375, -8.3720703125, -8.0338134765625, -7.695556640625, -7.3572998046875, -7.01904296875, -6.6807861328125, -6.342529296875, -6.0042724609375, -5.666015625, -5.3277587890625, -4.989501953125, -4.6512451171875, -4.31298828125, -3.9747314453125, -3.636474609375, -3.2982177734375, -2.9599609375, -2.6217041015625, -2.283447265625, -1.9451904296875, -1.60693359375, -1.2686767578125, -0.930419921875, -0.5921630859375, -0.25390625, 0.0843505859375, 0.422607421875, 0.7608642578125, 1.09912109375, 1.4373779296875, 1.775634765625, 2.1138916015625, 2.4521484375, 2.7904052734375, 3.128662109375, 3.4669189453125, 3.80517578125, 4.1434326171875, 4.481689453125, 4.8199462890625, 5.158203125, 5.4964599609375, 5.834716796875, 6.1729736328125, 6.51123046875, 6.8494873046875, 7.187744140625, 7.5260009765625, 7.8642578125, 8.2025146484375, 8.540771484375, 8.8790283203125, 9.21728515625, 9.5555419921875, 9.893798828125, 10.2320556640625, 10.5703125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 4.0, 7.0, 10.0, 14.0, 13.0, 20.0, 22.0, 30.0, 22.0, 45.0, 45.0, 57.0, 48.0, 53.0, 64.0, 72.0, 72.0, 60.0, 59.0, 39.0, 42.0, 39.0, 23.0, 31.0, 21.0, 19.0, 9.0, 11.0, 12.0, 6.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.83502197265625, -4.6856689453125, -4.53631591796875, -4.386962890625, -4.23760986328125, -4.0882568359375, -3.93890380859375, -3.78955078125, -3.64019775390625, -3.4908447265625, -3.34149169921875, -3.192138671875, -3.04278564453125, -2.8934326171875, -2.74407958984375, -2.5947265625, -2.44537353515625, -2.2960205078125, -2.14666748046875, -1.997314453125, -1.84796142578125, -1.6986083984375, -1.54925537109375, -1.39990234375, -1.25054931640625, -1.1011962890625, -0.95184326171875, -0.802490234375, -0.65313720703125, -0.5037841796875, -0.35443115234375, -0.205078125, -0.05572509765625, 0.0936279296875, 0.24298095703125, 0.392333984375, 0.54168701171875, 0.6910400390625, 0.84039306640625, 0.98974609375, 1.13909912109375, 1.2884521484375, 1.43780517578125, 1.587158203125, 1.73651123046875, 1.8858642578125, 2.03521728515625, 2.1845703125, 2.33392333984375, 2.4832763671875, 2.63262939453125, 2.781982421875, 2.93133544921875, 3.0806884765625, 3.23004150390625, 3.37939453125, 3.52874755859375, 3.6781005859375, 3.82745361328125, 3.976806640625, 4.12615966796875, 4.2755126953125, 4.42486572265625, 4.57421875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 3.0, 10.0, 7.0, 12.0, 10.0, 25.0, 34.0, 55.0, 78.0, 103.0, 114.0, 128.0, 121.0, 78.0, 69.0, 57.0, 23.0, 21.0, 20.0, 7.0, 12.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.85691833496094, -89.43411254882812, -86.01130676269531, -82.5885009765625, -79.16569519042969, -75.74288940429688, -72.32007598876953, -68.89727020263672, -65.4744644165039, -62.051658630371094, -58.62885284423828, -55.2060432434082, -51.78323745727539, -48.36043167114258, -44.9376220703125, -41.51481628417969, -38.092010498046875, -34.66920471191406, -31.246397018432617, -27.823589324951172, -24.40078353881836, -20.977977752685547, -17.5551700592041, -14.132362365722656, -10.709556579589844, -7.286749839782715, -3.863943099975586, -0.44113636016845703, 2.981670379638672, 6.404476165771484, 9.82728385925293, 13.250091552734375, 16.672897338867188, 20.095703125, 23.518510818481445, 26.94131851196289, 30.364124298095703, 33.786930084228516, 37.209739685058594, 40.632545471191406, 44.05535125732422, 47.47815704345703, 50.900962829589844, 54.32377243041992, 57.746578216552734, 61.16938400268555, 64.59219360351562, 68.01499938964844, 71.43780517578125, 74.86061096191406, 78.28341674804688, 81.70622253417969, 85.1290283203125, 88.55183410644531, 91.97464752197266, 95.39745330810547, 98.82025909423828, 102.2430648803711, 105.6658706665039, 109.08867645263672, 112.51148986816406, 115.93429565429688, 119.35710144042969, 122.7799072265625, 126.20271301269531]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 12.0, 9.0, 17.0, 10.0, 38.0, 33.0, 40.0, 49.0, 75.0, 74.0, 56.0, 76.0, 70.0, 77.0, 66.0, 60.0, 45.0, 37.0, 39.0, 23.0, 25.0, 19.0, 12.0, 11.0, 3.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.665313720703125, -58.071136474609375, -55.47695541381836, -52.882774353027344, -50.288597106933594, -47.694419860839844, -45.10023880004883, -42.50605773925781, -39.91188049316406, -37.31770324707031, -34.7235221862793, -32.12934112548828, -29.53516387939453, -26.94098472595215, -24.346805572509766, -21.752626419067383, -19.158447265625, -16.564268112182617, -13.970088958740234, -11.375909805297852, -8.781730651855469, -6.187551498413086, -3.593372344970703, -0.9991931915283203, 1.5949859619140625, 4.189165115356445, 6.783344268798828, 9.377523422241211, 11.971702575683594, 14.565881729125977, 17.16006088256836, 19.754240036010742, 22.348426818847656, 24.94260597229004, 27.536785125732422, 30.130964279174805, 32.72514343261719, 35.31932067871094, 37.91350173950195, 40.50768280029297, 43.10186004638672, 45.69603729248047, 48.290218353271484, 50.8843994140625, 53.47857666015625, 56.07275390625, 58.666934967041016, 61.26111602783203, 63.85529327392578, 66.44947052001953, 69.04365539550781, 71.63783264160156, 74.23200988769531, 76.82618713378906, 79.42036437988281, 82.0145492553711, 84.60872650146484, 87.2029037475586, 89.79708862304688, 92.39126586914062, 94.98544311523438, 97.57962036132812, 100.17379760742188, 102.76798248291016, 105.3621597290039]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 11.0, 16.0, 32.0, 41.0, 63.0, 139.0, 260.0, 769.0, 4390.0, 49761.0, 3927023.0, 195983.0, 12674.0, 2039.0, 586.0, 227.0, 97.0, 64.0, 46.0, 21.0, 14.0, 10.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.9375, -90.548828125, -87.16015625, -83.771484375, -80.3828125, -76.994140625, -73.60546875, -70.216796875, -66.828125, -63.439453125, -60.05078125, -56.662109375, -53.2734375, -49.884765625, -46.49609375, -43.107421875, -39.71875, -36.330078125, -32.94140625, -29.552734375, -26.1640625, -22.775390625, -19.38671875, -15.998046875, -12.609375, -9.220703125, -5.83203125, -2.443359375, 0.9453125, 4.333984375, 7.72265625, 11.111328125, 14.5, 17.888671875, 21.27734375, 24.666015625, 28.0546875, 31.443359375, 34.83203125, 38.220703125, 41.609375, 44.998046875, 48.38671875, 51.775390625, 55.1640625, 58.552734375, 61.94140625, 65.330078125, 68.71875, 72.107421875, 75.49609375, 78.884765625, 82.2734375, 85.662109375, 89.05078125, 92.439453125, 95.828125, 99.216796875, 102.60546875, 105.994140625, 109.3828125, 112.771484375, 116.16015625, 119.548828125, 122.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 13.0, 27.0, 24.0, 38.0, 53.0, 66.0, 57.0, 70.0, 84.0, 105.0, 87.0, 71.0, 65.0, 49.0, 53.0, 43.0, 29.0, 20.0, 12.0, 4.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.9500732421875, -1.870849609375, -1.7916259765625, -1.71240234375, -1.6331787109375, -1.553955078125, -1.4747314453125, -1.3955078125, -1.3162841796875, -1.237060546875, -1.1578369140625, -1.07861328125, -0.9993896484375, -0.920166015625, -0.8409423828125, -0.76171875, -0.6824951171875, -0.603271484375, -0.5240478515625, -0.44482421875, -0.3656005859375, -0.286376953125, -0.2071533203125, -0.1279296875, -0.0487060546875, 0.030517578125, 0.1097412109375, 0.18896484375, 0.2681884765625, 0.347412109375, 0.4266357421875, 0.505859375, 0.5850830078125, 0.664306640625, 0.7435302734375, 0.82275390625, 0.9019775390625, 0.981201171875, 1.0604248046875, 1.1396484375, 1.2188720703125, 1.298095703125, 1.3773193359375, 1.45654296875, 1.5357666015625, 1.614990234375, 1.6942138671875, 1.7734375, 1.8526611328125, 1.931884765625, 2.0111083984375, 2.09033203125, 2.1695556640625, 2.248779296875, 2.3280029296875, 2.4072265625, 2.4864501953125, 2.565673828125, 2.6448974609375, 2.72412109375, 2.8033447265625, 2.882568359375, 2.9617919921875, 3.041015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 31.0, 24.0, 57.0, 92.0, 163.0, 380.0, 1082.0, 3551.0, 14766.0, 80039.0, 961414.0, 3007361.0, 101362.0, 17732.0, 4256.0, 1163.0, 384.0, 191.0, 84.0, 60.0, 31.0, 12.0, 15.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.96875, -52.173828125, -50.37890625, -48.583984375, -46.7890625, -44.994140625, -43.19921875, -41.404296875, -39.609375, -37.814453125, -36.01953125, -34.224609375, -32.4296875, -30.634765625, -28.83984375, -27.044921875, -25.25, -23.455078125, -21.66015625, -19.865234375, -18.0703125, -16.275390625, -14.48046875, -12.685546875, -10.890625, -9.095703125, -7.30078125, -5.505859375, -3.7109375, -1.916015625, -0.12109375, 1.673828125, 3.46875, 5.263671875, 7.05859375, 8.853515625, 10.6484375, 12.443359375, 14.23828125, 16.033203125, 17.828125, 19.623046875, 21.41796875, 23.212890625, 25.0078125, 26.802734375, 28.59765625, 30.392578125, 32.1875, 33.982421875, 35.77734375, 37.572265625, 39.3671875, 41.162109375, 42.95703125, 44.751953125, 46.546875, 48.341796875, 50.13671875, 51.931640625, 53.7265625, 55.521484375, 57.31640625, 59.111328125, 60.90625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 8.0, 11.0, 6.0, 14.0, 13.0, 19.0, 39.0, 43.0, 56.0, 90.0, 90.0, 126.0, 206.0, 494.0, 1862.0, 365.0, 210.0, 106.0, 83.0, 75.0, 35.0, 29.0, 16.0, 19.0, 15.0, 17.0, 8.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -6.02227783203125, -5.8101806640625, -5.59808349609375, -5.385986328125, -5.17388916015625, -4.9617919921875, -4.74969482421875, -4.53759765625, -4.32550048828125, -4.1134033203125, -3.90130615234375, -3.689208984375, -3.47711181640625, -3.2650146484375, -3.05291748046875, -2.8408203125, -2.62872314453125, -2.4166259765625, -2.20452880859375, -1.992431640625, -1.78033447265625, -1.5682373046875, -1.35614013671875, -1.14404296875, -0.93194580078125, -0.7198486328125, -0.50775146484375, -0.295654296875, -0.08355712890625, 0.1285400390625, 0.34063720703125, 0.552734375, 0.76483154296875, 0.9769287109375, 1.18902587890625, 1.401123046875, 1.61322021484375, 1.8253173828125, 2.03741455078125, 2.24951171875, 2.46160888671875, 2.6737060546875, 2.88580322265625, 3.097900390625, 3.30999755859375, 3.5220947265625, 3.73419189453125, 3.9462890625, 4.15838623046875, 4.3704833984375, 4.58258056640625, 4.794677734375, 5.00677490234375, 5.2188720703125, 5.43096923828125, 5.64306640625, 5.85516357421875, 6.0672607421875, 6.27935791015625, 6.491455078125, 6.70355224609375, 6.9156494140625, 7.12774658203125, 7.33984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 16.0, 14.0, 27.0, 35.0, 51.0, 73.0, 103.0, 129.0, 119.0, 116.0, 106.0, 74.0, 41.0, 26.0, 15.0, 20.0, 6.0, 4.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.21955108642578, -30.569355010986328, -28.919158935546875, -27.268962860107422, -25.6187686920166, -23.96857261657715, -22.318376541137695, -20.668182373046875, -19.017986297607422, -17.36779022216797, -15.717595100402832, -14.067399024963379, -12.417203903198242, -10.767007827758789, -9.116811752319336, -7.466616630554199, -5.81641960144043, -4.166224002838135, -2.5160281658172607, -0.8658323287963867, 0.7843632698059082, 2.434558868408203, 4.084754943847656, 5.734950065612793, 7.385146141052246, 9.0353422164917, 10.685537338256836, 12.335733413696289, 13.985929489135742, 15.636124610900879, 17.286319732666016, 18.93651580810547, 20.586711883544922, 22.236907958984375, 23.887104034423828, 25.53730010986328, 27.1874942779541, 28.837690353393555, 30.487886428833008, 32.13808059692383, 33.78827667236328, 35.438472747802734, 37.08866882324219, 38.73886489868164, 40.389060974121094, 42.03925323486328, 43.689453125, 45.33964538574219, 46.989845275878906, 48.64004135131836, 50.29023742675781, 51.940433502197266, 53.59062957763672, 55.240821838378906, 56.891021728515625, 58.54121398925781, 60.191410064697266, 61.84160614013672, 63.49180221557617, 65.14199829101562, 66.79219055175781, 68.44239044189453, 70.09258270263672, 71.74278259277344, 73.39297485351562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 4.0, 9.0, 10.0, 11.0, 15.0, 19.0, 19.0, 16.0, 26.0, 28.0, 29.0, 38.0, 29.0, 38.0, 42.0, 43.0, 36.0, 57.0, 50.0, 65.0, 53.0, 48.0, 38.0, 37.0, 37.0, 33.0, 29.0, 21.0, 19.0, 17.0, 27.0, 8.0, 10.0, 4.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-31.966903686523438, -31.10605812072754, -30.245210647583008, -29.38436508178711, -28.52351951599121, -27.662673950195312, -26.80182647705078, -25.940980911254883, -25.080135345458984, -24.219289779663086, -23.358442306518555, -22.497596740722656, -21.636751174926758, -20.77590560913086, -19.915058135986328, -19.05421257019043, -18.19336700439453, -17.332521438598633, -16.4716739654541, -15.610828399658203, -14.749982833862305, -13.88913631439209, -13.028289794921875, -12.167444229125977, -11.306596755981445, -10.44575023651123, -9.584904670715332, -8.724058151245117, -7.863212585449219, -7.002366065979004, -6.141520023345947, -5.280673980712891, -4.419828414916992, -3.5589823722839355, -2.698136329650879, -1.8372900485992432, -0.9764440059661865, -0.11559772491455078, 0.7452483177185059, 1.6060943603515625, 2.466940402984619, 3.327786445617676, 4.188632488250732, 5.049478530883789, 5.910325050354004, 6.7711710929870605, 7.632017135620117, 8.492862701416016, 9.35370922088623, 10.214555740356445, 11.075401306152344, 11.936247825622559, 12.797093391418457, 13.657939910888672, 14.51878547668457, 15.379631996154785, 16.240478515625, 17.1013240814209, 17.96217155456543, 18.823017120361328, 19.683862686157227, 20.544708251953125, 21.405555725097656, 22.266401290893555, 23.127246856689453]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 2.0, 9.0, 11.0, 12.0, 21.0, 35.0, 32.0, 47.0, 80.0, 87.0, 174.0, 246.0, 442.0, 711.0, 1556.0, 3586.0, 10875.0, 39895.0, 161917.0, 476233.0, 260279.0, 65422.0, 17127.0, 5375.0, 2068.0, 914.0, 481.0, 290.0, 180.0, 126.0, 83.0, 64.0, 38.0, 36.0, 24.0, 15.0, 7.0, 12.0, 12.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-27.578125, -26.80517578125, -26.0322265625, -25.25927734375, -24.486328125, -23.71337890625, -22.9404296875, -22.16748046875, -21.39453125, -20.62158203125, -19.8486328125, -19.07568359375, -18.302734375, -17.52978515625, -16.7568359375, -15.98388671875, -15.2109375, -14.43798828125, -13.6650390625, -12.89208984375, -12.119140625, -11.34619140625, -10.5732421875, -9.80029296875, -9.02734375, -8.25439453125, -7.4814453125, -6.70849609375, -5.935546875, -5.16259765625, -4.3896484375, -3.61669921875, -2.84375, -2.07080078125, -1.2978515625, -0.52490234375, 0.248046875, 1.02099609375, 1.7939453125, 2.56689453125, 3.33984375, 4.11279296875, 4.8857421875, 5.65869140625, 6.431640625, 7.20458984375, 7.9775390625, 8.75048828125, 9.5234375, 10.29638671875, 11.0693359375, 11.84228515625, 12.615234375, 13.38818359375, 14.1611328125, 14.93408203125, 15.70703125, 16.47998046875, 17.2529296875, 18.02587890625, 18.798828125, 19.57177734375, 20.3447265625, 21.11767578125, 21.890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 11.0, 27.0, 42.0, 60.0, 58.0, 105.0, 121.0, 109.0, 110.0, 94.0, 72.0, 62.0, 37.0, 40.0, 13.0, 13.0, 4.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.429168701171875, -3.30950927734375, -3.189849853515625, -3.0701904296875, -2.950531005859375, -2.83087158203125, -2.711212158203125, -2.591552734375, -2.471893310546875, -2.35223388671875, -2.232574462890625, -2.1129150390625, -1.993255615234375, -1.87359619140625, -1.753936767578125, -1.63427734375, -1.514617919921875, -1.39495849609375, -1.275299072265625, -1.1556396484375, -1.035980224609375, -0.91632080078125, -0.796661376953125, -0.677001953125, -0.557342529296875, -0.43768310546875, -0.318023681640625, -0.1983642578125, -0.078704833984375, 0.04095458984375, 0.160614013671875, 0.2802734375, 0.399932861328125, 0.51959228515625, 0.639251708984375, 0.7589111328125, 0.878570556640625, 0.99822998046875, 1.117889404296875, 1.237548828125, 1.357208251953125, 1.47686767578125, 1.596527099609375, 1.7161865234375, 1.835845947265625, 1.95550537109375, 2.075164794921875, 2.19482421875, 2.314483642578125, 2.43414306640625, 2.553802490234375, 2.6734619140625, 2.793121337890625, 2.91278076171875, 3.032440185546875, 3.152099609375, 3.271759033203125, 3.39141845703125, 3.511077880859375, 3.6307373046875, 3.750396728515625, 3.87005615234375, 3.989715576171875, 4.109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 19.0, 16.0, 24.0, 33.0, 46.0, 75.0, 118.0, 167.0, 245.0, 404.0, 721.0, 1397.0, 2684.0, 5500.0, 14358.0, 40619.0, 127652.0, 383418.0, 314377.0, 101647.0, 33104.0, 11827.0, 4702.0, 2365.0, 1187.0, 644.0, 410.0, 273.0, 156.0, 100.0, 75.0, 54.0, 37.0, 20.0, 17.0, 12.0, 17.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-20.484375, -19.880126953125, -19.27587890625, -18.671630859375, -18.0673828125, -17.463134765625, -16.85888671875, -16.254638671875, -15.650390625, -15.046142578125, -14.44189453125, -13.837646484375, -13.2333984375, -12.629150390625, -12.02490234375, -11.420654296875, -10.81640625, -10.212158203125, -9.60791015625, -9.003662109375, -8.3994140625, -7.795166015625, -7.19091796875, -6.586669921875, -5.982421875, -5.378173828125, -4.77392578125, -4.169677734375, -3.5654296875, -2.961181640625, -2.35693359375, -1.752685546875, -1.1484375, -0.544189453125, 0.06005859375, 0.664306640625, 1.2685546875, 1.872802734375, 2.47705078125, 3.081298828125, 3.685546875, 4.289794921875, 4.89404296875, 5.498291015625, 6.1025390625, 6.706787109375, 7.31103515625, 7.915283203125, 8.51953125, 9.123779296875, 9.72802734375, 10.332275390625, 10.9365234375, 11.540771484375, 12.14501953125, 12.749267578125, 13.353515625, 13.957763671875, 14.56201171875, 15.166259765625, 15.7705078125, 16.374755859375, 16.97900390625, 17.583251953125, 18.1875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 9.0, 9.0, 8.0, 7.0, 10.0, 23.0, 20.0, 15.0, 33.0, 28.0, 33.0, 43.0, 41.0, 36.0, 42.0, 46.0, 46.0, 53.0, 50.0, 44.0, 48.0, 44.0, 45.0, 41.0, 32.0, 28.0, 18.0, 22.0, 23.0, 20.0, 14.0, 18.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.3702392578125, -9.045166015625, -8.7200927734375, -8.39501953125, -8.0699462890625, -7.744873046875, -7.4197998046875, -7.0947265625, -6.7696533203125, -6.444580078125, -6.1195068359375, -5.79443359375, -5.4693603515625, -5.144287109375, -4.8192138671875, -4.494140625, -4.1690673828125, -3.843994140625, -3.5189208984375, -3.19384765625, -2.8687744140625, -2.543701171875, -2.2186279296875, -1.8935546875, -1.5684814453125, -1.243408203125, -0.9183349609375, -0.59326171875, -0.2681884765625, 0.056884765625, 0.3819580078125, 0.70703125, 1.0321044921875, 1.357177734375, 1.6822509765625, 2.00732421875, 2.3323974609375, 2.657470703125, 2.9825439453125, 3.3076171875, 3.6326904296875, 3.957763671875, 4.2828369140625, 4.60791015625, 4.9329833984375, 5.258056640625, 5.5831298828125, 5.908203125, 6.2332763671875, 6.558349609375, 6.8834228515625, 7.20849609375, 7.5335693359375, 7.858642578125, 8.1837158203125, 8.5087890625, 8.8338623046875, 9.158935546875, 9.4840087890625, 9.80908203125, 10.1341552734375, 10.459228515625, 10.7843017578125, 11.109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 7.0, 6.0, 8.0, 15.0, 8.0, 30.0, 46.0, 60.0, 161.0, 298.0, 755.0, 2100.0, 8755.0, 55960.0, 504636.0, 419797.0, 45333.0, 7437.0, 1956.0, 611.0, 270.0, 129.0, 63.0, 44.0, 19.0, 16.0, 17.0, 11.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.761474609375, -17.14794921875, -16.534423828125, -15.9208984375, -15.307373046875, -14.69384765625, -14.080322265625, -13.466796875, -12.853271484375, -12.23974609375, -11.626220703125, -11.0126953125, -10.399169921875, -9.78564453125, -9.172119140625, -8.55859375, -7.945068359375, -7.33154296875, -6.718017578125, -6.1044921875, -5.490966796875, -4.87744140625, -4.263916015625, -3.650390625, -3.036865234375, -2.42333984375, -1.809814453125, -1.1962890625, -0.582763671875, 0.03076171875, 0.644287109375, 1.2578125, 1.871337890625, 2.48486328125, 3.098388671875, 3.7119140625, 4.325439453125, 4.93896484375, 5.552490234375, 6.166015625, 6.779541015625, 7.39306640625, 8.006591796875, 8.6201171875, 9.233642578125, 9.84716796875, 10.460693359375, 11.07421875, 11.687744140625, 12.30126953125, 12.914794921875, 13.5283203125, 14.141845703125, 14.75537109375, 15.368896484375, 15.982421875, 16.595947265625, 17.20947265625, 17.822998046875, 18.4365234375, 19.050048828125, 19.66357421875, 20.277099609375, 20.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 4.0, 4.0, 7.0, 16.0, 13.0, 21.0, 17.0, 22.0, 34.0, 38.0, 39.0, 52.0, 70.0, 96.0, 83.0, 91.0, 74.0, 56.0, 49.0, 30.0, 40.0, 30.0, 23.0, 17.0, 13.0, 6.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0014314651489257812, -0.0013904869556427002, -0.0013495087623596191, -0.001308530569076538, -0.001267552375793457, -0.001226574182510376, -0.001185595989227295, -0.0011446177959442139, -0.0011036396026611328, -0.0010626614093780518, -0.0010216832160949707, -0.0009807050228118896, -0.0009397268295288086, -0.0008987486362457275, -0.0008577704429626465, -0.0008167922496795654, -0.0007758140563964844, -0.0007348358631134033, -0.0006938576698303223, -0.0006528794765472412, -0.0006119012832641602, -0.0005709230899810791, -0.000529944896697998, -0.000488966703414917, -0.00044798851013183594, -0.0004070103168487549, -0.00036603212356567383, -0.0003250539302825928, -0.0002840757369995117, -0.00024309754371643066, -0.0002021193504333496, -0.00016114115715026855, -0.0001201629638671875, -7.918477058410645e-05, -3.820657730102539e-05, 2.771615982055664e-06, 4.374980926513672e-05, 8.472800254821777e-05, 0.00012570619583129883, 0.00016668438911437988, 0.00020766258239746094, 0.000248640775680542, 0.00028961896896362305, 0.0003305971622467041, 0.00037157535552978516, 0.0004125535488128662, 0.00045353174209594727, 0.0004945099353790283, 0.0005354881286621094, 0.0005764663219451904, 0.0006174445152282715, 0.0006584227085113525, 0.0006994009017944336, 0.0007403790950775146, 0.0007813572883605957, 0.0008223354816436768, 0.0008633136749267578, 0.0009042918682098389, 0.0009452700614929199, 0.000986248254776001, 0.001027226448059082, 0.001068204641342163, 0.0011091828346252441, 0.0011501610279083252, 0.0011911392211914062]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 9.0, 17.0, 19.0, 43.0, 52.0, 87.0, 118.0, 221.0, 469.0, 1142.0, 3407.0, 13912.0, 98625.0, 694438.0, 204978.0, 23367.0, 4960.0, 1506.0, 554.0, 263.0, 125.0, 73.0, 63.0, 31.0, 20.0, 12.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.2177734375, -23.498046875, -22.7783203125, -22.05859375, -21.3388671875, -20.619140625, -19.8994140625, -19.1796875, -18.4599609375, -17.740234375, -17.0205078125, -16.30078125, -15.5810546875, -14.861328125, -14.1416015625, -13.421875, -12.7021484375, -11.982421875, -11.2626953125, -10.54296875, -9.8232421875, -9.103515625, -8.3837890625, -7.6640625, -6.9443359375, -6.224609375, -5.5048828125, -4.78515625, -4.0654296875, -3.345703125, -2.6259765625, -1.90625, -1.1865234375, -0.466796875, 0.2529296875, 0.97265625, 1.6923828125, 2.412109375, 3.1318359375, 3.8515625, 4.5712890625, 5.291015625, 6.0107421875, 6.73046875, 7.4501953125, 8.169921875, 8.8896484375, 9.609375, 10.3291015625, 11.048828125, 11.7685546875, 12.48828125, 13.2080078125, 13.927734375, 14.6474609375, 15.3671875, 16.0869140625, 16.806640625, 17.5263671875, 18.24609375, 18.9658203125, 19.685546875, 20.4052734375, 21.125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 26.0, 38.0, 66.0, 97.0, 126.0, 132.0, 131.0, 115.0, 74.0, 63.0, 41.0, 26.0, 13.0, 13.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.71875, -16.36932373046875, -16.0198974609375, -15.67047119140625, -15.321044921875, -14.97161865234375, -14.6221923828125, -14.27276611328125, -13.92333984375, -13.57391357421875, -13.2244873046875, -12.87506103515625, -12.525634765625, -12.17620849609375, -11.8267822265625, -11.47735595703125, -11.1279296875, -10.77850341796875, -10.4290771484375, -10.07965087890625, -9.730224609375, -9.38079833984375, -9.0313720703125, -8.68194580078125, -8.33251953125, -7.98309326171875, -7.6336669921875, -7.28424072265625, -6.934814453125, -6.58538818359375, -6.2359619140625, -5.88653564453125, -5.537109375, -5.18768310546875, -4.8382568359375, -4.48883056640625, -4.139404296875, -3.78997802734375, -3.4405517578125, -3.09112548828125, -2.74169921875, -2.39227294921875, -2.0428466796875, -1.69342041015625, -1.343994140625, -0.99456787109375, -0.6451416015625, -0.29571533203125, 0.0537109375, 0.40313720703125, 0.7525634765625, 1.10198974609375, 1.451416015625, 1.80084228515625, 2.1502685546875, 2.49969482421875, 2.84912109375, 3.19854736328125, 3.5479736328125, 3.89739990234375, 4.246826171875, 4.59625244140625, 4.9456787109375, 5.29510498046875, 5.64453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 16.0, 27.0, 77.0, 220.0, 328.0, 215.0, 86.0, 31.0, 6.0, 5.0, 2.0, 1.0, 1.0], "bins": [-496.0281982421875, -487.0992431640625, -478.1703186035156, -469.2413635253906, -460.31243896484375, -451.38348388671875, -442.45452880859375, -433.5256042480469, -424.5966491699219, -415.6676940917969, -406.73876953125, -397.809814453125, -388.880859375, -379.9519348144531, -371.0229797363281, -362.09405517578125, -353.16510009765625, -344.23614501953125, -335.3072204589844, -326.3782653808594, -317.4493408203125, -308.5203857421875, -299.5914306640625, -290.6625061035156, -281.7335510253906, -272.8045959472656, -263.87567138671875, -254.94671630859375, -246.0177764892578, -237.08883666992188, -228.15988159179688, -219.23094177246094, -210.30198669433594, -201.373046875, -192.444091796875, -183.51515197753906, -174.58621215820312, -165.6572723388672, -156.72833251953125, -147.79937744140625, -138.8704376220703, -129.94149780273438, -121.0125503540039, -112.08360290527344, -103.1546630859375, -94.22572326660156, -85.2967758178711, -76.36782836914062, -67.43888854980469, -58.509944915771484, -49.58100128173828, -40.65205764770508, -31.723114013671875, -22.794170379638672, -13.865226745605469, -4.936283111572266, 3.9926605224609375, 12.92160415649414, 21.850547790527344, 30.779491424560547, 39.70843505859375, 48.63737869262695, 57.566322326660156, 66.49526977539062, 75.42420959472656]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 10.0, 7.0, 10.0, 12.0, 19.0, 20.0, 18.0, 16.0, 26.0, 40.0, 44.0, 41.0, 52.0, 45.0, 49.0, 62.0, 51.0, 51.0, 51.0, 47.0, 36.0, 39.0, 37.0, 43.0, 28.0, 22.0, 22.0, 9.0, 14.0, 15.0, 14.0, 9.0, 4.0, 3.0, 9.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-84.17637634277344, -81.90940856933594, -79.64244842529297, -77.37548065185547, -75.10851287841797, -72.841552734375, -70.5745849609375, -68.3076171875, -66.0406494140625, -63.773685455322266, -61.506717681884766, -59.23975372314453, -56.97278594970703, -54.7058219909668, -52.43885803222656, -50.17189025878906, -47.904930114746094, -45.63796615600586, -43.37099838256836, -41.104034423828125, -38.837066650390625, -36.57010269165039, -34.303138732910156, -32.036170959472656, -29.769207000732422, -27.502241134643555, -25.235275268554688, -22.968311309814453, -20.701345443725586, -18.43437957763672, -16.167415618896484, -13.900449752807617, -11.633476257324219, -9.366510391235352, -7.099545478820801, -4.832580089569092, -2.565614700317383, -0.2986488342285156, 1.9683160781860352, 4.235280990600586, 6.502246856689453, 8.76921272277832, 11.036177635192871, 13.303142547607422, 15.570108413696289, 17.837074279785156, 20.10403823852539, 22.371004104614258, 24.637969970703125, 26.904935836791992, 29.17190170288086, 31.438865661621094, 33.705833435058594, 35.97279739379883, 38.23976135253906, 40.50672912597656, 42.7736930847168, 45.04065704345703, 47.30762481689453, 49.574588775634766, 51.841552734375, 54.1085205078125, 56.375484466552734, 58.64244842529297, 60.90941619873047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 0.0, 5.0, 4.0, 16.0, 22.0, 31.0, 49.0, 70.0, 130.0, 255.0, 560.0, 1527.0, 5085.0, 25281.0, 387373.0, 3708611.0, 52843.0, 8640.0, 2189.0, 779.0, 346.0, 173.0, 105.0, 60.0, 43.0, 36.0, 12.0, 15.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.0625, -58.072265625, -56.08203125, -54.091796875, -52.1015625, -50.111328125, -48.12109375, -46.130859375, -44.140625, -42.150390625, -40.16015625, -38.169921875, -36.1796875, -34.189453125, -32.19921875, -30.208984375, -28.21875, -26.228515625, -24.23828125, -22.248046875, -20.2578125, -18.267578125, -16.27734375, -14.287109375, -12.296875, -10.306640625, -8.31640625, -6.326171875, -4.3359375, -2.345703125, -0.35546875, 1.634765625, 3.625, 5.615234375, 7.60546875, 9.595703125, 11.5859375, 13.576171875, 15.56640625, 17.556640625, 19.546875, 21.537109375, 23.52734375, 25.517578125, 27.5078125, 29.498046875, 31.48828125, 33.478515625, 35.46875, 37.458984375, 39.44921875, 41.439453125, 43.4296875, 45.419921875, 47.41015625, 49.400390625, 51.390625, 53.380859375, 55.37109375, 57.361328125, 59.3515625, 61.341796875, 63.33203125, 65.322265625, 67.3125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 3.0, 2.0, 2.0, 7.0, 10.0, 11.0, 11.0, 26.0, 16.0, 49.0, 39.0, 48.0, 58.0, 66.0, 72.0, 67.0, 65.0, 84.0, 69.0, 69.0, 50.0, 51.0, 27.0, 19.0, 18.0, 11.0, 14.0, 16.0, 6.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.962890625, -2.875946044921875, -2.78900146484375, -2.702056884765625, -2.6151123046875, -2.528167724609375, -2.44122314453125, -2.354278564453125, -2.267333984375, -2.180389404296875, -2.09344482421875, -2.006500244140625, -1.9195556640625, -1.832611083984375, -1.74566650390625, -1.658721923828125, -1.57177734375, -1.484832763671875, -1.39788818359375, -1.310943603515625, -1.2239990234375, -1.137054443359375, -1.05010986328125, -0.963165283203125, -0.876220703125, -0.789276123046875, -0.70233154296875, -0.615386962890625, -0.5284423828125, -0.441497802734375, -0.35455322265625, -0.267608642578125, -0.1806640625, -0.093719482421875, -0.00677490234375, 0.080169677734375, 0.1671142578125, 0.254058837890625, 0.34100341796875, 0.427947998046875, 0.514892578125, 0.601837158203125, 0.68878173828125, 0.775726318359375, 0.8626708984375, 0.949615478515625, 1.03656005859375, 1.123504638671875, 1.21044921875, 1.297393798828125, 1.38433837890625, 1.471282958984375, 1.5582275390625, 1.645172119140625, 1.73211669921875, 1.819061279296875, 1.906005859375, 1.992950439453125, 2.07989501953125, 2.166839599609375, 2.2537841796875, 2.340728759765625, 2.42767333984375, 2.514617919921875, 2.6015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 14.0, 20.0, 37.0, 61.0, 94.0, 177.0, 366.0, 769.0, 1862.0, 4734.0, 16425.0, 83836.0, 1416119.0, 2548224.0, 94046.0, 18358.0, 5359.0, 2012.0, 861.0, 406.0, 204.0, 115.0, 85.0, 39.0, 25.0, 16.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -42.19140625, -40.9140625, -39.63671875, -38.359375, -37.08203125, -35.8046875, -34.52734375, -33.25, -31.97265625, -30.6953125, -29.41796875, -28.140625, -26.86328125, -25.5859375, -24.30859375, -23.03125, -21.75390625, -20.4765625, -19.19921875, -17.921875, -16.64453125, -15.3671875, -14.08984375, -12.8125, -11.53515625, -10.2578125, -8.98046875, -7.703125, -6.42578125, -5.1484375, -3.87109375, -2.59375, -1.31640625, -0.0390625, 1.23828125, 2.515625, 3.79296875, 5.0703125, 6.34765625, 7.625, 8.90234375, 10.1796875, 11.45703125, 12.734375, 14.01171875, 15.2890625, 16.56640625, 17.84375, 19.12109375, 20.3984375, 21.67578125, 22.953125, 24.23046875, 25.5078125, 26.78515625, 28.0625, 29.33984375, 30.6171875, 31.89453125, 33.171875, 34.44921875, 35.7265625, 37.00390625, 38.28125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 12.0, 12.0, 20.0, 25.0, 37.0, 81.0, 125.0, 293.0, 753.0, 1874.0, 412.0, 156.0, 100.0, 54.0, 45.0, 14.0, 17.0, 12.0, 8.0, 3.0, 8.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.4552001953125, -9.152587890625, -8.8499755859375, -8.54736328125, -8.2447509765625, -7.942138671875, -7.6395263671875, -7.3369140625, -7.0343017578125, -6.731689453125, -6.4290771484375, -6.12646484375, -5.8238525390625, -5.521240234375, -5.2186279296875, -4.916015625, -4.6134033203125, -4.310791015625, -4.0081787109375, -3.70556640625, -3.4029541015625, -3.100341796875, -2.7977294921875, -2.4951171875, -2.1925048828125, -1.889892578125, -1.5872802734375, -1.28466796875, -0.9820556640625, -0.679443359375, -0.3768310546875, -0.07421875, 0.2283935546875, 0.531005859375, 0.8336181640625, 1.13623046875, 1.4388427734375, 1.741455078125, 2.0440673828125, 2.3466796875, 2.6492919921875, 2.951904296875, 3.2545166015625, 3.55712890625, 3.8597412109375, 4.162353515625, 4.4649658203125, 4.767578125, 5.0701904296875, 5.372802734375, 5.6754150390625, 5.97802734375, 6.2806396484375, 6.583251953125, 6.8858642578125, 7.1884765625, 7.4910888671875, 7.793701171875, 8.0963134765625, 8.39892578125, 8.7015380859375, 9.004150390625, 9.3067626953125, 9.609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 14.0, 17.0, 28.0, 51.0, 70.0, 118.0, 163.0, 167.0, 132.0, 112.0, 53.0, 31.0, 23.0, 11.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.6428451538086, -69.5374755859375, -67.4321060180664, -65.32673645019531, -63.22136306762695, -61.11599349975586, -59.010623931884766, -56.90525436401367, -54.79988098144531, -52.69451141357422, -50.589141845703125, -48.48377227783203, -46.37839889526367, -44.27302932739258, -42.167659759521484, -40.06229019165039, -37.9569206237793, -35.8515510559082, -33.74618148803711, -31.640810012817383, -29.535438537597656, -27.430068969726562, -25.32469940185547, -23.219329833984375, -21.11395835876465, -19.008588790893555, -16.903217315673828, -14.797847747802734, -12.692477226257324, -10.587106704711914, -8.48173713684082, -6.37636661529541, -4.270992279052734, -2.1656219959259033, -0.060251712799072266, 2.0451183319091797, 4.15048885345459, 6.255859375, 8.361228942871094, 10.466599464416504, 12.571969985961914, 14.677340507507324, 16.782711029052734, 18.888080596923828, 20.993450164794922, 23.09882164001465, 25.204191207885742, 27.30956268310547, 29.414932250976562, 31.520301818847656, 33.62567138671875, 35.731040954589844, 37.8364143371582, 39.9417839050293, 42.04715347290039, 44.152523040771484, 46.257896423339844, 48.36326599121094, 50.46863555908203, 52.574005126953125, 54.679378509521484, 56.78474807739258, 58.89011764526367, 60.995487213134766, 63.10085678100586]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 4.0, 14.0, 6.0, 18.0, 37.0, 30.0, 43.0, 73.0, 71.0, 98.0, 83.0, 94.0, 98.0, 74.0, 59.0, 57.0, 39.0, 42.0, 27.0, 11.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.262306213378906, -30.87497329711914, -29.487640380859375, -28.100309371948242, -26.712976455688477, -25.32564353942871, -23.938312530517578, -22.550979614257812, -21.163646697998047, -19.77631378173828, -18.388980865478516, -17.001649856567383, -15.614316940307617, -14.226984024047852, -12.839652061462402, -11.452320098876953, -10.064987182617188, -8.677654266357422, -7.290322303771973, -5.902989864349365, -4.515657424926758, -3.1283249855041504, -1.740992546081543, -0.35366058349609375, 1.0336723327636719, 2.4210047721862793, 3.8083372116088867, 5.195669651031494, 6.583002090454102, 7.970334529876709, 9.357666969299316, 10.744998931884766, 12.132331848144531, 13.519664764404297, 14.906996726989746, 16.294328689575195, 17.68166160583496, 19.068994522094727, 20.45632553100586, 21.843658447265625, 23.23099136352539, 24.618324279785156, 26.005657196044922, 27.392988204956055, 28.78032112121582, 30.167654037475586, 31.55498504638672, 32.942317962646484, 34.32965087890625, 35.716983795166016, 37.10431671142578, 38.49164962768555, 39.87898254394531, 41.26631164550781, 42.65364456176758, 44.040977478027344, 45.42831039428711, 46.815643310546875, 48.20297622680664, 49.590309143066406, 50.977638244628906, 52.36497116088867, 53.75230407714844, 55.1396369934082, 56.52696990966797]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 16.0, 16.0, 21.0, 35.0, 29.0, 56.0, 71.0, 96.0, 163.0, 219.0, 364.0, 643.0, 1160.0, 2351.0, 5808.0, 19027.0, 71520.0, 265729.0, 447576.0, 169658.0, 43502.0, 12206.0, 4087.0, 1781.0, 966.0, 503.0, 335.0, 187.0, 126.0, 77.0, 51.0, 40.0, 32.0, 19.0, 16.0, 16.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.375, -20.713623046875, -20.05224609375, -19.390869140625, -18.7294921875, -18.068115234375, -17.40673828125, -16.745361328125, -16.083984375, -15.422607421875, -14.76123046875, -14.099853515625, -13.4384765625, -12.777099609375, -12.11572265625, -11.454345703125, -10.79296875, -10.131591796875, -9.47021484375, -8.808837890625, -8.1474609375, -7.486083984375, -6.82470703125, -6.163330078125, -5.501953125, -4.840576171875, -4.17919921875, -3.517822265625, -2.8564453125, -2.195068359375, -1.53369140625, -0.872314453125, -0.2109375, 0.450439453125, 1.11181640625, 1.773193359375, 2.4345703125, 3.095947265625, 3.75732421875, 4.418701171875, 5.080078125, 5.741455078125, 6.40283203125, 7.064208984375, 7.7255859375, 8.386962890625, 9.04833984375, 9.709716796875, 10.37109375, 11.032470703125, 11.69384765625, 12.355224609375, 13.0166015625, 13.677978515625, 14.33935546875, 15.000732421875, 15.662109375, 16.323486328125, 16.98486328125, 17.646240234375, 18.3076171875, 18.968994140625, 19.63037109375, 20.291748046875, 20.953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 1.0, 5.0, 7.0, 14.0, 18.0, 22.0, 53.0, 43.0, 70.0, 80.0, 100.0, 98.0, 102.0, 95.0, 77.0, 52.0, 47.0, 40.0, 23.0, 18.0, 12.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.703460693359375, -2.58465576171875, -2.465850830078125, -2.3470458984375, -2.228240966796875, -2.10943603515625, -1.990631103515625, -1.871826171875, -1.753021240234375, -1.63421630859375, -1.515411376953125, -1.3966064453125, -1.277801513671875, -1.15899658203125, -1.040191650390625, -0.92138671875, -0.802581787109375, -0.68377685546875, -0.564971923828125, -0.4461669921875, -0.327362060546875, -0.20855712890625, -0.089752197265625, 0.029052734375, 0.147857666015625, 0.26666259765625, 0.385467529296875, 0.5042724609375, 0.623077392578125, 0.74188232421875, 0.860687255859375, 0.9794921875, 1.098297119140625, 1.21710205078125, 1.335906982421875, 1.4547119140625, 1.573516845703125, 1.69232177734375, 1.811126708984375, 1.929931640625, 2.048736572265625, 2.16754150390625, 2.286346435546875, 2.4051513671875, 2.523956298828125, 2.64276123046875, 2.761566162109375, 2.88037109375, 2.999176025390625, 3.11798095703125, 3.236785888671875, 3.3555908203125, 3.474395751953125, 3.59320068359375, 3.712005615234375, 3.830810546875, 3.949615478515625, 4.06842041015625, 4.187225341796875, 4.3060302734375, 4.424835205078125, 4.54364013671875, 4.662445068359375, 4.78125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 10.0, 12.0, 4.0, 8.0, 21.0, 22.0, 28.0, 43.0, 63.0, 68.0, 117.0, 163.0, 238.0, 338.0, 482.0, 821.0, 1497.0, 2928.0, 6018.0, 13807.0, 32886.0, 80919.0, 184810.0, 298212.0, 233529.0, 111256.0, 45316.0, 18408.0, 7966.0, 3731.0, 1870.0, 1024.0, 621.0, 381.0, 256.0, 213.0, 125.0, 93.0, 57.0, 52.0, 33.0, 33.0, 20.0, 16.0, 16.0, 11.0, 4.0, 4.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.44091796875, -10.1005859375, -9.76025390625, -9.419921875, -9.07958984375, -8.7392578125, -8.39892578125, -8.05859375, -7.71826171875, -7.3779296875, -7.03759765625, -6.697265625, -6.35693359375, -6.0166015625, -5.67626953125, -5.3359375, -4.99560546875, -4.6552734375, -4.31494140625, -3.974609375, -3.63427734375, -3.2939453125, -2.95361328125, -2.61328125, -2.27294921875, -1.9326171875, -1.59228515625, -1.251953125, -0.91162109375, -0.5712890625, -0.23095703125, 0.109375, 0.44970703125, 0.7900390625, 1.13037109375, 1.470703125, 1.81103515625, 2.1513671875, 2.49169921875, 2.83203125, 3.17236328125, 3.5126953125, 3.85302734375, 4.193359375, 4.53369140625, 4.8740234375, 5.21435546875, 5.5546875, 5.89501953125, 6.2353515625, 6.57568359375, 6.916015625, 7.25634765625, 7.5966796875, 7.93701171875, 8.27734375, 8.61767578125, 8.9580078125, 9.29833984375, 9.638671875, 9.97900390625, 10.3193359375, 10.65966796875, 11.0]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 5.0, 7.0, 6.0, 14.0, 11.0, 11.0, 17.0, 16.0, 34.0, 30.0, 29.0, 42.0, 30.0, 37.0, 40.0, 42.0, 49.0, 47.0, 44.0, 38.0, 43.0, 36.0, 34.0, 33.0, 47.0, 49.0, 27.0, 30.0, 24.0, 27.0, 25.0, 9.0, 8.0, 8.0, 10.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-9.0703125, -8.8079833984375, -8.545654296875, -8.2833251953125, -8.02099609375, -7.7586669921875, -7.496337890625, -7.2340087890625, -6.9716796875, -6.7093505859375, -6.447021484375, -6.1846923828125, -5.92236328125, -5.6600341796875, -5.397705078125, -5.1353759765625, -4.873046875, -4.6107177734375, -4.348388671875, -4.0860595703125, -3.82373046875, -3.5614013671875, -3.299072265625, -3.0367431640625, -2.7744140625, -2.5120849609375, -2.249755859375, -1.9874267578125, -1.72509765625, -1.4627685546875, -1.200439453125, -0.9381103515625, -0.67578125, -0.4134521484375, -0.151123046875, 0.1112060546875, 0.37353515625, 0.6358642578125, 0.898193359375, 1.1605224609375, 1.4228515625, 1.6851806640625, 1.947509765625, 2.2098388671875, 2.47216796875, 2.7344970703125, 2.996826171875, 3.2591552734375, 3.521484375, 3.7838134765625, 4.046142578125, 4.3084716796875, 4.57080078125, 4.8331298828125, 5.095458984375, 5.3577880859375, 5.6201171875, 5.8824462890625, 6.144775390625, 6.4071044921875, 6.66943359375, 6.9317626953125, 7.194091796875, 7.4564208984375, 7.71875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 14.0, 15.0, 13.0, 19.0, 31.0, 72.0, 104.0, 155.0, 210.0, 351.0, 641.0, 1199.0, 2685.0, 6208.0, 16692.0, 46269.0, 126360.0, 277033.0, 312074.0, 161155.0, 60854.0, 21627.0, 8199.0, 3138.0, 1522.0, 756.0, 394.0, 242.0, 158.0, 103.0, 72.0, 42.0, 43.0, 31.0, 10.0, 13.0, 11.0, 6.0, 6.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.45306396484375, -4.2889404296875, -4.12481689453125, -3.960693359375, -3.79656982421875, -3.6324462890625, -3.46832275390625, -3.30419921875, -3.14007568359375, -2.9759521484375, -2.81182861328125, -2.647705078125, -2.48358154296875, -2.3194580078125, -2.15533447265625, -1.9912109375, -1.82708740234375, -1.6629638671875, -1.49884033203125, -1.334716796875, -1.17059326171875, -1.0064697265625, -0.84234619140625, -0.67822265625, -0.51409912109375, -0.3499755859375, -0.18585205078125, -0.021728515625, 0.14239501953125, 0.3065185546875, 0.47064208984375, 0.634765625, 0.79888916015625, 0.9630126953125, 1.12713623046875, 1.291259765625, 1.45538330078125, 1.6195068359375, 1.78363037109375, 1.94775390625, 2.11187744140625, 2.2760009765625, 2.44012451171875, 2.604248046875, 2.76837158203125, 2.9324951171875, 3.09661865234375, 3.2607421875, 3.42486572265625, 3.5889892578125, 3.75311279296875, 3.917236328125, 4.08135986328125, 4.2454833984375, 4.40960693359375, 4.57373046875, 4.73785400390625, 4.9019775390625, 5.06610107421875, 5.230224609375, 5.39434814453125, 5.5584716796875, 5.72259521484375, 5.88671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 5.0, 5.0, 9.0, 6.0, 7.0, 8.0, 15.0, 14.0, 21.0, 25.0, 29.0, 47.0, 56.0, 67.0, 67.0, 93.0, 105.0, 77.0, 71.0, 38.0, 54.0, 36.0, 24.0, 21.0, 21.0, 12.0, 10.0, 17.0, 8.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009593963623046875, -0.0009296610951423645, -0.0008999258279800415, -0.0008701905608177185, -0.0008404552936553955, -0.0008107200264930725, -0.0007809847593307495, -0.0007512494921684265, -0.0007215142250061035, -0.0006917789578437805, -0.0006620436906814575, -0.0006323084235191345, -0.0006025731563568115, -0.0005728378891944885, -0.0005431026220321655, -0.0005133673548698425, -0.00048363208770751953, -0.00045389682054519653, -0.00042416155338287354, -0.00039442628622055054, -0.00036469101905822754, -0.00033495575189590454, -0.00030522048473358154, -0.00027548521757125854, -0.00024574995040893555, -0.00021601468324661255, -0.00018627941608428955, -0.00015654414892196655, -0.00012680888175964355, -9.707361459732056e-05, -6.733834743499756e-05, -3.760308027267456e-05, -7.867813110351562e-06, 2.1867454051971436e-05, 5.1602721214294434e-05, 8.133798837661743e-05, 0.00011107325553894043, 0.00014080852270126343, 0.00017054378986358643, 0.00020027905702590942, 0.00023001432418823242, 0.0002597495913505554, 0.0002894848585128784, 0.0003192201256752014, 0.0003489553928375244, 0.0003786906599998474, 0.0004084259271621704, 0.0004381611943244934, 0.0004678964614868164, 0.0004976317286491394, 0.0005273669958114624, 0.0005571022629737854, 0.0005868375301361084, 0.0006165727972984314, 0.0006463080644607544, 0.0006760433316230774, 0.0007057785987854004, 0.0007355138659477234, 0.0007652491331100464, 0.0007949844002723694, 0.0008247196674346924, 0.0008544549345970154, 0.0008841902017593384, 0.0009139254689216614, 0.0009436607360839844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 8.0, 5.0, 13.0, 15.0, 19.0, 27.0, 30.0, 54.0, 67.0, 95.0, 153.0, 186.0, 309.0, 477.0, 812.0, 1501.0, 2830.0, 5980.0, 13732.0, 35468.0, 95553.0, 232597.0, 326363.0, 201221.0, 79209.0, 29236.0, 11534.0, 5031.0, 2453.0, 1363.0, 788.0, 469.0, 299.0, 173.0, 141.0, 123.0, 54.0, 48.0, 27.0, 21.0, 17.0, 14.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0], "bins": [-5.33203125, -5.16748046875, -5.0029296875, -4.83837890625, -4.673828125, -4.50927734375, -4.3447265625, -4.18017578125, -4.015625, -3.85107421875, -3.6865234375, -3.52197265625, -3.357421875, -3.19287109375, -3.0283203125, -2.86376953125, -2.69921875, -2.53466796875, -2.3701171875, -2.20556640625, -2.041015625, -1.87646484375, -1.7119140625, -1.54736328125, -1.3828125, -1.21826171875, -1.0537109375, -0.88916015625, -0.724609375, -0.56005859375, -0.3955078125, -0.23095703125, -0.06640625, 0.09814453125, 0.2626953125, 0.42724609375, 0.591796875, 0.75634765625, 0.9208984375, 1.08544921875, 1.25, 1.41455078125, 1.5791015625, 1.74365234375, 1.908203125, 2.07275390625, 2.2373046875, 2.40185546875, 2.56640625, 2.73095703125, 2.8955078125, 3.06005859375, 3.224609375, 3.38916015625, 3.5537109375, 3.71826171875, 3.8828125, 4.04736328125, 4.2119140625, 4.37646484375, 4.541015625, 4.70556640625, 4.8701171875, 5.03466796875, 5.19921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 13.0, 7.0, 17.0, 14.0, 21.0, 21.0, 35.0, 27.0, 34.0, 33.0, 35.0, 48.0, 50.0, 60.0, 76.0, 68.0, 57.0, 54.0, 55.0, 54.0, 48.0, 20.0, 26.0, 26.0, 13.0, 18.0, 17.0, 13.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.48046875, -3.374359130859375, -3.26824951171875, -3.162139892578125, -3.0560302734375, -2.949920654296875, -2.84381103515625, -2.737701416015625, -2.631591796875, -2.525482177734375, -2.41937255859375, -2.313262939453125, -2.2071533203125, -2.101043701171875, -1.99493408203125, -1.888824462890625, -1.78271484375, -1.676605224609375, -1.57049560546875, -1.464385986328125, -1.3582763671875, -1.252166748046875, -1.14605712890625, -1.039947509765625, -0.933837890625, -0.827728271484375, -0.72161865234375, -0.615509033203125, -0.5093994140625, -0.403289794921875, -0.29718017578125, -0.191070556640625, -0.0849609375, 0.021148681640625, 0.12725830078125, 0.233367919921875, 0.3394775390625, 0.445587158203125, 0.55169677734375, 0.657806396484375, 0.763916015625, 0.870025634765625, 0.97613525390625, 1.082244873046875, 1.1883544921875, 1.294464111328125, 1.40057373046875, 1.506683349609375, 1.61279296875, 1.718902587890625, 1.82501220703125, 1.931121826171875, 2.0372314453125, 2.143341064453125, 2.24945068359375, 2.355560302734375, 2.461669921875, 2.567779541015625, 2.67388916015625, 2.779998779296875, 2.8861083984375, 2.992218017578125, 3.09832763671875, 3.204437255859375, 3.310546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 16.0, 33.0, 50.0, 59.0, 130.0, 128.0, 143.0, 133.0, 98.0, 73.0, 47.0, 27.0, 21.0, 17.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.74972534179688, -70.46208190917969, -67.1744384765625, -63.88679885864258, -60.599159240722656, -57.31151580810547, -54.02387237548828, -50.736228942871094, -47.44858932495117, -44.160945892333984, -40.87330627441406, -37.585662841796875, -34.29801940917969, -31.010379791259766, -27.722736358642578, -24.435094833374023, -21.14745330810547, -17.859811782836914, -14.572169303894043, -11.284526824951172, -7.996885299682617, -4.7092437744140625, -1.421600341796875, 1.8660411834716797, 5.153682708740234, 8.441324234008789, 11.72896671295166, 15.016609191894531, 18.304250717163086, 21.59189224243164, 24.879535675048828, 28.167177200317383, 31.454818725585938, 34.742462158203125, 38.03010177612305, 41.317745208740234, 44.605384826660156, 47.893028259277344, 51.18067169189453, 54.46831512451172, 57.75595474243164, 61.04359817504883, 64.33123779296875, 67.61888122558594, 70.90652465820312, 74.19416809082031, 77.4818115234375, 80.76944732666016, 84.05709075927734, 87.34473419189453, 90.63237762451172, 93.92001342773438, 97.20765686035156, 100.49530029296875, 103.78294372558594, 107.07058715820312, 110.35823059082031, 113.6458740234375, 116.93351745605469, 120.22116088867188, 123.50879669189453, 126.79644012451172, 130.08407592773438, 133.37171936035156, 136.65936279296875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 7.0, 14.0, 21.0, 23.0, 22.0, 38.0, 23.0, 41.0, 40.0, 46.0, 63.0, 59.0, 66.0, 71.0, 70.0, 42.0, 51.0, 49.0, 54.0, 42.0, 29.0, 30.0, 22.0, 19.0, 13.0, 12.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.11974334716797, -67.11236572265625, -65.10498046875, -63.09760284423828, -61.0902214050293, -59.08283996582031, -57.075462341308594, -55.06808090209961, -53.060699462890625, -51.05331802368164, -49.04594039916992, -47.03855895996094, -45.03117752075195, -43.02379608154297, -41.01641845703125, -39.009037017822266, -37.00165939331055, -34.99427795410156, -32.986900329589844, -30.97951889038086, -28.972137451171875, -26.964757919311523, -24.957378387451172, -22.949996948242188, -20.942617416381836, -18.935237884521484, -16.9278564453125, -14.920476913452148, -12.91309642791748, -10.905715942382812, -8.898336410522461, -6.890955924987793, -4.883579254150391, -2.8761990070343018, -0.8688187599182129, 1.1385612487792969, 3.145941734313965, 5.153322219848633, 7.160701751708984, 9.168082237243652, 11.17546272277832, 13.182843208312988, 15.190223693847656, 17.197603225708008, 19.20498275756836, 21.212364196777344, 23.219743728637695, 25.227123260498047, 27.23450469970703, 29.241884231567383, 31.249265670776367, 33.25664520263672, 35.2640266418457, 37.27140808105469, 39.278785705566406, 41.28616714477539, 43.293548583984375, 45.30093002319336, 47.30830764770508, 49.31568908691406, 51.32307052612305, 53.33045196533203, 55.33782958984375, 57.345211029052734, 59.35258865356445]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 14.0, 21.0, 24.0, 42.0, 52.0, 90.0, 138.0, 182.0, 343.0, 653.0, 1317.0, 3203.0, 9775.0, 41473.0, 537638.0, 3511248.0, 67167.0, 13597.0, 3940.0, 1550.0, 692.0, 397.0, 248.0, 130.0, 87.0, 49.0, 61.0, 30.0, 13.0, 29.0, 13.0, 10.0, 8.0, 13.0, 4.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-32.0625, -30.9619140625, -29.861328125, -28.7607421875, -27.66015625, -26.5595703125, -25.458984375, -24.3583984375, -23.2578125, -22.1572265625, -21.056640625, -19.9560546875, -18.85546875, -17.7548828125, -16.654296875, -15.5537109375, -14.453125, -13.3525390625, -12.251953125, -11.1513671875, -10.05078125, -8.9501953125, -7.849609375, -6.7490234375, -5.6484375, -4.5478515625, -3.447265625, -2.3466796875, -1.24609375, -0.1455078125, 0.955078125, 2.0556640625, 3.15625, 4.2568359375, 5.357421875, 6.4580078125, 7.55859375, 8.6591796875, 9.759765625, 10.8603515625, 11.9609375, 13.0615234375, 14.162109375, 15.2626953125, 16.36328125, 17.4638671875, 18.564453125, 19.6650390625, 20.765625, 21.8662109375, 22.966796875, 24.0673828125, 25.16796875, 26.2685546875, 27.369140625, 28.4697265625, 29.5703125, 30.6708984375, 31.771484375, 32.8720703125, 33.97265625, 35.0732421875, 36.173828125, 37.2744140625, 38.375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 12.0, 15.0, 19.0, 19.0, 32.0, 47.0, 47.0, 53.0, 61.0, 72.0, 73.0, 76.0, 82.0, 66.0, 64.0, 58.0, 56.0, 35.0, 32.0, 16.0, 16.0, 12.0, 8.0, 5.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.50079345703125, -2.4019775390625, -2.30316162109375, -2.204345703125, -2.10552978515625, -2.0067138671875, -1.90789794921875, -1.80908203125, -1.71026611328125, -1.6114501953125, -1.51263427734375, -1.413818359375, -1.31500244140625, -1.2161865234375, -1.11737060546875, -1.0185546875, -0.91973876953125, -0.8209228515625, -0.72210693359375, -0.623291015625, -0.52447509765625, -0.4256591796875, -0.32684326171875, -0.22802734375, -0.12921142578125, -0.0303955078125, 0.06842041015625, 0.167236328125, 0.26605224609375, 0.3648681640625, 0.46368408203125, 0.5625, 0.66131591796875, 0.7601318359375, 0.85894775390625, 0.957763671875, 1.05657958984375, 1.1553955078125, 1.25421142578125, 1.35302734375, 1.45184326171875, 1.5506591796875, 1.64947509765625, 1.748291015625, 1.84710693359375, 1.9459228515625, 2.04473876953125, 2.1435546875, 2.24237060546875, 2.3411865234375, 2.44000244140625, 2.538818359375, 2.63763427734375, 2.7364501953125, 2.83526611328125, 2.93408203125, 3.03289794921875, 3.1317138671875, 3.23052978515625, 3.329345703125, 3.42816162109375, 3.5269775390625, 3.62579345703125, 3.724609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 6.0, 10.0, 11.0, 25.0, 21.0, 41.0, 42.0, 80.0, 88.0, 127.0, 177.0, 292.0, 532.0, 936.0, 1788.0, 3959.0, 10021.0, 32929.0, 144125.0, 2583833.0, 1250510.0, 120739.0, 28459.0, 8825.0, 3380.0, 1503.0, 709.0, 389.0, 223.0, 157.0, 107.0, 75.0, 38.0, 38.0, 20.0, 22.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.8564453125, -18.181640625, -17.5068359375, -16.83203125, -16.1572265625, -15.482421875, -14.8076171875, -14.1328125, -13.4580078125, -12.783203125, -12.1083984375, -11.43359375, -10.7587890625, -10.083984375, -9.4091796875, -8.734375, -8.0595703125, -7.384765625, -6.7099609375, -6.03515625, -5.3603515625, -4.685546875, -4.0107421875, -3.3359375, -2.6611328125, -1.986328125, -1.3115234375, -0.63671875, 0.0380859375, 0.712890625, 1.3876953125, 2.0625, 2.7373046875, 3.412109375, 4.0869140625, 4.76171875, 5.4365234375, 6.111328125, 6.7861328125, 7.4609375, 8.1357421875, 8.810546875, 9.4853515625, 10.16015625, 10.8349609375, 11.509765625, 12.1845703125, 12.859375, 13.5341796875, 14.208984375, 14.8837890625, 15.55859375, 16.2333984375, 16.908203125, 17.5830078125, 18.2578125, 18.9326171875, 19.607421875, 20.2822265625, 20.95703125, 21.6318359375, 22.306640625, 22.9814453125, 23.65625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 17.0, 20.0, 32.0, 50.0, 91.0, 175.0, 399.0, 1880.0, 791.0, 264.0, 139.0, 79.0, 54.0, 28.0, 22.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.21063232421875, -9.9603271484375, -9.71002197265625, -9.459716796875, -9.20941162109375, -8.9591064453125, -8.70880126953125, -8.45849609375, -8.20819091796875, -7.9578857421875, -7.70758056640625, -7.457275390625, -7.20697021484375, -6.9566650390625, -6.70635986328125, -6.4560546875, -6.20574951171875, -5.9554443359375, -5.70513916015625, -5.454833984375, -5.20452880859375, -4.9542236328125, -4.70391845703125, -4.45361328125, -4.20330810546875, -3.9530029296875, -3.70269775390625, -3.452392578125, -3.20208740234375, -2.9517822265625, -2.70147705078125, -2.451171875, -2.20086669921875, -1.9505615234375, -1.70025634765625, -1.449951171875, -1.19964599609375, -0.9493408203125, -0.69903564453125, -0.44873046875, -0.19842529296875, 0.0518798828125, 0.30218505859375, 0.552490234375, 0.80279541015625, 1.0531005859375, 1.30340576171875, 1.5537109375, 1.80401611328125, 2.0543212890625, 2.30462646484375, 2.554931640625, 2.80523681640625, 3.0555419921875, 3.30584716796875, 3.55615234375, 3.80645751953125, 4.0567626953125, 4.30706787109375, 4.557373046875, 4.80767822265625, 5.0579833984375, 5.30828857421875, 5.55859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 2.0, 7.0, 18.0, 11.0, 29.0, 25.0, 43.0, 46.0, 93.0, 100.0, 117.0, 105.0, 97.0, 100.0, 65.0, 47.0, 39.0, 21.0, 11.0, 11.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.752973556518555, -27.701313018798828, -26.649654388427734, -25.597993850708008, -24.54633331298828, -23.494674682617188, -22.44301414489746, -21.391353607177734, -20.33969497680664, -19.288034439086914, -18.23637580871582, -17.184715270996094, -16.133054733276367, -15.081395149230957, -14.029735565185547, -12.97807502746582, -11.926414489746094, -10.874754905700684, -9.823094367980957, -8.771434783935547, -7.7197747230529785, -6.66811466217041, -5.616455078125, -4.564795017242432, -3.5131349563598633, -2.461474895477295, -1.4098150730133057, -0.3581552505493164, 0.693504810333252, 1.7451648712158203, 2.7968244552612305, 3.848484516143799, 4.900142669677734, 5.951802730560303, 7.003462791442871, 8.055122375488281, 9.106782913208008, 10.158442497253418, 11.210102081298828, 12.261762619018555, 13.313422203063965, 14.365081787109375, 15.416742324829102, 16.468402862548828, 17.520061492919922, 18.57172203063965, 19.623382568359375, 20.67504119873047, 21.726701736450195, 22.778362274169922, 23.830020904541016, 24.881681442260742, 25.93334197998047, 26.985000610351562, 28.03666114807129, 29.088321685791016, 30.13998031616211, 31.191640853881836, 32.24330139160156, 33.294960021972656, 34.34661865234375, 35.39828109741211, 36.4499397277832, 37.5015983581543, 38.553260803222656]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 14.0, 5.0, 12.0, 8.0, 14.0, 11.0, 12.0, 13.0, 10.0, 12.0, 20.0, 22.0, 16.0, 34.0, 36.0, 23.0, 18.0, 33.0, 40.0, 26.0, 33.0, 54.0, 41.0, 37.0, 30.0, 42.0, 38.0, 30.0, 31.0, 29.0, 30.0, 23.0, 31.0, 41.0, 15.0, 16.0, 16.0, 16.0, 12.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.96296501159668, -15.47378921508789, -14.984614372253418, -14.495438575744629, -14.00626277923584, -13.517087936401367, -13.027912139892578, -12.538736343383789, -12.049560546875, -11.560384750366211, -11.071209907531738, -10.58203411102295, -10.09285831451416, -9.603683471679688, -9.114507675170898, -8.62533187866211, -8.136157035827637, -7.646981716156006, -7.157805919647217, -6.668630599975586, -6.179454803466797, -5.690279483795166, -5.201104164123535, -4.711928367614746, -4.222753047943115, -3.7335774898529053, -3.2444019317626953, -2.7552266120910645, -2.2660510540008545, -1.7768754959106445, -1.2877001762390137, -0.7985246181488037, -0.30934810638427734, 0.17982739210128784, 0.669002890586853, 1.1581783294677734, 1.6473538875579834, 2.1365294456481934, 2.625704765319824, 3.114880323410034, 3.604055881500244, 4.093231201171875, 4.582406997680664, 5.071582317352295, 5.560757637023926, 6.049933433532715, 6.539108753204346, 7.028284072875977, 7.517459869384766, 8.006635665893555, 8.495810508728027, 8.984986305236816, 9.474162101745605, 9.963336944580078, 10.452512741088867, 10.941688537597656, 11.430864334106445, 11.920040130615234, 12.409214973449707, 12.898390769958496, 13.387566566467285, 13.876741409301758, 14.365917205810547, 14.855093002319336, 15.344267845153809]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 13.0, 14.0, 24.0, 29.0, 29.0, 40.0, 48.0, 53.0, 97.0, 137.0, 221.0, 329.0, 596.0, 1049.0, 2310.0, 5913.0, 18109.0, 67582.0, 271669.0, 469183.0, 153685.0, 38502.0, 11209.0, 3882.0, 1663.0, 803.0, 439.0, 285.0, 205.0, 117.0, 83.0, 52.0, 41.0, 33.0, 33.0, 22.0, 14.0, 7.0, 7.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.056640625, -19.39453125, -18.732421875, -18.0703125, -17.408203125, -16.74609375, -16.083984375, -15.421875, -14.759765625, -14.09765625, -13.435546875, -12.7734375, -12.111328125, -11.44921875, -10.787109375, -10.125, -9.462890625, -8.80078125, -8.138671875, -7.4765625, -6.814453125, -6.15234375, -5.490234375, -4.828125, -4.166015625, -3.50390625, -2.841796875, -2.1796875, -1.517578125, -0.85546875, -0.193359375, 0.46875, 1.130859375, 1.79296875, 2.455078125, 3.1171875, 3.779296875, 4.44140625, 5.103515625, 5.765625, 6.427734375, 7.08984375, 7.751953125, 8.4140625, 9.076171875, 9.73828125, 10.400390625, 11.0625, 11.724609375, 12.38671875, 13.048828125, 13.7109375, 14.373046875, 15.03515625, 15.697265625, 16.359375, 17.021484375, 17.68359375, 18.345703125, 19.0078125, 19.669921875, 20.33203125, 20.994140625, 21.65625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 19.0, 19.0, 19.0, 41.0, 51.0, 51.0, 47.0, 71.0, 89.0, 83.0, 86.0, 79.0, 72.0, 78.0, 46.0, 35.0, 35.0, 24.0, 19.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.330078125, -3.21856689453125, -3.1070556640625, -2.99554443359375, -2.884033203125, -2.77252197265625, -2.6610107421875, -2.54949951171875, -2.43798828125, -2.32647705078125, -2.2149658203125, -2.10345458984375, -1.991943359375, -1.88043212890625, -1.7689208984375, -1.65740966796875, -1.5458984375, -1.43438720703125, -1.3228759765625, -1.21136474609375, -1.099853515625, -0.98834228515625, -0.8768310546875, -0.76531982421875, -0.65380859375, -0.54229736328125, -0.4307861328125, -0.31927490234375, -0.207763671875, -0.09625244140625, 0.0152587890625, 0.12677001953125, 0.23828125, 0.34979248046875, 0.4613037109375, 0.57281494140625, 0.684326171875, 0.79583740234375, 0.9073486328125, 1.01885986328125, 1.13037109375, 1.24188232421875, 1.3533935546875, 1.46490478515625, 1.576416015625, 1.68792724609375, 1.7994384765625, 1.91094970703125, 2.0224609375, 2.13397216796875, 2.2454833984375, 2.35699462890625, 2.468505859375, 2.58001708984375, 2.6915283203125, 2.80303955078125, 2.91455078125, 3.02606201171875, 3.1375732421875, 3.24908447265625, 3.360595703125, 3.47210693359375, 3.5836181640625, 3.69512939453125, 3.806640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 12.0, 11.0, 11.0, 19.0, 33.0, 42.0, 60.0, 68.0, 111.0, 167.0, 232.0, 338.0, 482.0, 760.0, 1352.0, 2387.0, 4731.0, 9774.0, 22522.0, 52419.0, 122348.0, 246607.0, 291300.0, 161688.0, 73082.0, 30936.0, 13238.0, 6180.0, 3110.0, 1647.0, 1010.0, 647.0, 399.0, 254.0, 153.0, 105.0, 81.0, 72.0, 42.0, 39.0, 23.0, 18.0, 9.0, 5.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-9.421875, -9.129150390625, -8.83642578125, -8.543701171875, -8.2509765625, -7.958251953125, -7.66552734375, -7.372802734375, -7.080078125, -6.787353515625, -6.49462890625, -6.201904296875, -5.9091796875, -5.616455078125, -5.32373046875, -5.031005859375, -4.73828125, -4.445556640625, -4.15283203125, -3.860107421875, -3.5673828125, -3.274658203125, -2.98193359375, -2.689208984375, -2.396484375, -2.103759765625, -1.81103515625, -1.518310546875, -1.2255859375, -0.932861328125, -0.64013671875, -0.347412109375, -0.0546875, 0.238037109375, 0.53076171875, 0.823486328125, 1.1162109375, 1.408935546875, 1.70166015625, 1.994384765625, 2.287109375, 2.579833984375, 2.87255859375, 3.165283203125, 3.4580078125, 3.750732421875, 4.04345703125, 4.336181640625, 4.62890625, 4.921630859375, 5.21435546875, 5.507080078125, 5.7998046875, 6.092529296875, 6.38525390625, 6.677978515625, 6.970703125, 7.263427734375, 7.55615234375, 7.848876953125, 8.1416015625, 8.434326171875, 8.72705078125, 9.019775390625, 9.3125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 10.0, 9.0, 9.0, 7.0, 10.0, 9.0, 12.0, 22.0, 21.0, 22.0, 25.0, 27.0, 41.0, 36.0, 38.0, 35.0, 46.0, 35.0, 40.0, 47.0, 39.0, 47.0, 39.0, 36.0, 33.0, 37.0, 38.0, 35.0, 26.0, 30.0, 20.0, 20.0, 15.0, 14.0, 13.0, 14.0, 12.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.4453125, -8.185791015625, -7.92626953125, -7.666748046875, -7.4072265625, -7.147705078125, -6.88818359375, -6.628662109375, -6.369140625, -6.109619140625, -5.85009765625, -5.590576171875, -5.3310546875, -5.071533203125, -4.81201171875, -4.552490234375, -4.29296875, -4.033447265625, -3.77392578125, -3.514404296875, -3.2548828125, -2.995361328125, -2.73583984375, -2.476318359375, -2.216796875, -1.957275390625, -1.69775390625, -1.438232421875, -1.1787109375, -0.919189453125, -0.65966796875, -0.400146484375, -0.140625, 0.118896484375, 0.37841796875, 0.637939453125, 0.8974609375, 1.156982421875, 1.41650390625, 1.676025390625, 1.935546875, 2.195068359375, 2.45458984375, 2.714111328125, 2.9736328125, 3.233154296875, 3.49267578125, 3.752197265625, 4.01171875, 4.271240234375, 4.53076171875, 4.790283203125, 5.0498046875, 5.309326171875, 5.56884765625, 5.828369140625, 6.087890625, 6.347412109375, 6.60693359375, 6.866455078125, 7.1259765625, 7.385498046875, 7.64501953125, 7.904541015625, 8.1640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 11.0, 9.0, 14.0, 16.0, 29.0, 45.0, 74.0, 67.0, 158.0, 216.0, 449.0, 874.0, 2170.0, 6025.0, 20871.0, 83151.0, 336391.0, 430040.0, 124660.0, 29780.0, 8454.0, 2808.0, 1081.0, 471.0, 282.0, 144.0, 89.0, 61.0, 32.0, 26.0, 25.0, 11.0, 9.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.6015625, -8.38177490234375, -8.1619873046875, -7.94219970703125, -7.722412109375, -7.50262451171875, -7.2828369140625, -7.06304931640625, -6.84326171875, -6.62347412109375, -6.4036865234375, -6.18389892578125, -5.964111328125, -5.74432373046875, -5.5245361328125, -5.30474853515625, -5.0849609375, -4.86517333984375, -4.6453857421875, -4.42559814453125, -4.205810546875, -3.98602294921875, -3.7662353515625, -3.54644775390625, -3.32666015625, -3.10687255859375, -2.8870849609375, -2.66729736328125, -2.447509765625, -2.22772216796875, -2.0079345703125, -1.78814697265625, -1.568359375, -1.34857177734375, -1.1287841796875, -0.90899658203125, -0.689208984375, -0.46942138671875, -0.2496337890625, -0.02984619140625, 0.18994140625, 0.40972900390625, 0.6295166015625, 0.84930419921875, 1.069091796875, 1.28887939453125, 1.5086669921875, 1.72845458984375, 1.9482421875, 2.16802978515625, 2.3878173828125, 2.60760498046875, 2.827392578125, 3.04718017578125, 3.2669677734375, 3.48675537109375, 3.70654296875, 3.92633056640625, 4.1461181640625, 4.36590576171875, 4.585693359375, 4.80548095703125, 5.0252685546875, 5.24505615234375, 5.46484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 8.0, 12.0, 8.0, 25.0, 29.0, 25.0, 33.0, 35.0, 42.0, 64.0, 68.0, 91.0, 88.0, 92.0, 66.0, 65.0, 51.0, 33.0, 25.0, 20.0, 17.0, 15.0, 7.0, 12.0, 7.0, 2.0, 12.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007719993591308594, -0.0007464438676834106, -0.0007208883762359619, -0.0006953328847885132, -0.0006697773933410645, -0.0006442219018936157, -0.000618666410446167, -0.0005931109189987183, -0.0005675554275512695, -0.0005419999361038208, -0.0005164444446563721, -0.0004908889532089233, -0.0004653334617614746, -0.0004397779703140259, -0.00041422247886657715, -0.0003886669874191284, -0.0003631114959716797, -0.00033755600452423096, -0.0003120005130767822, -0.0002864450216293335, -0.00026088953018188477, -0.00023533403873443604, -0.0002097785472869873, -0.00018422305583953857, -0.00015866756439208984, -0.0001331120729446411, -0.00010755658149719238, -8.200109004974365e-05, -5.644559860229492e-05, -3.089010715484619e-05, -5.334615707397461e-06, 2.022087574005127e-05, 4.57763671875e-05, 7.133185863494873e-05, 9.688735008239746e-05, 0.0001224428415298462, 0.00014799833297729492, 0.00017355382442474365, 0.00019910931587219238, 0.0002246648073196411, 0.00025022029876708984, 0.0002757757902145386, 0.0003013312816619873, 0.00032688677310943604, 0.00035244226455688477, 0.0003779977560043335, 0.0004035532474517822, 0.00042910873889923096, 0.0004546642303466797, 0.0004802197217941284, 0.0005057752132415771, 0.0005313307046890259, 0.0005568861961364746, 0.0005824416875839233, 0.0006079971790313721, 0.0006335526704788208, 0.0006591081619262695, 0.0006846636533737183, 0.000710219144821167, 0.0007357746362686157, 0.0007613301277160645, 0.0007868856191635132, 0.0008124411106109619, 0.0008379966020584106, 0.0008635520935058594]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 17.0, 28.0, 31.0, 58.0, 80.0, 119.0, 221.0, 439.0, 868.0, 1743.0, 3902.0, 10818.0, 36629.0, 139531.0, 434858.0, 304301.0, 80124.0, 22091.0, 7180.0, 2800.0, 1266.0, 635.0, 327.0, 167.0, 102.0, 65.0, 49.0, 27.0, 21.0, 15.0, 9.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.08856201171875, -6.8724365234375, -6.65631103515625, -6.440185546875, -6.22406005859375, -6.0079345703125, -5.79180908203125, -5.57568359375, -5.35955810546875, -5.1434326171875, -4.92730712890625, -4.711181640625, -4.49505615234375, -4.2789306640625, -4.06280517578125, -3.8466796875, -3.63055419921875, -3.4144287109375, -3.19830322265625, -2.982177734375, -2.76605224609375, -2.5499267578125, -2.33380126953125, -2.11767578125, -1.90155029296875, -1.6854248046875, -1.46929931640625, -1.253173828125, -1.03704833984375, -0.8209228515625, -0.60479736328125, -0.388671875, -0.17254638671875, 0.0435791015625, 0.25970458984375, 0.475830078125, 0.69195556640625, 0.9080810546875, 1.12420654296875, 1.34033203125, 1.55645751953125, 1.7725830078125, 1.98870849609375, 2.204833984375, 2.42095947265625, 2.6370849609375, 2.85321044921875, 3.0693359375, 3.28546142578125, 3.5015869140625, 3.71771240234375, 3.933837890625, 4.14996337890625, 4.3660888671875, 4.58221435546875, 4.79833984375, 5.01446533203125, 5.2305908203125, 5.44671630859375, 5.662841796875, 5.87896728515625, 6.0950927734375, 6.31121826171875, 6.52734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 8.0, 16.0, 11.0, 14.0, 14.0, 21.0, 33.0, 21.0, 31.0, 38.0, 48.0, 33.0, 52.0, 59.0, 35.0, 69.0, 61.0, 64.0, 48.0, 41.0, 32.0, 37.0, 40.0, 26.0, 23.0, 18.0, 22.0, 12.0, 8.0, 7.0, 8.0, 9.0, 2.0, 6.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.470703125, -3.369415283203125, -3.26812744140625, -3.166839599609375, -3.0655517578125, -2.964263916015625, -2.86297607421875, -2.761688232421875, -2.660400390625, -2.559112548828125, -2.45782470703125, -2.356536865234375, -2.2552490234375, -2.153961181640625, -2.05267333984375, -1.951385498046875, -1.85009765625, -1.748809814453125, -1.64752197265625, -1.546234130859375, -1.4449462890625, -1.343658447265625, -1.24237060546875, -1.141082763671875, -1.039794921875, -0.938507080078125, -0.83721923828125, -0.735931396484375, -0.6346435546875, -0.533355712890625, -0.43206787109375, -0.330780029296875, -0.2294921875, -0.128204345703125, -0.02691650390625, 0.074371337890625, 0.1756591796875, 0.276947021484375, 0.37823486328125, 0.479522705078125, 0.580810546875, 0.682098388671875, 0.78338623046875, 0.884674072265625, 0.9859619140625, 1.087249755859375, 1.18853759765625, 1.289825439453125, 1.39111328125, 1.492401123046875, 1.59368896484375, 1.694976806640625, 1.7962646484375, 1.897552490234375, 1.99884033203125, 2.100128173828125, 2.201416015625, 2.302703857421875, 2.40399169921875, 2.505279541015625, 2.6065673828125, 2.707855224609375, 2.80914306640625, 2.910430908203125, 3.01171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 31.0, 47.0, 56.0, 63.0, 106.0, 114.0, 109.0, 107.0, 93.0, 77.0, 51.0, 31.0, 17.0, 17.0, 13.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.70713806152344, -79.26144409179688, -76.81575012207031, -74.37005615234375, -71.92436218261719, -69.47866821289062, -67.03297424316406, -64.5872802734375, -62.14158248901367, -59.69588851928711, -57.25019454956055, -54.804500579833984, -52.358802795410156, -49.913108825683594, -47.46741485595703, -45.02172088623047, -42.576026916503906, -40.130332946777344, -37.68463897705078, -35.23894500732422, -32.793251037597656, -30.34755516052246, -27.901859283447266, -25.456165313720703, -23.01047134399414, -20.564777374267578, -18.119083404541016, -15.67338752746582, -13.227693557739258, -10.781999588012695, -8.336304664611816, -5.8906097412109375, -3.444915771484375, -0.9992213249206543, 1.4464731216430664, 3.892167568206787, 6.337862014770508, 8.78355598449707, 11.22925090789795, 13.674945831298828, 16.12063980102539, 18.566333770751953, 21.012027740478516, 23.45772361755371, 25.903417587280273, 28.349111557006836, 30.79480743408203, 33.240501403808594, 35.686195373535156, 38.13188934326172, 40.57758331298828, 43.023277282714844, 45.468971252441406, 47.91466522216797, 50.3603630065918, 52.80605697631836, 55.25175094604492, 57.697444915771484, 60.14313888549805, 62.58883285522461, 65.03453063964844, 67.480224609375, 69.92591857910156, 72.37161254882812, 74.81730651855469]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 3.0, 7.0, 10.0, 13.0, 15.0, 17.0, 17.0, 24.0, 29.0, 26.0, 39.0, 39.0, 46.0, 45.0, 42.0, 46.0, 46.0, 52.0, 49.0, 44.0, 41.0, 36.0, 41.0, 34.0, 47.0, 27.0, 22.0, 16.0, 16.0, 21.0, 18.0, 12.0, 18.0, 11.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-59.153602600097656, -57.57966613769531, -56.00572967529297, -54.431793212890625, -52.85785675048828, -51.2839241027832, -49.70998764038086, -48.136051177978516, -46.56211471557617, -44.98817825317383, -43.414241790771484, -41.84030532836914, -40.26637268066406, -38.69243621826172, -37.118499755859375, -35.54456329345703, -33.97062683105469, -32.396690368652344, -30.82275390625, -29.24881935119629, -27.674882888793945, -26.1009464263916, -24.52701187133789, -22.953075408935547, -21.379138946533203, -19.80520248413086, -18.231266021728516, -16.657331466674805, -15.083395004272461, -13.509458541870117, -11.93552303314209, -10.361587524414062, -8.787651062011719, -7.213715076446533, -5.639779090881348, -4.065843105316162, -2.4919071197509766, -0.917971134185791, 0.6559648513793945, 2.229900360107422, 3.8038368225097656, 5.377772808074951, 6.951708793640137, 8.525644302368164, 10.099580764770508, 11.673517227172852, 13.247452735900879, 14.821388244628906, 16.39532470703125, 17.969261169433594, 19.543197631835938, 21.11713218688965, 22.691068649291992, 24.265005111694336, 25.838939666748047, 27.41287612915039, 28.986812591552734, 30.560749053955078, 32.13468551635742, 33.708621978759766, 35.282554626464844, 36.85649108886719, 38.43042755126953, 40.004364013671875, 41.57830047607422]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 9.0, 20.0, 16.0, 31.0, 52.0, 72.0, 137.0, 256.0, 557.0, 1218.0, 2986.0, 10728.0, 63543.0, 3406484.0, 657788.0, 38821.0, 7337.0, 2242.0, 918.0, 379.0, 215.0, 164.0, 84.0, 57.0, 42.0, 28.0, 16.0, 24.0, 15.0, 11.0, 2.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.984375, -28.728759765625, -27.47314453125, -26.217529296875, -24.9619140625, -23.706298828125, -22.45068359375, -21.195068359375, -19.939453125, -18.683837890625, -17.42822265625, -16.172607421875, -14.9169921875, -13.661376953125, -12.40576171875, -11.150146484375, -9.89453125, -8.638916015625, -7.38330078125, -6.127685546875, -4.8720703125, -3.616455078125, -2.36083984375, -1.105224609375, 0.150390625, 1.406005859375, 2.66162109375, 3.917236328125, 5.1728515625, 6.428466796875, 7.68408203125, 8.939697265625, 10.1953125, 11.450927734375, 12.70654296875, 13.962158203125, 15.2177734375, 16.473388671875, 17.72900390625, 18.984619140625, 20.240234375, 21.495849609375, 22.75146484375, 24.007080078125, 25.2626953125, 26.518310546875, 27.77392578125, 29.029541015625, 30.28515625, 31.540771484375, 32.79638671875, 34.052001953125, 35.3076171875, 36.563232421875, 37.81884765625, 39.074462890625, 40.330078125, 41.585693359375, 42.84130859375, 44.096923828125, 45.3525390625, 46.608154296875, 47.86376953125, 49.119384765625, 50.375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 5.0, 17.0, 20.0, 31.0, 30.0, 37.0, 54.0, 60.0, 69.0, 78.0, 76.0, 86.0, 80.0, 75.0, 55.0, 56.0, 35.0, 33.0, 25.0, 26.0, 13.0, 8.0, 12.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.958984375, -2.857086181640625, -2.75518798828125, -2.653289794921875, -2.5513916015625, -2.449493408203125, -2.34759521484375, -2.245697021484375, -2.143798828125, -2.041900634765625, -1.94000244140625, -1.838104248046875, -1.7362060546875, -1.634307861328125, -1.53240966796875, -1.430511474609375, -1.32861328125, -1.226715087890625, -1.12481689453125, -1.022918701171875, -0.9210205078125, -0.819122314453125, -0.71722412109375, -0.615325927734375, -0.513427734375, -0.411529541015625, -0.30963134765625, -0.207733154296875, -0.1058349609375, -0.003936767578125, 0.09796142578125, 0.199859619140625, 0.3017578125, 0.403656005859375, 0.50555419921875, 0.607452392578125, 0.7093505859375, 0.811248779296875, 0.91314697265625, 1.015045166015625, 1.116943359375, 1.218841552734375, 1.32073974609375, 1.422637939453125, 1.5245361328125, 1.626434326171875, 1.72833251953125, 1.830230712890625, 1.93212890625, 2.034027099609375, 2.13592529296875, 2.237823486328125, 2.3397216796875, 2.441619873046875, 2.54351806640625, 2.645416259765625, 2.747314453125, 2.849212646484375, 2.95111083984375, 3.053009033203125, 3.1549072265625, 3.256805419921875, 3.35870361328125, 3.460601806640625, 3.5625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 12.0, 16.0, 24.0, 42.0, 50.0, 93.0, 127.0, 213.0, 327.0, 661.0, 1194.0, 2791.0, 8953.0, 58016.0, 3097091.0, 976754.0, 35987.0, 6850.0, 2478.0, 1124.0, 601.0, 343.0, 206.0, 120.0, 66.0, 44.0, 29.0, 19.0, 16.0, 11.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.90625, -36.71826171875, -35.5302734375, -34.34228515625, -33.154296875, -31.96630859375, -30.7783203125, -29.59033203125, -28.40234375, -27.21435546875, -26.0263671875, -24.83837890625, -23.650390625, -22.46240234375, -21.2744140625, -20.08642578125, -18.8984375, -17.71044921875, -16.5224609375, -15.33447265625, -14.146484375, -12.95849609375, -11.7705078125, -10.58251953125, -9.39453125, -8.20654296875, -7.0185546875, -5.83056640625, -4.642578125, -3.45458984375, -2.2666015625, -1.07861328125, 0.109375, 1.29736328125, 2.4853515625, 3.67333984375, 4.861328125, 6.04931640625, 7.2373046875, 8.42529296875, 9.61328125, 10.80126953125, 11.9892578125, 13.17724609375, 14.365234375, 15.55322265625, 16.7412109375, 17.92919921875, 19.1171875, 20.30517578125, 21.4931640625, 22.68115234375, 23.869140625, 25.05712890625, 26.2451171875, 27.43310546875, 28.62109375, 29.80908203125, 30.9970703125, 32.18505859375, 33.373046875, 34.56103515625, 35.7490234375, 36.93701171875, 38.125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 13.0, 23.0, 49.0, 81.0, 191.0, 508.0, 2026.0, 737.0, 242.0, 92.0, 47.0, 16.0, 15.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.3802490234375, -11.932373046875, -11.4844970703125, -11.03662109375, -10.5887451171875, -10.140869140625, -9.6929931640625, -9.2451171875, -8.7972412109375, -8.349365234375, -7.9014892578125, -7.45361328125, -7.0057373046875, -6.557861328125, -6.1099853515625, -5.662109375, -5.2142333984375, -4.766357421875, -4.3184814453125, -3.87060546875, -3.4227294921875, -2.974853515625, -2.5269775390625, -2.0791015625, -1.6312255859375, -1.183349609375, -0.7354736328125, -0.28759765625, 0.1602783203125, 0.608154296875, 1.0560302734375, 1.50390625, 1.9517822265625, 2.399658203125, 2.8475341796875, 3.29541015625, 3.7432861328125, 4.191162109375, 4.6390380859375, 5.0869140625, 5.5347900390625, 5.982666015625, 6.4305419921875, 6.87841796875, 7.3262939453125, 7.774169921875, 8.2220458984375, 8.669921875, 9.1177978515625, 9.565673828125, 10.0135498046875, 10.46142578125, 10.9093017578125, 11.357177734375, 11.8050537109375, 12.2529296875, 12.7008056640625, 13.148681640625, 13.5965576171875, 14.04443359375, 14.4923095703125, 14.940185546875, 15.3880615234375, 15.8359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 15.0, 37.0, 63.0, 97.0, 172.0, 220.0, 158.0, 117.0, 59.0, 28.0, 15.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.96316528320312, -104.12205505371094, -101.28095245361328, -98.43984985351562, -95.59873962402344, -92.75762939453125, -89.9165267944336, -87.07542419433594, -84.23431396484375, -81.39320373535156, -78.5521011352539, -75.71099853515625, -72.86988830566406, -70.02877807617188, -67.18767547607422, -64.34657287597656, -61.505462646484375, -58.66435623168945, -55.82324981689453, -52.98214340209961, -50.14103698730469, -47.299930572509766, -44.458824157714844, -41.61771774291992, -38.776611328125, -35.93550491333008, -33.094398498535156, -30.253292083740234, -27.412185668945312, -24.57107925415039, -21.72997283935547, -18.888866424560547, -16.047767639160156, -13.206661224365234, -10.365554809570312, -7.524448394775391, -4.683341979980469, -1.8422355651855469, 0.998870849609375, 3.839977264404297, 6.681083679199219, 9.52219009399414, 12.363296508789062, 15.204402923583984, 18.045509338378906, 20.886615753173828, 23.72772216796875, 26.568828582763672, 29.409934997558594, 32.251041412353516, 35.09214782714844, 37.93325424194336, 40.77436065673828, 43.6154670715332, 46.456573486328125, 49.29767990112305, 52.13878631591797, 54.97989273071289, 57.82099914550781, 60.662105560302734, 63.503211975097656, 66.34431457519531, 69.1854248046875, 72.02653503417969, 74.86763763427734]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 10.0, 18.0, 36.0, 31.0, 48.0, 73.0, 66.0, 69.0, 88.0, 97.0, 71.0, 86.0, 83.0, 67.0, 47.0, 30.0, 38.0, 15.0, 13.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.20011901855469, -30.490598678588867, -28.781078338623047, -27.07155990600586, -25.36203956604004, -23.65251922607422, -21.9429988861084, -20.233478546142578, -18.52396011352539, -16.81443977355957, -15.104920387268066, -13.395400047302246, -11.685880661010742, -9.976360321044922, -8.266839981079102, -6.557320594787598, -4.847799301147461, -3.138279438018799, -1.4287593364715576, 0.2807607650756836, 1.9902806282043457, 3.699800491333008, 5.409320831298828, 7.118840217590332, 8.828360557556152, 10.537880897521973, 12.247400283813477, 13.956920623779297, 15.666440963745117, 17.375961303710938, 19.085479736328125, 20.795000076293945, 22.504520416259766, 24.214040756225586, 25.923561096191406, 27.633079528808594, 29.342599868774414, 31.052120208740234, 32.76164245605469, 34.471160888671875, 36.18067932128906, 37.89019775390625, 39.5997200012207, 41.30923843383789, 43.018760681152344, 44.72827911376953, 46.43779754638672, 48.14731979370117, 49.856842041015625, 51.56636047363281, 53.275882720947266, 54.98540115356445, 56.694923400878906, 58.404441833496094, 60.11396026611328, 61.823482513427734, 63.53300094604492, 65.24252319335938, 66.95204162597656, 68.66156005859375, 70.37107849121094, 72.08059692382812, 73.79012298583984, 75.49964141845703, 77.20915985107422]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 15.0, 25.0, 21.0, 41.0, 59.0, 114.0, 212.0, 425.0, 973.0, 3205.0, 30011.0, 741554.0, 256363.0, 12023.0, 2043.0, 745.0, 311.0, 168.0, 87.0, 58.0, 34.0, 23.0, 13.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.6875, -65.01318359375, -63.3388671875, -61.66455078125, -59.990234375, -58.31591796875, -56.6416015625, -54.96728515625, -53.29296875, -51.61865234375, -49.9443359375, -48.27001953125, -46.595703125, -44.92138671875, -43.2470703125, -41.57275390625, -39.8984375, -38.22412109375, -36.5498046875, -34.87548828125, -33.201171875, -31.52685546875, -29.8525390625, -28.17822265625, -26.50390625, -24.82958984375, -23.1552734375, -21.48095703125, -19.806640625, -18.13232421875, -16.4580078125, -14.78369140625, -13.109375, -11.43505859375, -9.7607421875, -8.08642578125, -6.412109375, -4.73779296875, -3.0634765625, -1.38916015625, 0.28515625, 1.95947265625, 3.6337890625, 5.30810546875, 6.982421875, 8.65673828125, 10.3310546875, 12.00537109375, 13.6796875, 15.35400390625, 17.0283203125, 18.70263671875, 20.376953125, 22.05126953125, 23.7255859375, 25.39990234375, 27.07421875, 28.74853515625, 30.4228515625, 32.09716796875, 33.771484375, 35.44580078125, 37.1201171875, 38.79443359375, 40.46875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 13.0, 22.0, 30.0, 53.0, 67.0, 78.0, 114.0, 124.0, 134.0, 96.0, 75.0, 64.0, 46.0, 32.0, 22.0, 12.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.0904541015625, -2.934814453125, -2.7791748046875, -2.62353515625, -2.4678955078125, -2.312255859375, -2.1566162109375, -2.0009765625, -1.8453369140625, -1.689697265625, -1.5340576171875, -1.37841796875, -1.2227783203125, -1.067138671875, -0.9114990234375, -0.755859375, -0.6002197265625, -0.444580078125, -0.2889404296875, -0.13330078125, 0.0223388671875, 0.177978515625, 0.3336181640625, 0.4892578125, 0.6448974609375, 0.800537109375, 0.9561767578125, 1.11181640625, 1.2674560546875, 1.423095703125, 1.5787353515625, 1.734375, 1.8900146484375, 2.045654296875, 2.2012939453125, 2.35693359375, 2.5125732421875, 2.668212890625, 2.8238525390625, 2.9794921875, 3.1351318359375, 3.290771484375, 3.4464111328125, 3.60205078125, 3.7576904296875, 3.913330078125, 4.0689697265625, 4.224609375, 4.3802490234375, 4.535888671875, 4.6915283203125, 4.84716796875, 5.0028076171875, 5.158447265625, 5.3140869140625, 5.4697265625, 5.6253662109375, 5.781005859375, 5.9366455078125, 6.09228515625, 6.2479248046875, 6.403564453125, 6.5592041015625, 6.71484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 8.0, 4.0, 7.0, 12.0, 21.0, 14.0, 38.0, 52.0, 76.0, 125.0, 190.0, 302.0, 471.0, 879.0, 1545.0, 2941.0, 6225.0, 13440.0, 30479.0, 70720.0, 167880.0, 357604.0, 226558.0, 94085.0, 40650.0, 18049.0, 7946.0, 3707.0, 1914.0, 1022.0, 585.0, 326.0, 234.0, 171.0, 82.0, 55.0, 41.0, 35.0, 18.0, 13.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.8189697265625, -7.536376953125, -7.2537841796875, -6.97119140625, -6.6885986328125, -6.406005859375, -6.1234130859375, -5.8408203125, -5.5582275390625, -5.275634765625, -4.9930419921875, -4.71044921875, -4.4278564453125, -4.145263671875, -3.8626708984375, -3.580078125, -3.2974853515625, -3.014892578125, -2.7322998046875, -2.44970703125, -2.1671142578125, -1.884521484375, -1.6019287109375, -1.3193359375, -1.0367431640625, -0.754150390625, -0.4715576171875, -0.18896484375, 0.0936279296875, 0.376220703125, 0.6588134765625, 0.94140625, 1.2239990234375, 1.506591796875, 1.7891845703125, 2.07177734375, 2.3543701171875, 2.636962890625, 2.9195556640625, 3.2021484375, 3.4847412109375, 3.767333984375, 4.0499267578125, 4.33251953125, 4.6151123046875, 4.897705078125, 5.1802978515625, 5.462890625, 5.7454833984375, 6.028076171875, 6.3106689453125, 6.59326171875, 6.8758544921875, 7.158447265625, 7.4410400390625, 7.7236328125, 8.0062255859375, 8.288818359375, 8.5714111328125, 8.85400390625, 9.1365966796875, 9.419189453125, 9.7017822265625, 9.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 9.0, 10.0, 8.0, 12.0, 24.0, 26.0, 24.0, 22.0, 40.0, 44.0, 47.0, 48.0, 44.0, 45.0, 43.0, 55.0, 49.0, 48.0, 57.0, 49.0, 47.0, 45.0, 36.0, 35.0, 20.0, 26.0, 17.0, 17.0, 15.0, 7.0, 8.0, 4.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.34765625, -10.03125, -9.71484375, -9.3984375, -9.08203125, -8.765625, -8.44921875, -8.1328125, -7.81640625, -7.5, -7.18359375, -6.8671875, -6.55078125, -6.234375, -5.91796875, -5.6015625, -5.28515625, -4.96875, -4.65234375, -4.3359375, -4.01953125, -3.703125, -3.38671875, -3.0703125, -2.75390625, -2.4375, -2.12109375, -1.8046875, -1.48828125, -1.171875, -0.85546875, -0.5390625, -0.22265625, 0.09375, 0.41015625, 0.7265625, 1.04296875, 1.359375, 1.67578125, 1.9921875, 2.30859375, 2.625, 2.94140625, 3.2578125, 3.57421875, 3.890625, 4.20703125, 4.5234375, 4.83984375, 5.15625, 5.47265625, 5.7890625, 6.10546875, 6.421875, 6.73828125, 7.0546875, 7.37109375, 7.6875, 8.00390625, 8.3203125, 8.63671875, 8.953125, 9.26953125, 9.5859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 12.0, 9.0, 21.0, 24.0, 31.0, 48.0, 75.0, 111.0, 194.0, 326.0, 565.0, 945.0, 1996.0, 4202.0, 9942.0, 26958.0, 84111.0, 283441.0, 426617.0, 139135.0, 43043.0, 15067.0, 5907.0, 2652.0, 1343.0, 693.0, 395.0, 232.0, 152.0, 90.0, 62.0, 49.0, 25.0, 15.0, 10.0, 6.0, 10.0, 6.0, 7.0, 0.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.30126953125, -5.1064453125, -4.91162109375, -4.716796875, -4.52197265625, -4.3271484375, -4.13232421875, -3.9375, -3.74267578125, -3.5478515625, -3.35302734375, -3.158203125, -2.96337890625, -2.7685546875, -2.57373046875, -2.37890625, -2.18408203125, -1.9892578125, -1.79443359375, -1.599609375, -1.40478515625, -1.2099609375, -1.01513671875, -0.8203125, -0.62548828125, -0.4306640625, -0.23583984375, -0.041015625, 0.15380859375, 0.3486328125, 0.54345703125, 0.73828125, 0.93310546875, 1.1279296875, 1.32275390625, 1.517578125, 1.71240234375, 1.9072265625, 2.10205078125, 2.296875, 2.49169921875, 2.6865234375, 2.88134765625, 3.076171875, 3.27099609375, 3.4658203125, 3.66064453125, 3.85546875, 4.05029296875, 4.2451171875, 4.43994140625, 4.634765625, 4.82958984375, 5.0244140625, 5.21923828125, 5.4140625, 5.60888671875, 5.8037109375, 5.99853515625, 6.193359375, 6.38818359375, 6.5830078125, 6.77783203125, 6.97265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 9.0, 8.0, 23.0, 16.0, 26.0, 41.0, 52.0, 73.0, 108.0, 150.0, 144.0, 105.0, 67.0, 40.0, 38.0, 28.0, 18.0, 11.0, 12.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001331329345703125, -0.0012942701578140259, -0.0012572109699249268, -0.0012201517820358276, -0.0011830925941467285, -0.0011460334062576294, -0.0011089742183685303, -0.0010719150304794312, -0.001034855842590332, -0.000997796654701233, -0.0009607374668121338, -0.0009236782789230347, -0.0008866190910339355, -0.0008495599031448364, -0.0008125007152557373, -0.0007754415273666382, -0.0007383823394775391, -0.0007013231515884399, -0.0006642639636993408, -0.0006272047758102417, -0.0005901455879211426, -0.0005530864000320435, -0.0005160272121429443, -0.0004789680242538452, -0.0004419088363647461, -0.00040484964847564697, -0.00036779046058654785, -0.00033073127269744873, -0.0002936720848083496, -0.0002566128969192505, -0.00021955370903015137, -0.00018249452114105225, -0.00014543533325195312, -0.000108376145362854, -7.131695747375488e-05, -3.425776958465576e-05, 2.8014183044433594e-06, 3.986060619354248e-05, 7.69197940826416e-05, 0.00011397898197174072, 0.00015103816986083984, 0.00018809735774993896, 0.00022515654563903809, 0.0002622157335281372, 0.00029927492141723633, 0.00033633410930633545, 0.00037339329719543457, 0.0004104524850845337, 0.0004475116729736328, 0.00048457086086273193, 0.0005216300487518311, 0.0005586892366409302, 0.0005957484245300293, 0.0006328076124191284, 0.0006698668003082275, 0.0007069259881973267, 0.0007439851760864258, 0.0007810443639755249, 0.000818103551864624, 0.0008551627397537231, 0.0008922219276428223, 0.0009292811155319214, 0.0009663403034210205, 0.0010033994913101196, 0.0010404586791992188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 5.0, 12.0, 7.0, 19.0, 26.0, 40.0, 53.0, 73.0, 112.0, 167.0, 246.0, 373.0, 652.0, 1023.0, 1702.0, 2960.0, 5713.0, 11757.0, 27466.0, 72430.0, 210120.0, 408758.0, 190725.0, 65431.0, 25233.0, 10876.0, 5503.0, 2854.0, 1589.0, 952.0, 588.0, 350.0, 249.0, 157.0, 102.0, 64.0, 51.0, 36.0, 23.0, 12.0, 15.0, 9.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62109375, -5.4423828125, -5.263671875, -5.0849609375, -4.90625, -4.7275390625, -4.548828125, -4.3701171875, -4.19140625, -4.0126953125, -3.833984375, -3.6552734375, -3.4765625, -3.2978515625, -3.119140625, -2.9404296875, -2.76171875, -2.5830078125, -2.404296875, -2.2255859375, -2.046875, -1.8681640625, -1.689453125, -1.5107421875, -1.33203125, -1.1533203125, -0.974609375, -0.7958984375, -0.6171875, -0.4384765625, -0.259765625, -0.0810546875, 0.09765625, 0.2763671875, 0.455078125, 0.6337890625, 0.8125, 0.9912109375, 1.169921875, 1.3486328125, 1.52734375, 1.7060546875, 1.884765625, 2.0634765625, 2.2421875, 2.4208984375, 2.599609375, 2.7783203125, 2.95703125, 3.1357421875, 3.314453125, 3.4931640625, 3.671875, 3.8505859375, 4.029296875, 4.2080078125, 4.38671875, 4.5654296875, 4.744140625, 4.9228515625, 5.1015625, 5.2802734375, 5.458984375, 5.6376953125, 5.81640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 9.0, 9.0, 16.0, 16.0, 21.0, 32.0, 34.0, 47.0, 77.0, 91.0, 83.0, 77.0, 100.0, 62.0, 80.0, 59.0, 44.0, 24.0, 19.0, 17.0, 13.0, 14.0, 12.0, 8.0, 1.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.30517578125, -5.1416015625, -4.97802734375, -4.814453125, -4.65087890625, -4.4873046875, -4.32373046875, -4.16015625, -3.99658203125, -3.8330078125, -3.66943359375, -3.505859375, -3.34228515625, -3.1787109375, -3.01513671875, -2.8515625, -2.68798828125, -2.5244140625, -2.36083984375, -2.197265625, -2.03369140625, -1.8701171875, -1.70654296875, -1.54296875, -1.37939453125, -1.2158203125, -1.05224609375, -0.888671875, -0.72509765625, -0.5615234375, -0.39794921875, -0.234375, -0.07080078125, 0.0927734375, 0.25634765625, 0.419921875, 0.58349609375, 0.7470703125, 0.91064453125, 1.07421875, 1.23779296875, 1.4013671875, 1.56494140625, 1.728515625, 1.89208984375, 2.0556640625, 2.21923828125, 2.3828125, 2.54638671875, 2.7099609375, 2.87353515625, 3.037109375, 3.20068359375, 3.3642578125, 3.52783203125, 3.69140625, 3.85498046875, 4.0185546875, 4.18212890625, 4.345703125, 4.50927734375, 4.6728515625, 4.83642578125, 5.0]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 17.0, 37.0, 64.0, 163.0, 239.0, 226.0, 140.0, 66.0, 26.0, 13.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.753631591796875, -51.51547622680664, -46.27731704711914, -41.039161682128906, -35.801002502441406, -30.562847137451172, -25.324691772460938, -20.086532592773438, -14.848377227783203, -9.610219955444336, -4.372063636779785, 0.8660926818847656, 6.104249954223633, 11.3424072265625, 16.580562591552734, 21.818721771240234, 27.05687713623047, 32.2950325012207, 37.5331916809082, 42.77134704589844, 48.00950622558594, 53.24766159057617, 58.485816955566406, 63.723976135253906, 68.96212768554688, 74.20028686523438, 79.43843841552734, 84.67659759521484, 89.91475677490234, 95.15290832519531, 100.39106750488281, 105.62922668457031, 110.86738586425781, 116.10554504394531, 121.34369659423828, 126.58185577392578, 131.82000732421875, 137.05816650390625, 142.29632568359375, 147.53448486328125, 152.77264404296875, 158.01080322265625, 163.24896240234375, 168.48712158203125, 173.7252655029297, 178.9634246826172, 184.2015838623047, 189.4397430419922, 194.67788696289062, 199.91604614257812, 205.15420532226562, 210.39236450195312, 215.63050842285156, 220.86866760253906, 226.10682678222656, 231.34498596191406, 236.58314514160156, 241.82130432128906, 247.05946350097656, 252.297607421875, 257.5357666015625, 262.77392578125, 268.0120849609375, 273.250244140625, 278.4884033203125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 10.0, 7.0, 3.0, 11.0, 13.0, 9.0, 20.0, 16.0, 19.0, 14.0, 20.0, 35.0, 27.0, 26.0, 36.0, 39.0, 35.0, 43.0, 40.0, 26.0, 49.0, 49.0, 58.0, 41.0, 43.0, 29.0, 33.0, 33.0, 25.0, 26.0, 26.0, 27.0, 12.0, 17.0, 13.0, 19.0, 15.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.838951110839844, -43.33690643310547, -41.83486557006836, -40.332820892333984, -38.83077621459961, -37.3287353515625, -35.826690673828125, -34.32464599609375, -32.82260513305664, -31.3205623626709, -29.818517684936523, -28.31647491455078, -26.81443214416504, -25.312389373779297, -23.810344696044922, -22.30830192565918, -20.806257247924805, -19.304214477539062, -17.802169799804688, -16.300127029418945, -14.798084259033203, -13.296040534973145, -11.793996810913086, -10.291954040527344, -8.789910316467285, -7.287867069244385, -5.785823822021484, -4.283780097961426, -2.7817368507385254, -1.279693603515625, 0.2223501205444336, 1.7243928909301758, 3.2264366149902344, 4.728479862213135, 6.230523109436035, 7.732566833496094, 9.234609603881836, 10.736653327941895, 12.238697052001953, 13.740739822387695, 15.242783546447754, 16.744827270507812, 18.246870040893555, 19.748912811279297, 21.250957489013672, 22.753000259399414, 24.255043029785156, 25.75708770751953, 27.259130477905273, 28.761173248291016, 30.26321792602539, 31.765260696411133, 33.267303466796875, 34.76934814453125, 36.271392822265625, 37.773433685302734, 39.27547836303711, 40.777523040771484, 42.279563903808594, 43.78160858154297, 45.283653259277344, 46.78569412231445, 48.28773880004883, 49.78977966308594, 51.29182434082031]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 13.0, 13.0, 29.0, 49.0, 117.0, 237.0, 568.0, 1943.0, 12872.0, 3396902.0, 768697.0, 10079.0, 1632.0, 574.0, 240.0, 130.0, 57.0, 46.0, 28.0, 14.0, 7.0, 6.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.25, -56.005859375, -53.76171875, -51.517578125, -49.2734375, -47.029296875, -44.78515625, -42.541015625, -40.296875, -38.052734375, -35.80859375, -33.564453125, -31.3203125, -29.076171875, -26.83203125, -24.587890625, -22.34375, -20.099609375, -17.85546875, -15.611328125, -13.3671875, -11.123046875, -8.87890625, -6.634765625, -4.390625, -2.146484375, 0.09765625, 2.341796875, 4.5859375, 6.830078125, 9.07421875, 11.318359375, 13.5625, 15.806640625, 18.05078125, 20.294921875, 22.5390625, 24.783203125, 27.02734375, 29.271484375, 31.515625, 33.759765625, 36.00390625, 38.248046875, 40.4921875, 42.736328125, 44.98046875, 47.224609375, 49.46875, 51.712890625, 53.95703125, 56.201171875, 58.4453125, 60.689453125, 62.93359375, 65.177734375, 67.421875, 69.666015625, 71.91015625, 74.154296875, 76.3984375, 78.642578125, 80.88671875, 83.130859375, 85.375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 24.0, 41.0, 46.0, 47.0, 80.0, 110.0, 131.0, 124.0, 98.0, 79.0, 72.0, 44.0, 33.0, 28.0, 13.0, 6.0, 9.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.163330078125, -3.00634765625, -2.849365234375, -2.6923828125, -2.535400390625, -2.37841796875, -2.221435546875, -2.064453125, -1.907470703125, -1.75048828125, -1.593505859375, -1.4365234375, -1.279541015625, -1.12255859375, -0.965576171875, -0.80859375, -0.651611328125, -0.49462890625, -0.337646484375, -0.1806640625, -0.023681640625, 0.13330078125, 0.290283203125, 0.447265625, 0.604248046875, 0.76123046875, 0.918212890625, 1.0751953125, 1.232177734375, 1.38916015625, 1.546142578125, 1.703125, 1.860107421875, 2.01708984375, 2.174072265625, 2.3310546875, 2.488037109375, 2.64501953125, 2.802001953125, 2.958984375, 3.115966796875, 3.27294921875, 3.429931640625, 3.5869140625, 3.743896484375, 3.90087890625, 4.057861328125, 4.21484375, 4.371826171875, 4.52880859375, 4.685791015625, 4.8427734375, 4.999755859375, 5.15673828125, 5.313720703125, 5.470703125, 5.627685546875, 5.78466796875, 5.941650390625, 6.0986328125, 6.255615234375, 6.41259765625, 6.569580078125, 6.7265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 8.0, 10.0, 15.0, 14.0, 35.0, 38.0, 33.0, 70.0, 81.0, 128.0, 189.0, 337.0, 570.0, 1106.0, 2347.0, 5389.0, 13391.0, 38067.0, 125194.0, 625981.0, 2956726.0, 305452.0, 76445.0, 25501.0, 9269.0, 3926.0, 1832.0, 862.0, 487.0, 246.0, 164.0, 97.0, 71.0, 54.0, 31.0, 27.0, 21.0, 12.0, 16.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-13.5234375, -13.0772705078125, -12.631103515625, -12.1849365234375, -11.73876953125, -11.2926025390625, -10.846435546875, -10.4002685546875, -9.9541015625, -9.5079345703125, -9.061767578125, -8.6156005859375, -8.16943359375, -7.7232666015625, -7.277099609375, -6.8309326171875, -6.384765625, -5.9385986328125, -5.492431640625, -5.0462646484375, -4.60009765625, -4.1539306640625, -3.707763671875, -3.2615966796875, -2.8154296875, -2.3692626953125, -1.923095703125, -1.4769287109375, -1.03076171875, -0.5845947265625, -0.138427734375, 0.3077392578125, 0.75390625, 1.2000732421875, 1.646240234375, 2.0924072265625, 2.53857421875, 2.9847412109375, 3.430908203125, 3.8770751953125, 4.3232421875, 4.7694091796875, 5.215576171875, 5.6617431640625, 6.10791015625, 6.5540771484375, 7.000244140625, 7.4464111328125, 7.892578125, 8.3387451171875, 8.784912109375, 9.2310791015625, 9.67724609375, 10.1234130859375, 10.569580078125, 11.0157470703125, 11.4619140625, 11.9080810546875, 12.354248046875, 12.8004150390625, 13.24658203125, 13.6927490234375, 14.138916015625, 14.5850830078125, 15.03125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 5.0, 10.0, 22.0, 28.0, 37.0, 56.0, 93.0, 156.0, 272.0, 622.0, 1663.0, 528.0, 225.0, 129.0, 86.0, 47.0, 29.0, 21.0, 9.0, 10.0, 8.0, 6.0, 7.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.078125, -8.847900390625, -8.61767578125, -8.387451171875, -8.1572265625, -7.927001953125, -7.69677734375, -7.466552734375, -7.236328125, -7.006103515625, -6.77587890625, -6.545654296875, -6.3154296875, -6.085205078125, -5.85498046875, -5.624755859375, -5.39453125, -5.164306640625, -4.93408203125, -4.703857421875, -4.4736328125, -4.243408203125, -4.01318359375, -3.782958984375, -3.552734375, -3.322509765625, -3.09228515625, -2.862060546875, -2.6318359375, -2.401611328125, -2.17138671875, -1.941162109375, -1.7109375, -1.480712890625, -1.25048828125, -1.020263671875, -0.7900390625, -0.559814453125, -0.32958984375, -0.099365234375, 0.130859375, 0.361083984375, 0.59130859375, 0.821533203125, 1.0517578125, 1.281982421875, 1.51220703125, 1.742431640625, 1.97265625, 2.202880859375, 2.43310546875, 2.663330078125, 2.8935546875, 3.123779296875, 3.35400390625, 3.584228515625, 3.814453125, 4.044677734375, 4.27490234375, 4.505126953125, 4.7353515625, 4.965576171875, 5.19580078125, 5.426025390625, 5.65625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 14.0, 29.0, 45.0, 63.0, 85.0, 72.0, 96.0, 85.0, 104.0, 104.0, 76.0, 68.0, 43.0, 33.0, 32.0, 7.0, 5.0, 3.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.733978271484375, -38.596065521240234, -37.458152770996094, -36.32024002075195, -35.18232727050781, -34.04441452026367, -32.90650177001953, -31.76858901977539, -30.63067626953125, -29.49276351928711, -28.35485076904297, -27.216938018798828, -26.079025268554688, -24.941112518310547, -23.803199768066406, -22.665287017822266, -21.527372360229492, -20.38945960998535, -19.25154685974121, -18.11363410949707, -16.97572135925293, -15.837808609008789, -14.699894905090332, -13.561982154846191, -12.42406940460205, -11.28615665435791, -10.14824390411377, -9.010330200195312, -7.87241792678833, -6.7345051765441895, -5.596591949462891, -4.45867919921875, -3.3207664489746094, -2.1828536987304688, -1.044940710067749, 0.0929722785949707, 1.2308850288391113, 2.368797779083252, 3.506711006164551, 4.644623756408691, 5.782536506652832, 6.920449256896973, 8.058362007141113, 9.19627571105957, 10.334188461303711, 11.472101211547852, 12.610013961791992, 13.747926712036133, 14.885839462280273, 16.023752212524414, 17.161664962768555, 18.299577713012695, 19.437490463256836, 20.575403213500977, 21.71331787109375, 22.85123062133789, 23.98914337158203, 25.127056121826172, 26.264968872070312, 27.402881622314453, 28.540794372558594, 29.678707122802734, 30.816619873046875, 31.954532623291016, 33.092445373535156]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 10.0, 16.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 32.0, 29.0, 37.0, 37.0, 37.0, 42.0, 50.0, 49.0, 46.0, 51.0, 49.0, 43.0, 51.0, 43.0, 37.0, 38.0, 36.0, 30.0, 16.0, 20.0, 11.0, 16.0, 12.0, 20.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.554555892944336, -17.885683059692383, -17.21681022644043, -16.54793930053711, -15.879066467285156, -15.210193634033203, -14.54132080078125, -13.872447967529297, -13.20357608795166, -12.534703254699707, -11.86583137512207, -11.196958541870117, -10.528085708618164, -9.859213829040527, -9.190340995788574, -8.521469116210938, -7.852596282958984, -7.1837239265441895, -6.5148515701293945, -5.845978736877441, -5.1771063804626465, -4.508234024047852, -3.8393611907958984, -3.1704888343811035, -2.5016164779663086, -1.8327440023422241, -1.1638715267181396, -0.4949989318847656, 0.1738734245300293, 0.8427457809448242, 1.5116186141967773, 2.1804909706115723, 2.849363327026367, 3.518235683441162, 4.187108039855957, 4.85598087310791, 5.524853229522705, 6.1937255859375, 6.862598419189453, 7.531470775604248, 8.200343132019043, 8.869215965270996, 9.538087844848633, 10.206960678100586, 10.875833511352539, 11.544705390930176, 12.213578224182129, 12.882450103759766, 13.551322937011719, 14.220195770263672, 14.889067649841309, 15.557940483093262, 16.2268123626709, 16.89568519592285, 17.564558029174805, 18.233430862426758, 18.902301788330078, 19.57117462158203, 20.240047454833984, 20.908920288085938, 21.577791213989258, 22.24666404724121, 22.915536880493164, 23.584409713745117, 24.25328254699707]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 13.0, 4.0, 13.0, 18.0, 26.0, 52.0, 63.0, 93.0, 185.0, 338.0, 666.0, 1585.0, 5447.0, 37278.0, 441513.0, 509324.0, 42764.0, 5981.0, 1639.0, 704.0, 292.0, 194.0, 126.0, 70.0, 50.0, 30.0, 32.0, 13.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0], "bins": [-50.65625, -49.421630859375, -48.18701171875, -46.952392578125, -45.7177734375, -44.483154296875, -43.24853515625, -42.013916015625, -40.779296875, -39.544677734375, -38.31005859375, -37.075439453125, -35.8408203125, -34.606201171875, -33.37158203125, -32.136962890625, -30.90234375, -29.667724609375, -28.43310546875, -27.198486328125, -25.9638671875, -24.729248046875, -23.49462890625, -22.260009765625, -21.025390625, -19.790771484375, -18.55615234375, -17.321533203125, -16.0869140625, -14.852294921875, -13.61767578125, -12.383056640625, -11.1484375, -9.913818359375, -8.67919921875, -7.444580078125, -6.2099609375, -4.975341796875, -3.74072265625, -2.506103515625, -1.271484375, -0.036865234375, 1.19775390625, 2.432373046875, 3.6669921875, 4.901611328125, 6.13623046875, 7.370849609375, 8.60546875, 9.840087890625, 11.07470703125, 12.309326171875, 13.5439453125, 14.778564453125, 16.01318359375, 17.247802734375, 18.482421875, 19.717041015625, 20.95166015625, 22.186279296875, 23.4208984375, 24.655517578125, 25.89013671875, 27.124755859375, 28.359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 17.0, 20.0, 42.0, 37.0, 61.0, 91.0, 129.0, 111.0, 114.0, 87.0, 87.0, 59.0, 51.0, 35.0, 23.0, 11.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.186248779296875, -3.02679443359375, -2.867340087890625, -2.7078857421875, -2.548431396484375, -2.38897705078125, -2.229522705078125, -2.070068359375, -1.910614013671875, -1.75115966796875, -1.591705322265625, -1.4322509765625, -1.272796630859375, -1.11334228515625, -0.953887939453125, -0.79443359375, -0.634979248046875, -0.47552490234375, -0.316070556640625, -0.1566162109375, 0.002838134765625, 0.16229248046875, 0.321746826171875, 0.481201171875, 0.640655517578125, 0.80010986328125, 0.959564208984375, 1.1190185546875, 1.278472900390625, 1.43792724609375, 1.597381591796875, 1.7568359375, 1.916290283203125, 2.07574462890625, 2.235198974609375, 2.3946533203125, 2.554107666015625, 2.71356201171875, 2.873016357421875, 3.032470703125, 3.191925048828125, 3.35137939453125, 3.510833740234375, 3.6702880859375, 3.829742431640625, 3.98919677734375, 4.148651123046875, 4.30810546875, 4.467559814453125, 4.62701416015625, 4.786468505859375, 4.9459228515625, 5.105377197265625, 5.26483154296875, 5.424285888671875, 5.583740234375, 5.743194580078125, 5.90264892578125, 6.062103271484375, 6.2215576171875, 6.381011962890625, 6.54046630859375, 6.699920654296875, 6.859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 5.0, 7.0, 7.0, 14.0, 23.0, 38.0, 62.0, 84.0, 91.0, 167.0, 234.0, 343.0, 587.0, 1180.0, 2756.0, 7887.0, 26492.0, 96854.0, 328316.0, 402681.0, 128377.0, 35601.0, 10078.0, 3421.0, 1393.0, 669.0, 425.0, 241.0, 178.0, 119.0, 68.0, 43.0, 43.0, 24.0, 7.0, 13.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.66943359375, -11.2685546875, -10.86767578125, -10.466796875, -10.06591796875, -9.6650390625, -9.26416015625, -8.86328125, -8.46240234375, -8.0615234375, -7.66064453125, -7.259765625, -6.85888671875, -6.4580078125, -6.05712890625, -5.65625, -5.25537109375, -4.8544921875, -4.45361328125, -4.052734375, -3.65185546875, -3.2509765625, -2.85009765625, -2.44921875, -2.04833984375, -1.6474609375, -1.24658203125, -0.845703125, -0.44482421875, -0.0439453125, 0.35693359375, 0.7578125, 1.15869140625, 1.5595703125, 1.96044921875, 2.361328125, 2.76220703125, 3.1630859375, 3.56396484375, 3.96484375, 4.36572265625, 4.7666015625, 5.16748046875, 5.568359375, 5.96923828125, 6.3701171875, 6.77099609375, 7.171875, 7.57275390625, 7.9736328125, 8.37451171875, 8.775390625, 9.17626953125, 9.5771484375, 9.97802734375, 10.37890625, 10.77978515625, 11.1806640625, 11.58154296875, 11.982421875, 12.38330078125, 12.7841796875, 13.18505859375, 13.5859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 3.0, 9.0, 9.0, 11.0, 13.0, 10.0, 15.0, 20.0, 21.0, 29.0, 31.0, 25.0, 20.0, 30.0, 31.0, 37.0, 29.0, 44.0, 32.0, 31.0, 28.0, 38.0, 34.0, 53.0, 28.0, 31.0, 33.0, 30.0, 25.0, 41.0, 22.0, 22.0, 18.0, 17.0, 20.0, 19.0, 11.0, 19.0, 7.0, 14.0, 2.0, 4.0, 11.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.72265625, -6.495849609375, -6.26904296875, -6.042236328125, -5.8154296875, -5.588623046875, -5.36181640625, -5.135009765625, -4.908203125, -4.681396484375, -4.45458984375, -4.227783203125, -4.0009765625, -3.774169921875, -3.54736328125, -3.320556640625, -3.09375, -2.866943359375, -2.64013671875, -2.413330078125, -2.1865234375, -1.959716796875, -1.73291015625, -1.506103515625, -1.279296875, -1.052490234375, -0.82568359375, -0.598876953125, -0.3720703125, -0.145263671875, 0.08154296875, 0.308349609375, 0.53515625, 0.761962890625, 0.98876953125, 1.215576171875, 1.4423828125, 1.669189453125, 1.89599609375, 2.122802734375, 2.349609375, 2.576416015625, 2.80322265625, 3.030029296875, 3.2568359375, 3.483642578125, 3.71044921875, 3.937255859375, 4.1640625, 4.390869140625, 4.61767578125, 4.844482421875, 5.0712890625, 5.298095703125, 5.52490234375, 5.751708984375, 5.978515625, 6.205322265625, 6.43212890625, 6.658935546875, 6.8857421875, 7.112548828125, 7.33935546875, 7.566162109375, 7.79296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 12.0, 20.0, 14.0, 28.0, 45.0, 70.0, 113.0, 260.0, 557.0, 1748.0, 6195.0, 28932.0, 221458.0, 675841.0, 92545.0, 15163.0, 3688.0, 1066.0, 399.0, 173.0, 78.0, 54.0, 22.0, 23.0, 16.0, 17.0, 11.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.8270263671875, -13.411865234375, -12.9967041015625, -12.58154296875, -12.1663818359375, -11.751220703125, -11.3360595703125, -10.9208984375, -10.5057373046875, -10.090576171875, -9.6754150390625, -9.26025390625, -8.8450927734375, -8.429931640625, -8.0147705078125, -7.599609375, -7.1844482421875, -6.769287109375, -6.3541259765625, -5.93896484375, -5.5238037109375, -5.108642578125, -4.6934814453125, -4.2783203125, -3.8631591796875, -3.447998046875, -3.0328369140625, -2.61767578125, -2.2025146484375, -1.787353515625, -1.3721923828125, -0.95703125, -0.5418701171875, -0.126708984375, 0.2884521484375, 0.70361328125, 1.1187744140625, 1.533935546875, 1.9490966796875, 2.3642578125, 2.7794189453125, 3.194580078125, 3.6097412109375, 4.02490234375, 4.4400634765625, 4.855224609375, 5.2703857421875, 5.685546875, 6.1007080078125, 6.515869140625, 6.9310302734375, 7.34619140625, 7.7613525390625, 8.176513671875, 8.5916748046875, 9.0068359375, 9.4219970703125, 9.837158203125, 10.2523193359375, 10.66748046875, 11.0826416015625, 11.497802734375, 11.9129638671875, 12.328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 5.0, 11.0, 18.0, 20.0, 22.0, 29.0, 47.0, 61.0, 97.0, 156.0, 155.0, 108.0, 71.0, 41.0, 34.0, 29.0, 15.0, 20.0, 12.0, 6.0, 12.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016269683837890625, -0.0015861988067626953, -0.0015454292297363281, -0.001504659652709961, -0.0014638900756835938, -0.0014231204986572266, -0.0013823509216308594, -0.0013415813446044922, -0.001300811767578125, -0.0012600421905517578, -0.0012192726135253906, -0.0011785030364990234, -0.0011377334594726562, -0.001096963882446289, -0.0010561943054199219, -0.0010154247283935547, -0.0009746551513671875, -0.0009338855743408203, -0.0008931159973144531, -0.0008523464202880859, -0.0008115768432617188, -0.0007708072662353516, -0.0007300376892089844, -0.0006892681121826172, -0.00064849853515625, -0.0006077289581298828, -0.0005669593811035156, -0.0005261898040771484, -0.00048542022705078125, -0.00044465065002441406, -0.0004038810729980469, -0.0003631114959716797, -0.0003223419189453125, -0.0002815723419189453, -0.00024080276489257812, -0.00020003318786621094, -0.00015926361083984375, -0.00011849403381347656, -7.772445678710938e-05, -3.695487976074219e-05, 3.814697265625e-06, 4.458427429199219e-05, 8.535385131835938e-05, 0.00012612342834472656, 0.00016689300537109375, 0.00020766258239746094, 0.0002484321594238281, 0.0002892017364501953, 0.0003299713134765625, 0.0003707408905029297, 0.0004115104675292969, 0.00045228004455566406, 0.0004930496215820312, 0.0005338191986083984, 0.0005745887756347656, 0.0006153583526611328, 0.0006561279296875, 0.0006968975067138672, 0.0007376670837402344, 0.0007784366607666016, 0.0008192062377929688, 0.0008599758148193359, 0.0009007453918457031, 0.0009415149688720703, 0.0009822845458984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 18.0, 22.0, 23.0, 53.0, 75.0, 119.0, 232.0, 562.0, 1678.0, 6554.0, 35321.0, 407865.0, 540351.0, 44605.0, 7754.0, 1991.0, 670.0, 281.0, 154.0, 75.0, 59.0, 32.0, 16.0, 13.0, 5.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.6875, -17.1829833984375, -16.678466796875, -16.1739501953125, -15.66943359375, -15.1649169921875, -14.660400390625, -14.1558837890625, -13.6513671875, -13.1468505859375, -12.642333984375, -12.1378173828125, -11.63330078125, -11.1287841796875, -10.624267578125, -10.1197509765625, -9.615234375, -9.1107177734375, -8.606201171875, -8.1016845703125, -7.59716796875, -7.0926513671875, -6.588134765625, -6.0836181640625, -5.5791015625, -5.0745849609375, -4.570068359375, -4.0655517578125, -3.56103515625, -3.0565185546875, -2.552001953125, -2.0474853515625, -1.54296875, -1.0384521484375, -0.533935546875, -0.0294189453125, 0.47509765625, 0.9796142578125, 1.484130859375, 1.9886474609375, 2.4931640625, 2.9976806640625, 3.502197265625, 4.0067138671875, 4.51123046875, 5.0157470703125, 5.520263671875, 6.0247802734375, 6.529296875, 7.0338134765625, 7.538330078125, 8.0428466796875, 8.54736328125, 9.0518798828125, 9.556396484375, 10.0609130859375, 10.5654296875, 11.0699462890625, 11.574462890625, 12.0789794921875, 12.58349609375, 13.0880126953125, 13.592529296875, 14.0970458984375, 14.6015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 13.0, 6.0, 13.0, 12.0, 25.0, 31.0, 42.0, 51.0, 65.0, 86.0, 122.0, 126.0, 85.0, 89.0, 53.0, 43.0, 35.0, 18.0, 22.0, 9.0, 15.0, 7.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19921875, -4.98333740234375, -4.7674560546875, -4.55157470703125, -4.335693359375, -4.11981201171875, -3.9039306640625, -3.68804931640625, -3.47216796875, -3.25628662109375, -3.0404052734375, -2.82452392578125, -2.608642578125, -2.39276123046875, -2.1768798828125, -1.96099853515625, -1.7451171875, -1.52923583984375, -1.3133544921875, -1.09747314453125, -0.881591796875, -0.66571044921875, -0.4498291015625, -0.23394775390625, -0.01806640625, 0.19781494140625, 0.4136962890625, 0.62957763671875, 0.845458984375, 1.06134033203125, 1.2772216796875, 1.49310302734375, 1.708984375, 1.92486572265625, 2.1407470703125, 2.35662841796875, 2.572509765625, 2.78839111328125, 3.0042724609375, 3.22015380859375, 3.43603515625, 3.65191650390625, 3.8677978515625, 4.08367919921875, 4.299560546875, 4.51544189453125, 4.7313232421875, 4.94720458984375, 5.1630859375, 5.37896728515625, 5.5948486328125, 5.81072998046875, 6.026611328125, 6.24249267578125, 6.4583740234375, 6.67425537109375, 6.89013671875, 7.10601806640625, 7.3218994140625, 7.53778076171875, 7.753662109375, 7.96954345703125, 8.1854248046875, 8.40130615234375, 8.6171875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 8.0, 12.0, 27.0, 41.0, 66.0, 108.0, 129.0, 162.0, 157.0, 117.0, 71.0, 49.0, 22.0, 15.0, 6.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.517333984375, -57.0521354675293, -53.586936950683594, -50.121742248535156, -46.65654373168945, -43.19134521484375, -39.72614669799805, -36.260948181152344, -32.795753479003906, -29.330554962158203, -25.865358352661133, -22.40015983581543, -18.93496322631836, -15.469764709472656, -12.004566192626953, -8.539369583129883, -5.074169158935547, -1.608971357345581, 1.8562264442443848, 5.32142448425293, 8.786622047424316, 12.251819610595703, 15.717018127441406, 19.182214736938477, 22.64741325378418, 26.112611770629883, 29.577808380126953, 33.043006896972656, 36.50820541381836, 39.97340393066406, 43.4385986328125, 46.9037971496582, 50.368995666503906, 53.83419418334961, 57.29939270019531, 60.76458740234375, 64.22978973388672, 67.69498443603516, 71.16018676757812, 74.62538146972656, 78.090576171875, 81.55577087402344, 85.0209732055664, 88.48616790771484, 91.95137023925781, 95.41656494140625, 98.88175964355469, 102.34696197509766, 105.81216430664062, 109.27735900878906, 112.74256134033203, 116.20775604248047, 119.67295837402344, 123.13815307617188, 126.60334777832031, 130.06854248046875, 133.5337371826172, 136.99893188476562, 140.46412658691406, 143.92933654785156, 147.39453125, 150.85972595214844, 154.32492065429688, 157.7901153564453, 161.2553253173828]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 6.0, 7.0, 6.0, 10.0, 10.0, 21.0, 17.0, 24.0, 22.0, 22.0, 25.0, 31.0, 26.0, 32.0, 34.0, 33.0, 46.0, 33.0, 29.0, 38.0, 36.0, 43.0, 48.0, 37.0, 35.0, 27.0, 38.0, 36.0, 30.0, 17.0, 28.0, 12.0, 21.0, 15.0, 15.0, 14.0, 5.0, 10.0, 8.0, 5.0, 7.0, 4.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-41.34233093261719, -40.033485412597656, -38.72464370727539, -37.41579818725586, -36.106956481933594, -34.79811096191406, -33.48926544189453, -32.180423736572266, -30.871578216552734, -29.562734603881836, -28.253890991210938, -26.945045471191406, -25.636201858520508, -24.32735824584961, -23.01851463317871, -21.709671020507812, -20.400827407836914, -19.091983795166016, -17.783140182495117, -16.47429656982422, -15.165451049804688, -13.856607437133789, -12.54776382446289, -11.238919258117676, -9.930075645446777, -8.621232032775879, -7.312387466430664, -6.003543853759766, -4.694699764251709, -3.3858556747436523, -2.077012062072754, -0.7681674957275391, 0.5406761169433594, 1.8495200872421265, 3.1583640575408936, 4.467207908630371, 5.776051998138428, 7.084896087646484, 8.393739700317383, 9.702584266662598, 11.011427879333496, 12.320271492004395, 13.62911605834961, 14.937959671020508, 16.246803283691406, 17.555648803710938, 18.864490509033203, 20.173336029052734, 21.482179641723633, 22.79102325439453, 24.09986686706543, 25.408710479736328, 26.71755599975586, 28.026399612426758, 29.335243225097656, 30.644088745117188, 31.952930450439453, 33.261775970458984, 34.57061767578125, 35.87946319580078, 37.18830490112305, 38.49715042114258, 39.805992126464844, 41.114837646484375, 42.423683166503906]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 16.0, 11.0, 8.0, 41.0, 49.0, 73.0, 105.0, 204.0, 355.0, 751.0, 1644.0, 4582.0, 20646.0, 210670.0, 3787669.0, 144107.0, 16275.0, 3984.0, 1392.0, 651.0, 324.0, 216.0, 145.0, 92.0, 67.0, 58.0, 28.0, 17.0, 21.0, 16.0, 6.0, 7.0, 9.0, 3.0, 5.0, 6.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.8125, -30.455078125, -29.09765625, -27.740234375, -26.3828125, -25.025390625, -23.66796875, -22.310546875, -20.953125, -19.595703125, -18.23828125, -16.880859375, -15.5234375, -14.166015625, -12.80859375, -11.451171875, -10.09375, -8.736328125, -7.37890625, -6.021484375, -4.6640625, -3.306640625, -1.94921875, -0.591796875, 0.765625, 2.123046875, 3.48046875, 4.837890625, 6.1953125, 7.552734375, 8.91015625, 10.267578125, 11.625, 12.982421875, 14.33984375, 15.697265625, 17.0546875, 18.412109375, 19.76953125, 21.126953125, 22.484375, 23.841796875, 25.19921875, 26.556640625, 27.9140625, 29.271484375, 30.62890625, 31.986328125, 33.34375, 34.701171875, 36.05859375, 37.416015625, 38.7734375, 40.130859375, 41.48828125, 42.845703125, 44.203125, 45.560546875, 46.91796875, 48.275390625, 49.6328125, 50.990234375, 52.34765625, 53.705078125, 55.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 19.0, 23.0, 33.0, 41.0, 68.0, 79.0, 116.0, 125.0, 103.0, 90.0, 95.0, 65.0, 55.0, 32.0, 22.0, 8.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37890625, -3.21807861328125, -3.0572509765625, -2.89642333984375, -2.735595703125, -2.57476806640625, -2.4139404296875, -2.25311279296875, -2.09228515625, -1.93145751953125, -1.7706298828125, -1.60980224609375, -1.448974609375, -1.28814697265625, -1.1273193359375, -0.96649169921875, -0.8056640625, -0.64483642578125, -0.4840087890625, -0.32318115234375, -0.162353515625, -0.00152587890625, 0.1593017578125, 0.32012939453125, 0.48095703125, 0.64178466796875, 0.8026123046875, 0.96343994140625, 1.124267578125, 1.28509521484375, 1.4459228515625, 1.60675048828125, 1.767578125, 1.92840576171875, 2.0892333984375, 2.25006103515625, 2.410888671875, 2.57171630859375, 2.7325439453125, 2.89337158203125, 3.05419921875, 3.21502685546875, 3.3758544921875, 3.53668212890625, 3.697509765625, 3.85833740234375, 4.0191650390625, 4.17999267578125, 4.3408203125, 4.50164794921875, 4.6624755859375, 4.82330322265625, 4.984130859375, 5.14495849609375, 5.3057861328125, 5.46661376953125, 5.62744140625, 5.78826904296875, 5.9490966796875, 6.10992431640625, 6.270751953125, 6.43157958984375, 6.5924072265625, 6.75323486328125, 6.9140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 9.0, 6.0, 20.0, 18.0, 18.0, 19.0, 43.0, 63.0, 108.0, 131.0, 270.0, 519.0, 1108.0, 3176.0, 11418.0, 53983.0, 415936.0, 3319884.0, 327402.0, 45297.0, 9771.0, 2831.0, 1067.0, 446.0, 245.0, 146.0, 97.0, 73.0, 48.0, 36.0, 24.0, 18.0, 11.0, 10.0, 11.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.953125, -26.2333984375, -25.513671875, -24.7939453125, -24.07421875, -23.3544921875, -22.634765625, -21.9150390625, -21.1953125, -20.4755859375, -19.755859375, -19.0361328125, -18.31640625, -17.5966796875, -16.876953125, -16.1572265625, -15.4375, -14.7177734375, -13.998046875, -13.2783203125, -12.55859375, -11.8388671875, -11.119140625, -10.3994140625, -9.6796875, -8.9599609375, -8.240234375, -7.5205078125, -6.80078125, -6.0810546875, -5.361328125, -4.6416015625, -3.921875, -3.2021484375, -2.482421875, -1.7626953125, -1.04296875, -0.3232421875, 0.396484375, 1.1162109375, 1.8359375, 2.5556640625, 3.275390625, 3.9951171875, 4.71484375, 5.4345703125, 6.154296875, 6.8740234375, 7.59375, 8.3134765625, 9.033203125, 9.7529296875, 10.47265625, 11.1923828125, 11.912109375, 12.6318359375, 13.3515625, 14.0712890625, 14.791015625, 15.5107421875, 16.23046875, 16.9501953125, 17.669921875, 18.3896484375, 19.109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 17.0, 32.0, 35.0, 81.0, 115.0, 243.0, 466.0, 1363.0, 889.0, 358.0, 191.0, 123.0, 55.0, 36.0, 15.0, 19.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.42327880859375, -5.1004638671875, -4.77764892578125, -4.454833984375, -4.13201904296875, -3.8092041015625, -3.48638916015625, -3.16357421875, -2.84075927734375, -2.5179443359375, -2.19512939453125, -1.872314453125, -1.54949951171875, -1.2266845703125, -0.90386962890625, -0.5810546875, -0.25823974609375, 0.0645751953125, 0.38739013671875, 0.710205078125, 1.03302001953125, 1.3558349609375, 1.67864990234375, 2.00146484375, 2.32427978515625, 2.6470947265625, 2.96990966796875, 3.292724609375, 3.61553955078125, 3.9383544921875, 4.26116943359375, 4.583984375, 4.90679931640625, 5.2296142578125, 5.55242919921875, 5.875244140625, 6.19805908203125, 6.5208740234375, 6.84368896484375, 7.16650390625, 7.48931884765625, 7.8121337890625, 8.13494873046875, 8.457763671875, 8.78057861328125, 9.1033935546875, 9.42620849609375, 9.7490234375, 10.07183837890625, 10.3946533203125, 10.71746826171875, 11.040283203125, 11.36309814453125, 11.6859130859375, 12.00872802734375, 12.33154296875, 12.65435791015625, 12.9771728515625, 13.29998779296875, 13.622802734375, 13.94561767578125, 14.2684326171875, 14.59124755859375, 14.9140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 7.0, 2.0, 12.0, 10.0, 19.0, 19.0, 24.0, 38.0, 47.0, 59.0, 70.0, 84.0, 79.0, 94.0, 86.0, 89.0, 79.0, 61.0, 40.0, 22.0, 20.0, 15.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.11328887939453, -33.76093673706055, -32.40858840942383, -31.056236267089844, -29.70388412475586, -28.351533889770508, -26.999183654785156, -25.646831512451172, -24.29448127746582, -22.94213104248047, -21.589778900146484, -20.237428665161133, -18.88507843017578, -17.532726287841797, -16.180376052856445, -14.828024864196777, -13.47567367553711, -12.123322486877441, -10.770971298217773, -9.418621063232422, -8.066269874572754, -6.713918685913086, -5.361568450927734, -4.009217262268066, -2.6568660736083984, -1.3045151233673096, 0.0478358268737793, 1.400186538696289, 2.752537727355957, 4.104888916015625, 5.457239151000977, 6.8095903396606445, 8.161941528320312, 9.51429271697998, 10.866643905639648, 12.218994140625, 13.571345329284668, 14.923696517944336, 16.276046752929688, 17.628398895263672, 18.980749130249023, 20.333099365234375, 21.68545150756836, 23.03780174255371, 24.390151977539062, 25.742504119873047, 27.0948543548584, 28.44720458984375, 29.799556732177734, 31.151906967163086, 32.50425720214844, 33.85660934448242, 35.208961486816406, 36.561309814453125, 37.91366195678711, 39.266014099121094, 40.61836242675781, 41.9707145690918, 43.323062896728516, 44.6754150390625, 46.027767181396484, 47.38011932373047, 48.73246765136719, 50.08481979370117, 51.437171936035156]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 6.0, 9.0, 6.0, 14.0, 17.0, 14.0, 21.0, 22.0, 27.0, 29.0, 40.0, 47.0, 32.0, 45.0, 44.0, 40.0, 56.0, 37.0, 38.0, 48.0, 39.0, 37.0, 42.0, 38.0, 46.0, 32.0, 27.0, 22.0, 16.0, 21.0, 9.0, 15.0, 10.0, 9.0, 11.0, 10.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.292917251586914, -22.46396255493164, -21.635007858276367, -20.806053161621094, -19.977100372314453, -19.148143768310547, -18.319190979003906, -17.490236282348633, -16.66128158569336, -15.832326889038086, -15.003372192382812, -14.174418449401855, -13.345463752746582, -12.516509056091309, -11.687555313110352, -10.858600616455078, -10.029645919799805, -9.200691223144531, -8.371736526489258, -7.542782783508301, -6.713828086853027, -5.884873390197754, -5.055919170379639, -4.226964950561523, -3.39801025390625, -2.5690557956695557, -1.7401013374328613, -0.911146879196167, -0.08219242095947266, 0.7467622756958008, 1.575716495513916, 2.4046707153320312, 3.233623504638672, 4.062578201293945, 4.8915324211120605, 5.720486640930176, 6.549441337585449, 7.378396034240723, 8.20734977722168, 9.036304473876953, 9.865259170532227, 10.6942138671875, 11.523168563842773, 12.35212230682373, 13.181077003479004, 14.010031700134277, 14.838985443115234, 15.667940139770508, 16.49689483642578, 17.325849533081055, 18.154804229736328, 18.9837589263916, 19.812713623046875, 20.641666412353516, 21.47062110900879, 22.299575805664062, 23.128530502319336, 23.95748519897461, 24.786439895629883, 25.615394592285156, 26.444347381591797, 27.273303985595703, 28.102256774902344, 28.931211471557617, 29.76016616821289]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 9.0, 12.0, 18.0, 36.0, 52.0, 67.0, 105.0, 196.0, 377.0, 786.0, 2151.0, 10022.0, 88933.0, 831478.0, 99485.0, 10835.0, 2286.0, 797.0, 375.0, 215.0, 109.0, 66.0, 31.0, 34.0, 22.0, 8.0, 17.0, 3.0, 2.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.125, -39.73193359375, -38.3388671875, -36.94580078125, -35.552734375, -34.15966796875, -32.7666015625, -31.37353515625, -29.98046875, -28.58740234375, -27.1943359375, -25.80126953125, -24.408203125, -23.01513671875, -21.6220703125, -20.22900390625, -18.8359375, -17.44287109375, -16.0498046875, -14.65673828125, -13.263671875, -11.87060546875, -10.4775390625, -9.08447265625, -7.69140625, -6.29833984375, -4.9052734375, -3.51220703125, -2.119140625, -0.72607421875, 0.6669921875, 2.06005859375, 3.453125, 4.84619140625, 6.2392578125, 7.63232421875, 9.025390625, 10.41845703125, 11.8115234375, 13.20458984375, 14.59765625, 15.99072265625, 17.3837890625, 18.77685546875, 20.169921875, 21.56298828125, 22.9560546875, 24.34912109375, 25.7421875, 27.13525390625, 28.5283203125, 29.92138671875, 31.314453125, 32.70751953125, 34.1005859375, 35.49365234375, 36.88671875, 38.27978515625, 39.6728515625, 41.06591796875, 42.458984375, 43.85205078125, 45.2451171875, 46.63818359375, 48.03125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 18.0, 20.0, 38.0, 55.0, 62.0, 97.0, 107.0, 113.0, 123.0, 105.0, 76.0, 69.0, 43.0, 32.0, 6.0, 12.0, 11.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.710357666015625, -3.53985595703125, -3.369354248046875, -3.1988525390625, -3.028350830078125, -2.85784912109375, -2.687347412109375, -2.516845703125, -2.346343994140625, -2.17584228515625, -2.005340576171875, -1.8348388671875, -1.664337158203125, -1.49383544921875, -1.323333740234375, -1.15283203125, -0.982330322265625, -0.81182861328125, -0.641326904296875, -0.4708251953125, -0.300323486328125, -0.12982177734375, 0.040679931640625, 0.211181640625, 0.381683349609375, 0.55218505859375, 0.722686767578125, 0.8931884765625, 1.063690185546875, 1.23419189453125, 1.404693603515625, 1.5751953125, 1.745697021484375, 1.91619873046875, 2.086700439453125, 2.2572021484375, 2.427703857421875, 2.59820556640625, 2.768707275390625, 2.939208984375, 3.109710693359375, 3.28021240234375, 3.450714111328125, 3.6212158203125, 3.791717529296875, 3.96221923828125, 4.132720947265625, 4.30322265625, 4.473724365234375, 4.64422607421875, 4.814727783203125, 4.9852294921875, 5.155731201171875, 5.32623291015625, 5.496734619140625, 5.667236328125, 5.837738037109375, 6.00823974609375, 6.178741455078125, 6.3492431640625, 6.519744873046875, 6.69024658203125, 6.860748291015625, 7.03125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 10.0, 15.0, 19.0, 37.0, 42.0, 61.0, 80.0, 100.0, 148.0, 193.0, 326.0, 498.0, 855.0, 1573.0, 3618.0, 8902.0, 23910.0, 69676.0, 250168.0, 504110.0, 119490.0, 39920.0, 13931.0, 5548.0, 2350.0, 1063.0, 660.0, 337.0, 252.0, 160.0, 150.0, 87.0, 66.0, 50.0, 43.0, 25.0, 22.0, 8.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25, -11.8699951171875, -11.489990234375, -11.1099853515625, -10.72998046875, -10.3499755859375, -9.969970703125, -9.5899658203125, -9.2099609375, -8.8299560546875, -8.449951171875, -8.0699462890625, -7.68994140625, -7.3099365234375, -6.929931640625, -6.5499267578125, -6.169921875, -5.7899169921875, -5.409912109375, -5.0299072265625, -4.64990234375, -4.2698974609375, -3.889892578125, -3.5098876953125, -3.1298828125, -2.7498779296875, -2.369873046875, -1.9898681640625, -1.60986328125, -1.2298583984375, -0.849853515625, -0.4698486328125, -0.08984375, 0.2901611328125, 0.670166015625, 1.0501708984375, 1.43017578125, 1.8101806640625, 2.190185546875, 2.5701904296875, 2.9501953125, 3.3302001953125, 3.710205078125, 4.0902099609375, 4.47021484375, 4.8502197265625, 5.230224609375, 5.6102294921875, 5.990234375, 6.3702392578125, 6.750244140625, 7.1302490234375, 7.51025390625, 7.8902587890625, 8.270263671875, 8.6502685546875, 9.0302734375, 9.4102783203125, 9.790283203125, 10.1702880859375, 10.55029296875, 10.9302978515625, 11.310302734375, 11.6903076171875, 12.0703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 11.0, 12.0, 15.0, 19.0, 23.0, 39.0, 26.0, 39.0, 40.0, 44.0, 38.0, 55.0, 44.0, 50.0, 60.0, 49.0, 40.0, 53.0, 48.0, 34.0, 46.0, 36.0, 25.0, 33.0, 27.0, 15.0, 21.0, 10.0, 15.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.0714111328125, -7.752197265625, -7.4329833984375, -7.11376953125, -6.7945556640625, -6.475341796875, -6.1561279296875, -5.8369140625, -5.5177001953125, -5.198486328125, -4.8792724609375, -4.56005859375, -4.2408447265625, -3.921630859375, -3.6024169921875, -3.283203125, -2.9639892578125, -2.644775390625, -2.3255615234375, -2.00634765625, -1.6871337890625, -1.367919921875, -1.0487060546875, -0.7294921875, -0.4102783203125, -0.091064453125, 0.2281494140625, 0.54736328125, 0.8665771484375, 1.185791015625, 1.5050048828125, 1.82421875, 2.1434326171875, 2.462646484375, 2.7818603515625, 3.10107421875, 3.4202880859375, 3.739501953125, 4.0587158203125, 4.3779296875, 4.6971435546875, 5.016357421875, 5.3355712890625, 5.65478515625, 5.9739990234375, 6.293212890625, 6.6124267578125, 6.931640625, 7.2508544921875, 7.570068359375, 7.8892822265625, 8.20849609375, 8.5277099609375, 8.846923828125, 9.1661376953125, 9.4853515625, 9.8045654296875, 10.123779296875, 10.4429931640625, 10.76220703125, 11.0814208984375, 11.400634765625, 11.7198486328125, 12.0390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 9.0, 3.0, 5.0, 16.0, 13.0, 19.0, 27.0, 43.0, 55.0, 86.0, 160.0, 310.0, 682.0, 1611.0, 4617.0, 14834.0, 58425.0, 394976.0, 479008.0, 68387.0, 16743.0, 5250.0, 1777.0, 700.0, 329.0, 160.0, 68.0, 69.0, 41.0, 30.0, 29.0, 12.0, 12.0, 8.0, 10.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.7109375, -8.46240234375, -8.2138671875, -7.96533203125, -7.716796875, -7.46826171875, -7.2197265625, -6.97119140625, -6.72265625, -6.47412109375, -6.2255859375, -5.97705078125, -5.728515625, -5.47998046875, -5.2314453125, -4.98291015625, -4.734375, -4.48583984375, -4.2373046875, -3.98876953125, -3.740234375, -3.49169921875, -3.2431640625, -2.99462890625, -2.74609375, -2.49755859375, -2.2490234375, -2.00048828125, -1.751953125, -1.50341796875, -1.2548828125, -1.00634765625, -0.7578125, -0.50927734375, -0.2607421875, -0.01220703125, 0.236328125, 0.48486328125, 0.7333984375, 0.98193359375, 1.23046875, 1.47900390625, 1.7275390625, 1.97607421875, 2.224609375, 2.47314453125, 2.7216796875, 2.97021484375, 3.21875, 3.46728515625, 3.7158203125, 3.96435546875, 4.212890625, 4.46142578125, 4.7099609375, 4.95849609375, 5.20703125, 5.45556640625, 5.7041015625, 5.95263671875, 6.201171875, 6.44970703125, 6.6982421875, 6.94677734375, 7.1953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 4.0, 14.0, 9.0, 13.0, 11.0, 21.0, 16.0, 27.0, 35.0, 67.0, 115.0, 220.0, 189.0, 64.0, 39.0, 33.0, 21.0, 21.0, 6.0, 12.0, 12.0, 11.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0015316009521484375, -0.001493014395236969, -0.0014544278383255005, -0.001415841281414032, -0.0013772547245025635, -0.001338668167591095, -0.0013000816106796265, -0.001261495053768158, -0.0012229084968566895, -0.001184321939945221, -0.0011457353830337524, -0.001107148826122284, -0.0010685622692108154, -0.001029975712299347, -0.0009913891553878784, -0.0009528025984764099, -0.0009142160415649414, -0.0008756294846534729, -0.0008370429277420044, -0.0007984563708305359, -0.0007598698139190674, -0.0007212832570075989, -0.0006826967000961304, -0.0006441101431846619, -0.0006055235862731934, -0.0005669370293617249, -0.0005283504724502563, -0.0004897639155387878, -0.00045117735862731934, -0.00041259080171585083, -0.0003740042448043823, -0.0003354176878929138, -0.0002968311309814453, -0.0002582445740699768, -0.0002196580171585083, -0.0001810714602470398, -0.0001424849033355713, -0.00010389834642410278, -6.531178951263428e-05, -2.672523260116577e-05, 1.1861324310302734e-05, 5.044788122177124e-05, 8.903443813323975e-05, 0.00012762099504470825, 0.00016620755195617676, 0.00020479410886764526, 0.00024338066577911377, 0.0002819672226905823, 0.0003205537796020508, 0.0003591403365135193, 0.0003977268934249878, 0.0004363134503364563, 0.0004749000072479248, 0.0005134865641593933, 0.0005520731210708618, 0.0005906596779823303, 0.0006292462348937988, 0.0006678327918052673, 0.0007064193487167358, 0.0007450059056282043, 0.0007835924625396729, 0.0008221790194511414, 0.0008607655763626099, 0.0008993521332740784, 0.0009379386901855469]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 5.0, 23.0, 27.0, 36.0, 62.0, 104.0, 181.0, 302.0, 667.0, 1513.0, 4067.0, 14047.0, 66311.0, 563851.0, 336773.0, 44759.0, 10198.0, 3193.0, 1160.0, 551.0, 266.0, 161.0, 111.0, 56.0, 33.0, 26.0, 20.0, 18.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.6171875, -10.329345703125, -10.04150390625, -9.753662109375, -9.4658203125, -9.177978515625, -8.89013671875, -8.602294921875, -8.314453125, -8.026611328125, -7.73876953125, -7.450927734375, -7.1630859375, -6.875244140625, -6.58740234375, -6.299560546875, -6.01171875, -5.723876953125, -5.43603515625, -5.148193359375, -4.8603515625, -4.572509765625, -4.28466796875, -3.996826171875, -3.708984375, -3.421142578125, -3.13330078125, -2.845458984375, -2.5576171875, -2.269775390625, -1.98193359375, -1.694091796875, -1.40625, -1.118408203125, -0.83056640625, -0.542724609375, -0.2548828125, 0.032958984375, 0.32080078125, 0.608642578125, 0.896484375, 1.184326171875, 1.47216796875, 1.760009765625, 2.0478515625, 2.335693359375, 2.62353515625, 2.911376953125, 3.19921875, 3.487060546875, 3.77490234375, 4.062744140625, 4.3505859375, 4.638427734375, 4.92626953125, 5.214111328125, 5.501953125, 5.789794921875, 6.07763671875, 6.365478515625, 6.6533203125, 6.941162109375, 7.22900390625, 7.516845703125, 7.8046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 0.0, 7.0, 3.0, 2.0, 10.0, 13.0, 17.0, 24.0, 22.0, 48.0, 57.0, 80.0, 130.0, 171.0, 132.0, 76.0, 56.0, 32.0, 33.0, 26.0, 20.0, 12.0, 14.0, 3.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.76953125, -7.591217041015625, -7.41290283203125, -7.234588623046875, -7.0562744140625, -6.877960205078125, -6.69964599609375, -6.521331787109375, -6.343017578125, -6.164703369140625, -5.98638916015625, -5.808074951171875, -5.6297607421875, -5.451446533203125, -5.27313232421875, -5.094818115234375, -4.91650390625, -4.738189697265625, -4.55987548828125, -4.381561279296875, -4.2032470703125, -4.024932861328125, -3.84661865234375, -3.668304443359375, -3.489990234375, -3.311676025390625, -3.13336181640625, -2.955047607421875, -2.7767333984375, -2.598419189453125, -2.42010498046875, -2.241790771484375, -2.0634765625, -1.885162353515625, -1.70684814453125, -1.528533935546875, -1.3502197265625, -1.171905517578125, -0.99359130859375, -0.815277099609375, -0.636962890625, -0.458648681640625, -0.28033447265625, -0.102020263671875, 0.0762939453125, 0.254608154296875, 0.43292236328125, 0.611236572265625, 0.78955078125, 0.967864990234375, 1.14617919921875, 1.324493408203125, 1.5028076171875, 1.681121826171875, 1.85943603515625, 2.037750244140625, 2.216064453125, 2.394378662109375, 2.57269287109375, 2.751007080078125, 2.9293212890625, 3.107635498046875, 3.28594970703125, 3.464263916015625, 3.642578125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 18.0, 40.0, 98.0, 147.0, 208.0, 189.0, 132.0, 89.0, 41.0, 20.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.54129028320312, -113.21691131591797, -108.89253234863281, -104.56814575195312, -100.24376678466797, -95.91938781738281, -91.59500122070312, -87.27062225341797, -82.94624328613281, -78.62186431884766, -74.2974853515625, -69.97309875488281, -65.64871978759766, -61.3243408203125, -56.99995803833008, -52.675575256347656, -48.3511962890625, -44.026817321777344, -39.70243453979492, -35.3780517578125, -31.053672790527344, -26.729291915893555, -22.404911041259766, -18.080530166625977, -13.756149291992188, -9.431768417358398, -5.107387542724609, -0.7830066680908203, 3.5413742065429688, 7.865755081176758, 12.190135955810547, 16.514516830444336, 20.838882446289062, 25.16326332092285, 29.48764419555664, 33.81202697753906, 38.13640594482422, 42.460784912109375, 46.7851676940918, 51.10955047607422, 55.433929443359375, 59.75830841064453, 64.08268737792969, 68.40707397460938, 72.73145294189453, 77.05583190917969, 81.38021850585938, 85.70459747314453, 90.02897644042969, 94.35335540771484, 98.677734375, 103.00212097167969, 107.32649993896484, 111.65087890625, 115.97526550292969, 120.29964447021484, 124.6240234375, 128.9484100341797, 133.2727813720703, 137.59716796875, 141.92153930664062, 146.2459259033203, 150.5703125, 154.89468383789062, 159.2190704345703]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 10.0, 12.0, 17.0, 21.0, 22.0, 19.0, 16.0, 17.0, 31.0, 36.0, 42.0, 42.0, 29.0, 35.0, 45.0, 39.0, 42.0, 39.0, 53.0, 40.0, 36.0, 38.0, 32.0, 32.0, 24.0, 27.0, 22.0, 23.0, 24.0, 17.0, 24.0, 12.0, 12.0, 11.0, 6.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-43.39265441894531, -42.098670959472656, -40.8046875, -39.510704040527344, -38.21672058105469, -36.922733306884766, -35.62874984741211, -34.33476638793945, -33.0407829284668, -31.74679946899414, -30.452816009521484, -29.158830642700195, -27.86484718322754, -26.570863723754883, -25.276878356933594, -23.982894897460938, -22.68891143798828, -21.394927978515625, -20.10094451904297, -18.80695915222168, -17.512975692749023, -16.218992233276367, -14.925007820129395, -13.631023406982422, -12.337039947509766, -11.04305648803711, -9.749072074890137, -8.455087661743164, -7.161104202270508, -5.867120265960693, -4.573136329650879, -3.2791519165039062, -1.98516845703125, -0.6911845207214355, 0.6027994155883789, 1.8967833518981934, 3.190767288208008, 4.484751224517822, 5.778735160827637, 7.072719573974609, 8.366703033447266, 9.660686492919922, 10.954670906066895, 12.248655319213867, 13.542638778686523, 14.83662223815918, 16.13060760498047, 17.424591064453125, 18.71857452392578, 20.012557983398438, 21.306541442871094, 22.600526809692383, 23.89451026916504, 25.188493728637695, 26.482479095458984, 27.77646255493164, 29.070446014404297, 30.364429473876953, 31.65841293334961, 32.952396392822266, 34.24638366699219, 35.540367126464844, 36.8343505859375, 38.128334045410156, 39.42231750488281]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 12.0, 23.0, 30.0, 57.0, 111.0, 206.0, 438.0, 1015.0, 3434.0, 20672.0, 603760.0, 3525151.0, 32386.0, 4549.0, 1268.0, 527.0, 241.0, 124.0, 71.0, 63.0, 42.0, 25.0, 15.0, 14.0, 12.0, 7.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3125, -37.3564453125, -35.400390625, -33.4443359375, -31.48828125, -29.5322265625, -27.576171875, -25.6201171875, -23.6640625, -21.7080078125, -19.751953125, -17.7958984375, -15.83984375, -13.8837890625, -11.927734375, -9.9716796875, -8.015625, -6.0595703125, -4.103515625, -2.1474609375, -0.19140625, 1.7646484375, 3.720703125, 5.6767578125, 7.6328125, 9.5888671875, 11.544921875, 13.5009765625, 15.45703125, 17.4130859375, 19.369140625, 21.3251953125, 23.28125, 25.2373046875, 27.193359375, 29.1494140625, 31.10546875, 33.0615234375, 35.017578125, 36.9736328125, 38.9296875, 40.8857421875, 42.841796875, 44.7978515625, 46.75390625, 48.7099609375, 50.666015625, 52.6220703125, 54.578125, 56.5341796875, 58.490234375, 60.4462890625, 62.40234375, 64.3583984375, 66.314453125, 68.2705078125, 70.2265625, 72.1826171875, 74.138671875, 76.0947265625, 78.05078125, 80.0068359375, 81.962890625, 83.9189453125, 85.875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 15.0, 22.0, 23.0, 35.0, 47.0, 90.0, 86.0, 106.0, 111.0, 115.0, 94.0, 70.0, 55.0, 55.0, 24.0, 18.0, 9.0, 10.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.615631103515625, -3.44805908203125, -3.280487060546875, -3.1129150390625, -2.945343017578125, -2.77777099609375, -2.610198974609375, -2.442626953125, -2.275054931640625, -2.10748291015625, -1.939910888671875, -1.7723388671875, -1.604766845703125, -1.43719482421875, -1.269622802734375, -1.10205078125, -0.934478759765625, -0.76690673828125, -0.599334716796875, -0.4317626953125, -0.264190673828125, -0.09661865234375, 0.070953369140625, 0.238525390625, 0.406097412109375, 0.57366943359375, 0.741241455078125, 0.9088134765625, 1.076385498046875, 1.24395751953125, 1.411529541015625, 1.5791015625, 1.746673583984375, 1.91424560546875, 2.081817626953125, 2.2493896484375, 2.416961669921875, 2.58453369140625, 2.752105712890625, 2.919677734375, 3.087249755859375, 3.25482177734375, 3.422393798828125, 3.5899658203125, 3.757537841796875, 3.92510986328125, 4.092681884765625, 4.26025390625, 4.427825927734375, 4.59539794921875, 4.762969970703125, 4.9305419921875, 5.098114013671875, 5.26568603515625, 5.433258056640625, 5.600830078125, 5.768402099609375, 5.93597412109375, 6.103546142578125, 6.2711181640625, 6.438690185546875, 6.60626220703125, 6.773834228515625, 6.94140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 1.0, 6.0, 5.0, 6.0, 9.0, 20.0, 19.0, 20.0, 42.0, 61.0, 81.0, 118.0, 217.0, 407.0, 794.0, 1990.0, 5424.0, 17762.0, 71384.0, 479924.0, 3313200.0, 238441.0, 45280.0, 12128.0, 3925.0, 1572.0, 630.0, 322.0, 186.0, 104.0, 60.0, 34.0, 26.0, 22.0, 13.0, 11.0, 8.0, 9.0, 10.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.4150390625, -18.705078125, -17.9951171875, -17.28515625, -16.5751953125, -15.865234375, -15.1552734375, -14.4453125, -13.7353515625, -13.025390625, -12.3154296875, -11.60546875, -10.8955078125, -10.185546875, -9.4755859375, -8.765625, -8.0556640625, -7.345703125, -6.6357421875, -5.92578125, -5.2158203125, -4.505859375, -3.7958984375, -3.0859375, -2.3759765625, -1.666015625, -0.9560546875, -0.24609375, 0.4638671875, 1.173828125, 1.8837890625, 2.59375, 3.3037109375, 4.013671875, 4.7236328125, 5.43359375, 6.1435546875, 6.853515625, 7.5634765625, 8.2734375, 8.9833984375, 9.693359375, 10.4033203125, 11.11328125, 11.8232421875, 12.533203125, 13.2431640625, 13.953125, 14.6630859375, 15.373046875, 16.0830078125, 16.79296875, 17.5029296875, 18.212890625, 18.9228515625, 19.6328125, 20.3427734375, 21.052734375, 21.7626953125, 22.47265625, 23.1826171875, 23.892578125, 24.6025390625, 25.3125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 12.0, 18.0, 21.0, 40.0, 48.0, 76.0, 103.0, 188.0, 334.0, 1267.0, 1067.0, 401.0, 173.0, 110.0, 57.0, 48.0, 31.0, 18.0, 15.0, 11.0, 5.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.234375, -10.972900390625, -10.71142578125, -10.449951171875, -10.1884765625, -9.927001953125, -9.66552734375, -9.404052734375, -9.142578125, -8.881103515625, -8.61962890625, -8.358154296875, -8.0966796875, -7.835205078125, -7.57373046875, -7.312255859375, -7.05078125, -6.789306640625, -6.52783203125, -6.266357421875, -6.0048828125, -5.743408203125, -5.48193359375, -5.220458984375, -4.958984375, -4.697509765625, -4.43603515625, -4.174560546875, -3.9130859375, -3.651611328125, -3.39013671875, -3.128662109375, -2.8671875, -2.605712890625, -2.34423828125, -2.082763671875, -1.8212890625, -1.559814453125, -1.29833984375, -1.036865234375, -0.775390625, -0.513916015625, -0.25244140625, 0.009033203125, 0.2705078125, 0.531982421875, 0.79345703125, 1.054931640625, 1.31640625, 1.577880859375, 1.83935546875, 2.100830078125, 2.3623046875, 2.623779296875, 2.88525390625, 3.146728515625, 3.408203125, 3.669677734375, 3.93115234375, 4.192626953125, 4.4541015625, 4.715576171875, 4.97705078125, 5.238525390625, 5.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 24.0, 28.0, 41.0, 44.0, 66.0, 78.0, 78.0, 91.0, 100.0, 101.0, 81.0, 64.0, 54.0, 40.0, 16.0, 23.0, 16.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.32663917541504, -29.106979370117188, -27.887319564819336, -26.667659759521484, -25.447999954223633, -24.22834014892578, -23.008678436279297, -21.789020538330078, -20.569358825683594, -19.349699020385742, -18.13003921508789, -16.91037940979004, -15.690719604492188, -14.471059799194336, -13.251399040222168, -12.031739234924316, -10.812080383300781, -9.59242057800293, -8.372760772705078, -7.153100490570068, -5.933440685272217, -4.713780879974365, -3.4941205978393555, -2.274460792541504, -1.0548009872436523, 0.16485893726348877, 1.3845188617706299, 2.6041789054870605, 3.823838710784912, 5.043498516082764, 6.263158798217773, 7.482818603515625, 8.702476501464844, 9.922136306762695, 11.141796112060547, 12.361455917358398, 13.58111572265625, 14.800775527954102, 16.020435333251953, 17.240097045898438, 18.459754943847656, 19.679414749145508, 20.89907455444336, 22.11873435974121, 23.338394165039062, 24.558053970336914, 25.777713775634766, 26.99737548828125, 28.2170352935791, 29.436695098876953, 30.656354904174805, 31.876014709472656, 33.09567642211914, 34.31533432006836, 35.534996032714844, 36.75465393066406, 37.97431564331055, 39.19397735595703, 40.41363525390625, 41.633296966552734, 42.85295486450195, 44.07261657714844, 45.292274475097656, 46.51193618774414, 47.73159408569336]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 15.0, 11.0, 7.0, 18.0, 13.0, 16.0, 19.0, 24.0, 27.0, 19.0, 33.0, 34.0, 38.0, 56.0, 34.0, 29.0, 41.0, 51.0, 54.0, 39.0, 29.0, 41.0, 47.0, 35.0, 28.0, 40.0, 29.0, 20.0, 23.0, 18.0, 16.0, 20.0, 16.0, 12.0, 8.0, 10.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.020980834960938, -21.336862564086914, -20.65274429321289, -19.9686279296875, -19.284509658813477, -18.600391387939453, -17.91627311706543, -17.232154846191406, -16.548038482666016, -15.863920211791992, -15.179802894592285, -14.495684623718262, -13.811567306518555, -13.127449035644531, -12.443330764770508, -11.759212493896484, -11.075094223022461, -10.390975952148438, -9.70685863494873, -9.022740364074707, -8.338623046875, -7.654504776000977, -6.970386505126953, -6.286268711090088, -5.602150917053223, -4.918033123016357, -4.233915328979492, -3.5497970581054688, -2.8656792640686035, -2.1815614700317383, -1.4974431991577148, -0.8133254051208496, -0.1292095184326172, 0.5549083948135376, 1.2390263080596924, 1.9231443405151367, 2.607262134552002, 3.291379928588867, 3.9754981994628906, 4.659615993499756, 5.343733787536621, 6.027851581573486, 6.711969375610352, 7.396087646484375, 8.080205917358398, 8.764323234558105, 9.448441505432129, 10.132558822631836, 10.81667709350586, 11.500795364379883, 12.18491268157959, 12.869030952453613, 13.55314826965332, 14.237266540527344, 14.921384811401367, 15.60550308227539, 16.28961944580078, 16.973737716674805, 17.657855987548828, 18.34197235107422, 19.026090621948242, 19.710208892822266, 20.39432716369629, 21.078445434570312, 21.762563705444336]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 5.0, 10.0, 10.0, 18.0, 34.0, 60.0, 72.0, 179.0, 313.0, 844.0, 2841.0, 22822.0, 496092.0, 498119.0, 22621.0, 2875.0, 853.0, 353.0, 183.0, 90.0, 69.0, 29.0, 14.0, 17.0, 6.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.109375, -29.553955078125, -27.99853515625, -26.443115234375, -24.8876953125, -23.332275390625, -21.77685546875, -20.221435546875, -18.666015625, -17.110595703125, -15.55517578125, -13.999755859375, -12.4443359375, -10.888916015625, -9.33349609375, -7.778076171875, -6.22265625, -4.667236328125, -3.11181640625, -1.556396484375, -0.0009765625, 1.554443359375, 3.10986328125, 4.665283203125, 6.220703125, 7.776123046875, 9.33154296875, 10.886962890625, 12.4423828125, 13.997802734375, 15.55322265625, 17.108642578125, 18.6640625, 20.219482421875, 21.77490234375, 23.330322265625, 24.8857421875, 26.441162109375, 27.99658203125, 29.552001953125, 31.107421875, 32.662841796875, 34.21826171875, 35.773681640625, 37.3291015625, 38.884521484375, 40.43994140625, 41.995361328125, 43.55078125, 45.106201171875, 46.66162109375, 48.217041015625, 49.7724609375, 51.327880859375, 52.88330078125, 54.438720703125, 55.994140625, 57.549560546875, 59.10498046875, 60.660400390625, 62.2158203125, 63.771240234375, 65.32666015625, 66.882080078125, 68.4375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 17.0, 11.0, 16.0, 39.0, 41.0, 60.0, 89.0, 99.0, 96.0, 106.0, 95.0, 85.0, 80.0, 48.0, 43.0, 28.0, 13.0, 13.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.5552978515625, -3.387939453125, -3.2205810546875, -3.05322265625, -2.8858642578125, -2.718505859375, -2.5511474609375, -2.3837890625, -2.2164306640625, -2.049072265625, -1.8817138671875, -1.71435546875, -1.5469970703125, -1.379638671875, -1.2122802734375, -1.044921875, -0.8775634765625, -0.710205078125, -0.5428466796875, -0.37548828125, -0.2081298828125, -0.040771484375, 0.1265869140625, 0.2939453125, 0.4613037109375, 0.628662109375, 0.7960205078125, 0.96337890625, 1.1307373046875, 1.298095703125, 1.4654541015625, 1.6328125, 1.8001708984375, 1.967529296875, 2.1348876953125, 2.30224609375, 2.4696044921875, 2.636962890625, 2.8043212890625, 2.9716796875, 3.1390380859375, 3.306396484375, 3.4737548828125, 3.64111328125, 3.8084716796875, 3.975830078125, 4.1431884765625, 4.310546875, 4.4779052734375, 4.645263671875, 4.8126220703125, 4.97998046875, 5.1473388671875, 5.314697265625, 5.4820556640625, 5.6494140625, 5.8167724609375, 5.984130859375, 6.1514892578125, 6.31884765625, 6.4862060546875, 6.653564453125, 6.8209228515625, 6.98828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 13.0, 18.0, 12.0, 28.0, 34.0, 56.0, 127.0, 154.0, 332.0, 616.0, 1188.0, 2623.0, 5893.0, 13638.0, 31727.0, 82487.0, 397323.0, 377168.0, 79776.0, 31209.0, 13196.0, 5762.0, 2638.0, 1151.0, 600.0, 311.0, 161.0, 113.0, 61.0, 35.0, 29.0, 18.0, 12.0, 10.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5703125, -11.1844482421875, -10.798583984375, -10.4127197265625, -10.02685546875, -9.6409912109375, -9.255126953125, -8.8692626953125, -8.4833984375, -8.0975341796875, -7.711669921875, -7.3258056640625, -6.93994140625, -6.5540771484375, -6.168212890625, -5.7823486328125, -5.396484375, -5.0106201171875, -4.624755859375, -4.2388916015625, -3.85302734375, -3.4671630859375, -3.081298828125, -2.6954345703125, -2.3095703125, -1.9237060546875, -1.537841796875, -1.1519775390625, -0.76611328125, -0.3802490234375, 0.005615234375, 0.3914794921875, 0.77734375, 1.1632080078125, 1.549072265625, 1.9349365234375, 2.32080078125, 2.7066650390625, 3.092529296875, 3.4783935546875, 3.8642578125, 4.2501220703125, 4.635986328125, 5.0218505859375, 5.40771484375, 5.7935791015625, 6.179443359375, 6.5653076171875, 6.951171875, 7.3370361328125, 7.722900390625, 8.1087646484375, 8.49462890625, 8.8804931640625, 9.266357421875, 9.6522216796875, 10.0380859375, 10.4239501953125, 10.809814453125, 11.1956787109375, 11.58154296875, 11.9674072265625, 12.353271484375, 12.7391357421875, 13.125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 12.0, 13.0, 15.0, 19.0, 32.0, 22.0, 38.0, 34.0, 42.0, 46.0, 54.0, 47.0, 56.0, 46.0, 42.0, 40.0, 57.0, 57.0, 37.0, 43.0, 40.0, 24.0, 30.0, 25.0, 22.0, 25.0, 12.0, 16.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.9296875, -10.5806884765625, -10.231689453125, -9.8826904296875, -9.53369140625, -9.1846923828125, -8.835693359375, -8.4866943359375, -8.1376953125, -7.7886962890625, -7.439697265625, -7.0906982421875, -6.74169921875, -6.3927001953125, -6.043701171875, -5.6947021484375, -5.345703125, -4.9967041015625, -4.647705078125, -4.2987060546875, -3.94970703125, -3.6007080078125, -3.251708984375, -2.9027099609375, -2.5537109375, -2.2047119140625, -1.855712890625, -1.5067138671875, -1.15771484375, -0.8087158203125, -0.459716796875, -0.1107177734375, 0.23828125, 0.5872802734375, 0.936279296875, 1.2852783203125, 1.63427734375, 1.9832763671875, 2.332275390625, 2.6812744140625, 3.0302734375, 3.3792724609375, 3.728271484375, 4.0772705078125, 4.42626953125, 4.7752685546875, 5.124267578125, 5.4732666015625, 5.822265625, 6.1712646484375, 6.520263671875, 6.8692626953125, 7.21826171875, 7.5672607421875, 7.916259765625, 8.2652587890625, 8.6142578125, 8.9632568359375, 9.312255859375, 9.6612548828125, 10.01025390625, 10.3592529296875, 10.708251953125, 11.0572509765625, 11.40625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 13.0, 9.0, 19.0, 26.0, 24.0, 56.0, 61.0, 116.0, 159.0, 294.0, 562.0, 1191.0, 2672.0, 6231.0, 16236.0, 45079.0, 173982.0, 581058.0, 153034.0, 41694.0, 15239.0, 5774.0, 2545.0, 1172.0, 558.0, 267.0, 159.0, 83.0, 73.0, 56.0, 35.0, 15.0, 15.0, 10.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.2152099609375, -5.031982421875, -4.8487548828125, -4.66552734375, -4.4822998046875, -4.299072265625, -4.1158447265625, -3.9326171875, -3.7493896484375, -3.566162109375, -3.3829345703125, -3.19970703125, -3.0164794921875, -2.833251953125, -2.6500244140625, -2.466796875, -2.2835693359375, -2.100341796875, -1.9171142578125, -1.73388671875, -1.5506591796875, -1.367431640625, -1.1842041015625, -1.0009765625, -0.8177490234375, -0.634521484375, -0.4512939453125, -0.26806640625, -0.0848388671875, 0.098388671875, 0.2816162109375, 0.46484375, 0.6480712890625, 0.831298828125, 1.0145263671875, 1.19775390625, 1.3809814453125, 1.564208984375, 1.7474365234375, 1.9306640625, 2.1138916015625, 2.297119140625, 2.4803466796875, 2.66357421875, 2.8468017578125, 3.030029296875, 3.2132568359375, 3.396484375, 3.5797119140625, 3.762939453125, 3.9461669921875, 4.12939453125, 4.3126220703125, 4.495849609375, 4.6790771484375, 4.8623046875, 5.0455322265625, 5.228759765625, 5.4119873046875, 5.59521484375, 5.7784423828125, 5.961669921875, 6.1448974609375, 6.328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 11.0, 12.0, 16.0, 9.0, 17.0, 22.0, 56.0, 133.0, 298.0, 194.0, 80.0, 29.0, 21.0, 12.0, 14.0, 17.0, 7.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011692047119140625, -0.001123771071434021, -0.0010783374309539795, -0.001032903790473938, -0.0009874701499938965, -0.000942036509513855, -0.0008966028690338135, -0.000851169228553772, -0.0008057355880737305, -0.000760301947593689, -0.0007148683071136475, -0.000669434666633606, -0.0006240010261535645, -0.000578567385673523, -0.0005331337451934814, -0.00048770010471343994, -0.00044226646423339844, -0.00039683282375335693, -0.00035139918327331543, -0.0003059655427932739, -0.0002605319023132324, -0.00021509826183319092, -0.00016966462135314941, -0.0001242309808731079, -7.87973403930664e-05, -3.33636999130249e-05, 1.2069940567016602e-05, 5.7503581047058105e-05, 0.00010293722152709961, 0.0001483708620071411, 0.00019380450248718262, 0.00023923814296722412, 0.0002846717834472656, 0.00033010542392730713, 0.00037553906440734863, 0.00042097270488739014, 0.00046640634536743164, 0.0005118399858474731, 0.0005572736263275146, 0.0006027072668075562, 0.0006481409072875977, 0.0006935745477676392, 0.0007390081882476807, 0.0007844418287277222, 0.0008298754692077637, 0.0008753091096878052, 0.0009207427501678467, 0.0009661763906478882, 0.0010116100311279297, 0.0010570436716079712, 0.0011024773120880127, 0.0011479109525680542, 0.0011933445930480957, 0.0012387782335281372, 0.0012842118740081787, 0.0013296455144882202, 0.0013750791549682617, 0.0014205127954483032, 0.0014659464359283447, 0.0015113800764083862, 0.0015568137168884277, 0.0016022473573684692, 0.0016476809978485107, 0.0016931146383285522, 0.0017385482788085938]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 9.0, 22.0, 23.0, 56.0, 75.0, 130.0, 233.0, 394.0, 785.0, 1611.0, 4027.0, 11533.0, 38178.0, 152849.0, 617076.0, 162222.0, 39590.0, 12161.0, 4119.0, 1750.0, 772.0, 359.0, 217.0, 132.0, 70.0, 53.0, 28.0, 20.0, 17.0, 10.0, 8.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.39300537109375, -6.1688232421875, -5.94464111328125, -5.720458984375, -5.49627685546875, -5.2720947265625, -5.04791259765625, -4.82373046875, -4.59954833984375, -4.3753662109375, -4.15118408203125, -3.927001953125, -3.70281982421875, -3.4786376953125, -3.25445556640625, -3.0302734375, -2.80609130859375, -2.5819091796875, -2.35772705078125, -2.133544921875, -1.90936279296875, -1.6851806640625, -1.46099853515625, -1.23681640625, -1.01263427734375, -0.7884521484375, -0.56427001953125, -0.340087890625, -0.11590576171875, 0.1082763671875, 0.33245849609375, 0.556640625, 0.78082275390625, 1.0050048828125, 1.22918701171875, 1.453369140625, 1.67755126953125, 1.9017333984375, 2.12591552734375, 2.35009765625, 2.57427978515625, 2.7984619140625, 3.02264404296875, 3.246826171875, 3.47100830078125, 3.6951904296875, 3.91937255859375, 4.1435546875, 4.36773681640625, 4.5919189453125, 4.81610107421875, 5.040283203125, 5.26446533203125, 5.4886474609375, 5.71282958984375, 5.93701171875, 6.16119384765625, 6.3853759765625, 6.60955810546875, 6.833740234375, 7.05792236328125, 7.2821044921875, 7.50628662109375, 7.73046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 6.0, 7.0, 10.0, 12.0, 20.0, 18.0, 35.0, 38.0, 59.0, 90.0, 122.0, 139.0, 118.0, 96.0, 50.0, 40.0, 32.0, 27.0, 26.0, 10.0, 14.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9053955078125, -4.713134765625, -4.5208740234375, -4.32861328125, -4.1363525390625, -3.944091796875, -3.7518310546875, -3.5595703125, -3.3673095703125, -3.175048828125, -2.9827880859375, -2.79052734375, -2.5982666015625, -2.406005859375, -2.2137451171875, -2.021484375, -1.8292236328125, -1.636962890625, -1.4447021484375, -1.25244140625, -1.0601806640625, -0.867919921875, -0.6756591796875, -0.4833984375, -0.2911376953125, -0.098876953125, 0.0933837890625, 0.28564453125, 0.4779052734375, 0.670166015625, 0.8624267578125, 1.0546875, 1.2469482421875, 1.439208984375, 1.6314697265625, 1.82373046875, 2.0159912109375, 2.208251953125, 2.4005126953125, 2.5927734375, 2.7850341796875, 2.977294921875, 3.1695556640625, 3.36181640625, 3.5540771484375, 3.746337890625, 3.9385986328125, 4.130859375, 4.3231201171875, 4.515380859375, 4.7076416015625, 4.89990234375, 5.0921630859375, 5.284423828125, 5.4766845703125, 5.6689453125, 5.8612060546875, 6.053466796875, 6.2457275390625, 6.43798828125, 6.6302490234375, 6.822509765625, 7.0147705078125, 7.20703125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 3.0, 6.0, 8.0, 13.0, 19.0, 30.0, 31.0, 42.0, 58.0, 60.0, 56.0, 95.0, 75.0, 88.0, 90.0, 83.0, 47.0, 53.0, 40.0, 28.0, 24.0, 18.0, 10.0, 9.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.55586242675781, -73.69187927246094, -71.82788848876953, -69.96390533447266, -68.09991455078125, -66.23593139648438, -64.3719482421875, -62.507957458496094, -60.64397430419922, -58.77998733520508, -56.91600036621094, -55.05201721191406, -53.18803024291992, -51.32404327392578, -49.46005630493164, -47.5960693359375, -45.73208236694336, -43.86809539794922, -42.00410842895508, -40.14012145996094, -38.27613830566406, -36.41215133666992, -34.54816436767578, -32.68417739868164, -30.820192337036133, -28.956205368041992, -27.092220306396484, -25.228233337402344, -23.364246368408203, -21.500261306762695, -19.636274337768555, -17.772289276123047, -15.90829849243164, -14.044312477111816, -12.180326461791992, -10.316339492797852, -8.452353477478027, -6.588367462158203, -4.7243804931640625, -2.8603944778442383, -0.9964084625244141, 0.8675777912139893, 2.7315640449523926, 4.595550537109375, 6.459536552429199, 8.323522567749023, 10.187509536743164, 12.051495552062988, 13.915481567382812, 15.779467582702637, 17.64345359802246, 19.5074405670166, 21.37142562866211, 23.23541259765625, 25.09939956665039, 26.96338653564453, 28.82737159729004, 30.69135856628418, 32.55534362792969, 34.41933059692383, 36.28331756591797, 38.147300720214844, 40.01129150390625, 41.875274658203125, 43.739261627197266]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 9.0, 6.0, 6.0, 13.0, 14.0, 6.0, 23.0, 21.0, 26.0, 13.0, 28.0, 37.0, 25.0, 39.0, 28.0, 38.0, 36.0, 46.0, 27.0, 32.0, 32.0, 38.0, 36.0, 35.0, 40.0, 43.0, 37.0, 30.0, 35.0, 18.0, 24.0, 20.0, 19.0, 18.0, 20.0, 14.0, 13.0, 8.0, 11.0, 5.0, 3.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-40.06098937988281, -38.774513244628906, -37.488037109375, -36.201560974121094, -34.91508483886719, -33.62860870361328, -32.342132568359375, -31.0556583404541, -29.769182205200195, -28.48270606994629, -27.196229934692383, -25.909753799438477, -24.623279571533203, -23.336803436279297, -22.05032730102539, -20.763851165771484, -19.477375030517578, -18.190898895263672, -16.904422760009766, -15.617947578430176, -14.33147144317627, -13.044995307922363, -11.758520126342773, -10.472043991088867, -9.185567855834961, -7.899091720581055, -6.612616062164307, -5.326140403747559, -4.039664268493652, -2.753188133239746, -1.466712474822998, -0.18023681640625, 1.1062393188476562, 2.3927152156829834, 3.6791911125183105, 4.965666770935059, 6.252142906188965, 7.538619041442871, 8.825094223022461, 10.111570358276367, 11.398046493530273, 12.68452262878418, 13.970998764038086, 15.257473945617676, 16.543949127197266, 17.830425262451172, 19.116901397705078, 20.403377532958984, 21.68985366821289, 22.976329803466797, 24.262805938720703, 25.54928207397461, 26.835758209228516, 28.122234344482422, 29.408708572387695, 30.6951847076416, 31.981660842895508, 33.26813507080078, 34.55461120605469, 35.841087341308594, 37.1275634765625, 38.414039611816406, 39.70051574707031, 40.98699188232422, 42.273468017578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 19.0, 25.0, 34.0, 48.0, 85.0, 159.0, 280.0, 575.0, 1404.0, 4282.0, 18365.0, 163416.0, 3877149.0, 108302.0, 14212.0, 3529.0, 1183.0, 473.0, 233.0, 162.0, 90.0, 66.0, 41.0, 29.0, 24.0, 16.0, 9.0, 13.0, 11.0, 6.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.5, -47.81787109375, -46.1357421875, -44.45361328125, -42.771484375, -41.08935546875, -39.4072265625, -37.72509765625, -36.04296875, -34.36083984375, -32.6787109375, -30.99658203125, -29.314453125, -27.63232421875, -25.9501953125, -24.26806640625, -22.5859375, -20.90380859375, -19.2216796875, -17.53955078125, -15.857421875, -14.17529296875, -12.4931640625, -10.81103515625, -9.12890625, -7.44677734375, -5.7646484375, -4.08251953125, -2.400390625, -0.71826171875, 0.9638671875, 2.64599609375, 4.328125, 6.01025390625, 7.6923828125, 9.37451171875, 11.056640625, 12.73876953125, 14.4208984375, 16.10302734375, 17.78515625, 19.46728515625, 21.1494140625, 22.83154296875, 24.513671875, 26.19580078125, 27.8779296875, 29.56005859375, 31.2421875, 32.92431640625, 34.6064453125, 36.28857421875, 37.970703125, 39.65283203125, 41.3349609375, 43.01708984375, 44.69921875, 46.38134765625, 48.0634765625, 49.74560546875, 51.427734375, 53.10986328125, 54.7919921875, 56.47412109375, 58.15625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 16.0, 26.0, 26.0, 37.0, 64.0, 75.0, 101.0, 94.0, 103.0, 101.0, 80.0, 72.0, 68.0, 52.0, 28.0, 13.0, 14.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.544921875, -3.379730224609375, -3.21453857421875, -3.049346923828125, -2.8841552734375, -2.718963623046875, -2.55377197265625, -2.388580322265625, -2.223388671875, -2.058197021484375, -1.89300537109375, -1.727813720703125, -1.5626220703125, -1.397430419921875, -1.23223876953125, -1.067047119140625, -0.90185546875, -0.736663818359375, -0.57147216796875, -0.406280517578125, -0.2410888671875, -0.075897216796875, 0.08929443359375, 0.254486083984375, 0.419677734375, 0.584869384765625, 0.75006103515625, 0.915252685546875, 1.0804443359375, 1.245635986328125, 1.41082763671875, 1.576019287109375, 1.7412109375, 1.906402587890625, 2.07159423828125, 2.236785888671875, 2.4019775390625, 2.567169189453125, 2.73236083984375, 2.897552490234375, 3.062744140625, 3.227935791015625, 3.39312744140625, 3.558319091796875, 3.7235107421875, 3.888702392578125, 4.05389404296875, 4.219085693359375, 4.38427734375, 4.549468994140625, 4.71466064453125, 4.879852294921875, 5.0450439453125, 5.210235595703125, 5.37542724609375, 5.540618896484375, 5.705810546875, 5.871002197265625, 6.03619384765625, 6.201385498046875, 6.3665771484375, 6.531768798828125, 6.69696044921875, 6.862152099609375, 7.02734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 11.0, 9.0, 12.0, 23.0, 35.0, 53.0, 73.0, 115.0, 161.0, 230.0, 302.0, 517.0, 739.0, 1130.0, 1781.0, 2714.0, 4397.0, 7429.0, 12962.0, 23705.0, 45350.0, 95566.0, 244408.0, 2143720.0, 1204827.0, 219820.0, 88275.0, 42509.0, 22425.0, 12329.0, 7050.0, 4198.0, 2611.0, 1676.0, 1066.0, 644.0, 427.0, 295.0, 202.0, 132.0, 102.0, 63.0, 56.0, 35.0, 26.0, 17.0, 10.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-10.71875, -10.3724365234375, -10.026123046875, -9.6798095703125, -9.33349609375, -8.9871826171875, -8.640869140625, -8.2945556640625, -7.9482421875, -7.6019287109375, -7.255615234375, -6.9093017578125, -6.56298828125, -6.2166748046875, -5.870361328125, -5.5240478515625, -5.177734375, -4.8314208984375, -4.485107421875, -4.1387939453125, -3.79248046875, -3.4461669921875, -3.099853515625, -2.7535400390625, -2.4072265625, -2.0609130859375, -1.714599609375, -1.3682861328125, -1.02197265625, -0.6756591796875, -0.329345703125, 0.0169677734375, 0.36328125, 0.7095947265625, 1.055908203125, 1.4022216796875, 1.74853515625, 2.0948486328125, 2.441162109375, 2.7874755859375, 3.1337890625, 3.4801025390625, 3.826416015625, 4.1727294921875, 4.51904296875, 4.8653564453125, 5.211669921875, 5.5579833984375, 5.904296875, 6.2506103515625, 6.596923828125, 6.9432373046875, 7.28955078125, 7.6358642578125, 7.982177734375, 8.3284912109375, 8.6748046875, 9.0211181640625, 9.367431640625, 9.7137451171875, 10.06005859375, 10.4063720703125, 10.752685546875, 11.0989990234375, 11.4453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 7.0, 13.0, 24.0, 33.0, 60.0, 70.0, 103.0, 133.0, 221.0, 497.0, 1690.0, 475.0, 240.0, 139.0, 91.0, 55.0, 48.0, 30.0, 21.0, 17.0, 22.0, 11.0, 10.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.14990234375, -6.9365234375, -6.72314453125, -6.509765625, -6.29638671875, -6.0830078125, -5.86962890625, -5.65625, -5.44287109375, -5.2294921875, -5.01611328125, -4.802734375, -4.58935546875, -4.3759765625, -4.16259765625, -3.94921875, -3.73583984375, -3.5224609375, -3.30908203125, -3.095703125, -2.88232421875, -2.6689453125, -2.45556640625, -2.2421875, -2.02880859375, -1.8154296875, -1.60205078125, -1.388671875, -1.17529296875, -0.9619140625, -0.74853515625, -0.53515625, -0.32177734375, -0.1083984375, 0.10498046875, 0.318359375, 0.53173828125, 0.7451171875, 0.95849609375, 1.171875, 1.38525390625, 1.5986328125, 1.81201171875, 2.025390625, 2.23876953125, 2.4521484375, 2.66552734375, 2.87890625, 3.09228515625, 3.3056640625, 3.51904296875, 3.732421875, 3.94580078125, 4.1591796875, 4.37255859375, 4.5859375, 4.79931640625, 5.0126953125, 5.22607421875, 5.439453125, 5.65283203125, 5.8662109375, 6.07958984375, 6.29296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 15.0, 24.0, 47.0, 63.0, 89.0, 144.0, 124.0, 128.0, 114.0, 79.0, 63.0, 50.0, 24.0, 14.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.917701721191406, -60.19791793823242, -58.47813415527344, -56.75835418701172, -55.038570404052734, -53.31878662109375, -51.599002838134766, -49.87921905517578, -48.15943908691406, -46.43965530395508, -44.719871520996094, -43.000091552734375, -41.28030776977539, -39.560523986816406, -37.84074020385742, -36.12095642089844, -34.40117263793945, -32.68138885498047, -30.961606979370117, -29.241823196411133, -27.52204132080078, -25.802257537841797, -24.082473754882812, -22.362689971923828, -20.642908096313477, -18.923124313354492, -17.20334243774414, -15.483558654785156, -13.763775825500488, -12.04399299621582, -10.324209213256836, -8.604426383972168, -6.8846435546875, -5.164860725402832, -3.445077419281006, -1.7252941131591797, -0.005511283874511719, 1.7142715454101562, 3.4340553283691406, 5.153838157653809, 6.873620986938477, 8.593403816223145, 10.313186645507812, 12.032970428466797, 13.752753257751465, 15.472536087036133, 17.192319869995117, 18.91210174560547, 20.631885528564453, 22.351669311523438, 24.07145118713379, 25.791234970092773, 27.511016845703125, 29.23080062866211, 30.950584411621094, 32.67036819458008, 34.39015197753906, 36.10993576049805, 37.82971954345703, 39.54949951171875, 41.269283294677734, 42.98906707763672, 44.7088508605957, 46.42863464355469, 48.148414611816406]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 4.0, 9.0, 13.0, 12.0, 16.0, 13.0, 10.0, 26.0, 14.0, 46.0, 32.0, 34.0, 35.0, 29.0, 41.0, 52.0, 38.0, 45.0, 38.0, 51.0, 47.0, 39.0, 34.0, 31.0, 38.0, 25.0, 18.0, 26.0, 22.0, 12.0, 23.0, 23.0, 14.0, 12.0, 12.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.265933990478516, -19.642507553100586, -19.019081115722656, -18.39565658569336, -17.77223014831543, -17.1488037109375, -16.52537727355957, -15.90195083618164, -15.278525352478027, -14.655098915100098, -14.031673431396484, -13.408246994018555, -12.784820556640625, -12.161395072937012, -11.537968635559082, -10.914543151855469, -10.291116714477539, -9.66769027709961, -9.044264793395996, -8.420838356018066, -7.797412395477295, -7.173986434936523, -6.550559997558594, -5.927134037017822, -5.303708076477051, -4.680282115936279, -4.056856155395508, -3.433429718017578, -2.8100037574768066, -2.186577796936035, -1.5631515979766846, -0.939725399017334, -0.3162994384765625, 0.30712664127349854, 0.9305527210235596, 1.5539788007736206, 2.1774048805236816, 2.800830841064453, 3.4242570400238037, 4.047683238983154, 4.671109199523926, 5.294535160064697, 5.917961120605469, 6.541387557983398, 7.16481351852417, 7.788239479064941, 8.411665916442871, 9.035091400146484, 9.658517837524414, 10.281944274902344, 10.905369758605957, 11.528796195983887, 12.1522216796875, 12.77564811706543, 13.39907455444336, 14.022500991821289, 14.645926475524902, 15.269352912902832, 15.892778396606445, 16.516204833984375, 17.139631271362305, 17.763057708740234, 18.38648223876953, 19.00990867614746, 19.63333511352539]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 7.0, 6.0, 5.0, 17.0, 25.0, 42.0, 58.0, 119.0, 195.0, 357.0, 800.0, 2062.0, 8520.0, 57400.0, 445965.0, 460972.0, 59515.0, 8687.0, 2108.0, 802.0, 373.0, 189.0, 122.0, 75.0, 44.0, 23.0, 22.0, 17.0, 8.0, 6.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.21875, -44.142333984375, -43.06591796875, -41.989501953125, -40.9130859375, -39.836669921875, -38.76025390625, -37.683837890625, -36.607421875, -35.531005859375, -34.45458984375, -33.378173828125, -32.3017578125, -31.225341796875, -30.14892578125, -29.072509765625, -27.99609375, -26.919677734375, -25.84326171875, -24.766845703125, -23.6904296875, -22.614013671875, -21.53759765625, -20.461181640625, -19.384765625, -18.308349609375, -17.23193359375, -16.155517578125, -15.0791015625, -14.002685546875, -12.92626953125, -11.849853515625, -10.7734375, -9.697021484375, -8.62060546875, -7.544189453125, -6.4677734375, -5.391357421875, -4.31494140625, -3.238525390625, -2.162109375, -1.085693359375, -0.00927734375, 1.067138671875, 2.1435546875, 3.219970703125, 4.29638671875, 5.372802734375, 6.44921875, 7.525634765625, 8.60205078125, 9.678466796875, 10.7548828125, 11.831298828125, 12.90771484375, 13.984130859375, 15.060546875, 16.136962890625, 17.21337890625, 18.289794921875, 19.3662109375, 20.442626953125, 21.51904296875, 22.595458984375, 23.671875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 10.0, 15.0, 21.0, 26.0, 42.0, 51.0, 72.0, 82.0, 90.0, 94.0, 93.0, 92.0, 73.0, 62.0, 48.0, 39.0, 33.0, 20.0, 10.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.510162353515625, -3.34259033203125, -3.175018310546875, -3.0074462890625, -2.839874267578125, -2.67230224609375, -2.504730224609375, -2.337158203125, -2.169586181640625, -2.00201416015625, -1.834442138671875, -1.6668701171875, -1.499298095703125, -1.33172607421875, -1.164154052734375, -0.99658203125, -0.829010009765625, -0.66143798828125, -0.493865966796875, -0.3262939453125, -0.158721923828125, 0.00885009765625, 0.176422119140625, 0.343994140625, 0.511566162109375, 0.67913818359375, 0.846710205078125, 1.0142822265625, 1.181854248046875, 1.34942626953125, 1.516998291015625, 1.6845703125, 1.852142333984375, 2.01971435546875, 2.187286376953125, 2.3548583984375, 2.522430419921875, 2.69000244140625, 2.857574462890625, 3.025146484375, 3.192718505859375, 3.36029052734375, 3.527862548828125, 3.6954345703125, 3.863006591796875, 4.03057861328125, 4.198150634765625, 4.36572265625, 4.533294677734375, 4.70086669921875, 4.868438720703125, 5.0360107421875, 5.203582763671875, 5.37115478515625, 5.538726806640625, 5.706298828125, 5.873870849609375, 6.04144287109375, 6.209014892578125, 6.3765869140625, 6.544158935546875, 6.71173095703125, 6.879302978515625, 7.046875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 11.0, 12.0, 12.0, 15.0, 19.0, 36.0, 34.0, 47.0, 73.0, 95.0, 111.0, 158.0, 179.0, 240.0, 325.0, 526.0, 911.0, 2027.0, 4997.0, 14657.0, 46029.0, 147491.0, 472937.0, 247112.0, 73207.0, 23250.0, 7683.0, 2733.0, 1334.0, 675.0, 436.0, 289.0, 203.0, 139.0, 135.0, 119.0, 79.0, 48.0, 36.0, 40.0, 20.0, 18.0, 19.0, 11.0, 8.0, 7.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.8203125, -13.3843994140625, -12.948486328125, -12.5125732421875, -12.07666015625, -11.6407470703125, -11.204833984375, -10.7689208984375, -10.3330078125, -9.8970947265625, -9.461181640625, -9.0252685546875, -8.58935546875, -8.1534423828125, -7.717529296875, -7.2816162109375, -6.845703125, -6.4097900390625, -5.973876953125, -5.5379638671875, -5.10205078125, -4.6661376953125, -4.230224609375, -3.7943115234375, -3.3583984375, -2.9224853515625, -2.486572265625, -2.0506591796875, -1.61474609375, -1.1788330078125, -0.742919921875, -0.3070068359375, 0.12890625, 0.5648193359375, 1.000732421875, 1.4366455078125, 1.87255859375, 2.3084716796875, 2.744384765625, 3.1802978515625, 3.6162109375, 4.0521240234375, 4.488037109375, 4.9239501953125, 5.35986328125, 5.7957763671875, 6.231689453125, 6.6676025390625, 7.103515625, 7.5394287109375, 7.975341796875, 8.4112548828125, 8.84716796875, 9.2830810546875, 9.718994140625, 10.1549072265625, 10.5908203125, 11.0267333984375, 11.462646484375, 11.8985595703125, 12.33447265625, 12.7703857421875, 13.206298828125, 13.6422119140625, 14.078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 4.0, 6.0, 6.0, 8.0, 9.0, 22.0, 16.0, 19.0, 28.0, 31.0, 35.0, 39.0, 38.0, 45.0, 42.0, 39.0, 56.0, 35.0, 47.0, 41.0, 44.0, 39.0, 41.0, 39.0, 37.0, 24.0, 25.0, 18.0, 30.0, 21.0, 16.0, 16.0, 15.0, 14.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.2867431640625, -9.948486328125, -9.6102294921875, -9.27197265625, -8.9337158203125, -8.595458984375, -8.2572021484375, -7.9189453125, -7.5806884765625, -7.242431640625, -6.9041748046875, -6.56591796875, -6.2276611328125, -5.889404296875, -5.5511474609375, -5.212890625, -4.8746337890625, -4.536376953125, -4.1981201171875, -3.85986328125, -3.5216064453125, -3.183349609375, -2.8450927734375, -2.5068359375, -2.1685791015625, -1.830322265625, -1.4920654296875, -1.15380859375, -0.8155517578125, -0.477294921875, -0.1390380859375, 0.19921875, 0.5374755859375, 0.875732421875, 1.2139892578125, 1.55224609375, 1.8905029296875, 2.228759765625, 2.5670166015625, 2.9052734375, 3.2435302734375, 3.581787109375, 3.9200439453125, 4.25830078125, 4.5965576171875, 4.934814453125, 5.2730712890625, 5.611328125, 5.9495849609375, 6.287841796875, 6.6260986328125, 6.96435546875, 7.3026123046875, 7.640869140625, 7.9791259765625, 8.3173828125, 8.6556396484375, 8.993896484375, 9.3321533203125, 9.67041015625, 10.0086669921875, 10.346923828125, 10.6851806640625, 11.0234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 12.0, 7.0, 9.0, 11.0, 31.0, 48.0, 70.0, 129.0, 229.0, 400.0, 834.0, 1822.0, 4290.0, 11481.0, 33740.0, 111732.0, 450250.0, 311371.0, 81622.0, 25122.0, 8852.0, 3396.0, 1532.0, 731.0, 371.0, 177.0, 98.0, 77.0, 39.0, 35.0, 17.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.3798828125, -9.150390625, -8.9208984375, -8.69140625, -8.4619140625, -8.232421875, -8.0029296875, -7.7734375, -7.5439453125, -7.314453125, -7.0849609375, -6.85546875, -6.6259765625, -6.396484375, -6.1669921875, -5.9375, -5.7080078125, -5.478515625, -5.2490234375, -5.01953125, -4.7900390625, -4.560546875, -4.3310546875, -4.1015625, -3.8720703125, -3.642578125, -3.4130859375, -3.18359375, -2.9541015625, -2.724609375, -2.4951171875, -2.265625, -2.0361328125, -1.806640625, -1.5771484375, -1.34765625, -1.1181640625, -0.888671875, -0.6591796875, -0.4296875, -0.2001953125, 0.029296875, 0.2587890625, 0.48828125, 0.7177734375, 0.947265625, 1.1767578125, 1.40625, 1.6357421875, 1.865234375, 2.0947265625, 2.32421875, 2.5537109375, 2.783203125, 3.0126953125, 3.2421875, 3.4716796875, 3.701171875, 3.9306640625, 4.16015625, 4.3896484375, 4.619140625, 4.8486328125, 5.078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 7.0, 9.0, 25.0, 33.0, 52.0, 59.0, 100.0, 303.0, 162.0, 75.0, 59.0, 47.0, 20.0, 16.0, 16.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002582550048828125, -0.0025057196617126465, -0.002428889274597168, -0.0023520588874816895, -0.002275228500366211, -0.0021983981132507324, -0.002121567726135254, -0.0020447373390197754, -0.001967906951904297, -0.0018910765647888184, -0.0018142461776733398, -0.0017374157905578613, -0.0016605854034423828, -0.0015837550163269043, -0.0015069246292114258, -0.0014300942420959473, -0.0013532638549804688, -0.0012764334678649902, -0.0011996030807495117, -0.0011227726936340332, -0.0010459423065185547, -0.0009691119194030762, -0.0008922815322875977, -0.0008154511451721191, -0.0007386207580566406, -0.0006617903709411621, -0.0005849599838256836, -0.0005081295967102051, -0.00043129920959472656, -0.00035446882247924805, -0.00027763843536376953, -0.00020080804824829102, -0.0001239776611328125, -4.7147274017333984e-05, 2.968311309814453e-05, 0.00010651350021362305, 0.00018334388732910156, 0.0002601742744445801, 0.0003370046615600586, 0.0004138350486755371, 0.0004906654357910156, 0.0005674958229064941, 0.0006443262100219727, 0.0007211565971374512, 0.0007979869842529297, 0.0008748173713684082, 0.0009516477584838867, 0.0010284781455993652, 0.0011053085327148438, 0.0011821389198303223, 0.0012589693069458008, 0.0013357996940612793, 0.0014126300811767578, 0.0014894604682922363, 0.0015662908554077148, 0.0016431212425231934, 0.0017199516296386719, 0.0017967820167541504, 0.001873612403869629, 0.0019504427909851074, 0.002027273178100586, 0.0021041035652160645, 0.002180933952331543, 0.0022577643394470215, 0.0023345947265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 8.0, 8.0, 11.0, 23.0, 26.0, 33.0, 46.0, 70.0, 120.0, 220.0, 422.0, 833.0, 1995.0, 6026.0, 21965.0, 118002.0, 623556.0, 224908.0, 36421.0, 8762.0, 2776.0, 1093.0, 528.0, 278.0, 156.0, 98.0, 57.0, 34.0, 26.0, 18.0, 9.0, 8.0, 3.0, 2.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.859375, -12.5179443359375, -12.176513671875, -11.8350830078125, -11.49365234375, -11.1522216796875, -10.810791015625, -10.4693603515625, -10.1279296875, -9.7864990234375, -9.445068359375, -9.1036376953125, -8.76220703125, -8.4207763671875, -8.079345703125, -7.7379150390625, -7.396484375, -7.0550537109375, -6.713623046875, -6.3721923828125, -6.03076171875, -5.6893310546875, -5.347900390625, -5.0064697265625, -4.6650390625, -4.3236083984375, -3.982177734375, -3.6407470703125, -3.29931640625, -2.9578857421875, -2.616455078125, -2.2750244140625, -1.93359375, -1.5921630859375, -1.250732421875, -0.9093017578125, -0.56787109375, -0.2264404296875, 0.114990234375, 0.4564208984375, 0.7978515625, 1.1392822265625, 1.480712890625, 1.8221435546875, 2.16357421875, 2.5050048828125, 2.846435546875, 3.1878662109375, 3.529296875, 3.8707275390625, 4.212158203125, 4.5535888671875, 4.89501953125, 5.2364501953125, 5.577880859375, 5.9193115234375, 6.2607421875, 6.6021728515625, 6.943603515625, 7.2850341796875, 7.62646484375, 7.9678955078125, 8.309326171875, 8.6507568359375, 8.9921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 12.0, 15.0, 11.0, 21.0, 24.0, 27.0, 45.0, 48.0, 74.0, 96.0, 118.0, 108.0, 91.0, 67.0, 46.0, 35.0, 44.0, 28.0, 17.0, 13.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.79248046875, -6.5654296875, -6.33837890625, -6.111328125, -5.88427734375, -5.6572265625, -5.43017578125, -5.203125, -4.97607421875, -4.7490234375, -4.52197265625, -4.294921875, -4.06787109375, -3.8408203125, -3.61376953125, -3.38671875, -3.15966796875, -2.9326171875, -2.70556640625, -2.478515625, -2.25146484375, -2.0244140625, -1.79736328125, -1.5703125, -1.34326171875, -1.1162109375, -0.88916015625, -0.662109375, -0.43505859375, -0.2080078125, 0.01904296875, 0.24609375, 0.47314453125, 0.7001953125, 0.92724609375, 1.154296875, 1.38134765625, 1.6083984375, 1.83544921875, 2.0625, 2.28955078125, 2.5166015625, 2.74365234375, 2.970703125, 3.19775390625, 3.4248046875, 3.65185546875, 3.87890625, 4.10595703125, 4.3330078125, 4.56005859375, 4.787109375, 5.01416015625, 5.2412109375, 5.46826171875, 5.6953125, 5.92236328125, 6.1494140625, 6.37646484375, 6.603515625, 6.83056640625, 7.0576171875, 7.28466796875, 7.51171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 22.0, 60.0, 195.0, 274.0, 272.0, 123.0, 37.0, 15.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.87677001953125, -114.7883071899414, -105.69984436035156, -96.61138916015625, -87.5229263305664, -78.43446350097656, -69.34600830078125, -60.257545471191406, -51.16908264160156, -42.08061981201172, -32.99216079711914, -23.90369987487793, -14.815238952636719, -5.726776123046875, 3.361682891845703, 12.450141906738281, 21.538604736328125, 30.627065658569336, 39.71552658081055, 48.803985595703125, 57.89244842529297, 66.98091125488281, 76.06936645507812, 85.15782928466797, 94.24629211425781, 103.33475494384766, 112.4232177734375, 121.51167297363281, 130.60012817382812, 139.6885986328125, 148.7770538330078, 157.86550903320312, 166.95394897460938, 176.0424041748047, 185.13087463378906, 194.21932983398438, 203.30780029296875, 212.39625549316406, 221.48471069335938, 230.57318115234375, 239.66163635253906, 248.75009155273438, 257.83856201171875, 266.9270324707031, 276.0154724121094, 285.10394287109375, 294.1924133300781, 303.2808532714844, 312.36932373046875, 321.4577941894531, 330.5462341308594, 339.63470458984375, 348.7231750488281, 357.8116455078125, 366.90008544921875, 375.9885559082031, 385.0770263671875, 394.1654968261719, 403.2539367675781, 412.3424072265625, 421.4308776855469, 430.51934814453125, 439.6077880859375, 448.6962585449219, 457.7846984863281]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 12.0, 9.0, 12.0, 14.0, 20.0, 21.0, 21.0, 22.0, 27.0, 34.0, 29.0, 46.0, 31.0, 26.0, 42.0, 51.0, 53.0, 48.0, 35.0, 44.0, 53.0, 47.0, 27.0, 34.0, 31.0, 24.0, 14.0, 20.0, 27.0, 20.0, 19.0, 16.0, 14.0, 10.0, 8.0, 1.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-59.82958984375, -58.04922103881836, -56.268856048583984, -54.488487243652344, -52.7081184387207, -50.92774963378906, -49.14738464355469, -47.36701583862305, -45.586647033691406, -43.806278228759766, -42.02591323852539, -40.24554443359375, -38.46517562866211, -36.68480682373047, -34.904441833496094, -33.12407302856445, -31.343708038330078, -29.56334114074707, -27.78297233581543, -26.002605438232422, -24.22223663330078, -22.441869735717773, -20.661502838134766, -18.881134033203125, -17.100767135620117, -15.320399284362793, -13.540031433105469, -11.759664535522461, -9.979296684265137, -8.198928833007812, -6.418561935424805, -4.6381940841674805, -2.8578262329101562, -1.0774586200714111, 0.702908992767334, 2.4832763671875, 4.263644218444824, 6.044012069702148, 7.824378967285156, 9.60474681854248, 11.385114669799805, 13.165482521057129, 14.945850372314453, 16.72621726989746, 18.50658416748047, 20.28695297241211, 22.067319869995117, 23.847686767578125, 25.628055572509766, 27.408422470092773, 29.188791275024414, 30.969158172607422, 32.74952697753906, 34.52989196777344, 36.31026077270508, 38.09062957763672, 39.870994567871094, 41.651363372802734, 43.43172836303711, 45.21209716796875, 46.99246597290039, 48.77283477783203, 50.553199768066406, 52.33356857299805, 54.11393737792969]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 8.0, 6.0, 18.0, 17.0, 32.0, 38.0, 60.0, 119.0, 196.0, 330.0, 572.0, 1057.0, 2466.0, 6733.0, 25503.0, 164980.0, 3620998.0, 317776.0, 38054.0, 9079.0, 3056.0, 1378.0, 652.0, 373.0, 267.0, 138.0, 106.0, 69.0, 51.0, 33.0, 15.0, 28.0, 15.0, 11.0, 12.0, 7.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.59375, -28.56005859375, -27.5263671875, -26.49267578125, -25.458984375, -24.42529296875, -23.3916015625, -22.35791015625, -21.32421875, -20.29052734375, -19.2568359375, -18.22314453125, -17.189453125, -16.15576171875, -15.1220703125, -14.08837890625, -13.0546875, -12.02099609375, -10.9873046875, -9.95361328125, -8.919921875, -7.88623046875, -6.8525390625, -5.81884765625, -4.78515625, -3.75146484375, -2.7177734375, -1.68408203125, -0.650390625, 0.38330078125, 1.4169921875, 2.45068359375, 3.484375, 4.51806640625, 5.5517578125, 6.58544921875, 7.619140625, 8.65283203125, 9.6865234375, 10.72021484375, 11.75390625, 12.78759765625, 13.8212890625, 14.85498046875, 15.888671875, 16.92236328125, 17.9560546875, 18.98974609375, 20.0234375, 21.05712890625, 22.0908203125, 23.12451171875, 24.158203125, 25.19189453125, 26.2255859375, 27.25927734375, 28.29296875, 29.32666015625, 30.3603515625, 31.39404296875, 32.427734375, 33.46142578125, 34.4951171875, 35.52880859375, 36.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 4.0, 10.0, 22.0, 21.0, 37.0, 56.0, 62.0, 77.0, 86.0, 95.0, 92.0, 91.0, 97.0, 64.0, 54.0, 40.0, 27.0, 19.0, 19.0, 12.0, 7.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74609375, -3.57818603515625, -3.4102783203125, -3.24237060546875, -3.074462890625, -2.90655517578125, -2.7386474609375, -2.57073974609375, -2.40283203125, -2.23492431640625, -2.0670166015625, -1.89910888671875, -1.731201171875, -1.56329345703125, -1.3953857421875, -1.22747802734375, -1.0595703125, -0.89166259765625, -0.7237548828125, -0.55584716796875, -0.387939453125, -0.22003173828125, -0.0521240234375, 0.11578369140625, 0.28369140625, 0.45159912109375, 0.6195068359375, 0.78741455078125, 0.955322265625, 1.12322998046875, 1.2911376953125, 1.45904541015625, 1.626953125, 1.79486083984375, 1.9627685546875, 2.13067626953125, 2.298583984375, 2.46649169921875, 2.6343994140625, 2.80230712890625, 2.97021484375, 3.13812255859375, 3.3060302734375, 3.47393798828125, 3.641845703125, 3.80975341796875, 3.9776611328125, 4.14556884765625, 4.3134765625, 4.48138427734375, 4.6492919921875, 4.81719970703125, 4.985107421875, 5.15301513671875, 5.3209228515625, 5.48883056640625, 5.65673828125, 5.82464599609375, 5.9925537109375, 6.16046142578125, 6.328369140625, 6.49627685546875, 6.6641845703125, 6.83209228515625, 7.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 4.0, 5.0, 13.0, 23.0, 31.0, 38.0, 45.0, 58.0, 76.0, 104.0, 168.0, 193.0, 299.0, 457.0, 842.0, 1828.0, 4117.0, 11583.0, 38098.0, 160341.0, 1364056.0, 2359362.0, 186924.0, 43808.0, 12901.0, 4559.0, 1838.0, 918.0, 475.0, 313.0, 219.0, 147.0, 126.0, 75.0, 63.0, 50.0, 37.0, 26.0, 8.0, 13.0, 12.0, 12.0, 6.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.6220703125, -18.041015625, -17.4599609375, -16.87890625, -16.2978515625, -15.716796875, -15.1357421875, -14.5546875, -13.9736328125, -13.392578125, -12.8115234375, -12.23046875, -11.6494140625, -11.068359375, -10.4873046875, -9.90625, -9.3251953125, -8.744140625, -8.1630859375, -7.58203125, -7.0009765625, -6.419921875, -5.8388671875, -5.2578125, -4.6767578125, -4.095703125, -3.5146484375, -2.93359375, -2.3525390625, -1.771484375, -1.1904296875, -0.609375, -0.0283203125, 0.552734375, 1.1337890625, 1.71484375, 2.2958984375, 2.876953125, 3.4580078125, 4.0390625, 4.6201171875, 5.201171875, 5.7822265625, 6.36328125, 6.9443359375, 7.525390625, 8.1064453125, 8.6875, 9.2685546875, 9.849609375, 10.4306640625, 11.01171875, 11.5927734375, 12.173828125, 12.7548828125, 13.3359375, 13.9169921875, 14.498046875, 15.0791015625, 15.66015625, 16.2412109375, 16.822265625, 17.4033203125, 17.984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 6.0, 8.0, 11.0, 19.0, 20.0, 28.0, 47.0, 68.0, 100.0, 142.0, 193.0, 331.0, 707.0, 1245.0, 399.0, 237.0, 168.0, 107.0, 68.0, 52.0, 29.0, 17.0, 15.0, 16.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -5.987060546875, -5.73974609375, -5.492431640625, -5.2451171875, -4.997802734375, -4.75048828125, -4.503173828125, -4.255859375, -4.008544921875, -3.76123046875, -3.513916015625, -3.2666015625, -3.019287109375, -2.77197265625, -2.524658203125, -2.27734375, -2.030029296875, -1.78271484375, -1.535400390625, -1.2880859375, -1.040771484375, -0.79345703125, -0.546142578125, -0.298828125, -0.051513671875, 0.19580078125, 0.443115234375, 0.6904296875, 0.937744140625, 1.18505859375, 1.432373046875, 1.6796875, 1.927001953125, 2.17431640625, 2.421630859375, 2.6689453125, 2.916259765625, 3.16357421875, 3.410888671875, 3.658203125, 3.905517578125, 4.15283203125, 4.400146484375, 4.6474609375, 4.894775390625, 5.14208984375, 5.389404296875, 5.63671875, 5.884033203125, 6.13134765625, 6.378662109375, 6.6259765625, 6.873291015625, 7.12060546875, 7.367919921875, 7.615234375, 7.862548828125, 8.10986328125, 8.357177734375, 8.6044921875, 8.851806640625, 9.09912109375, 9.346435546875, 9.59375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 12.0, 18.0, 34.0, 58.0, 85.0, 106.0, 138.0, 129.0, 126.0, 111.0, 69.0, 51.0, 24.0, 12.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.6125602722168, -58.34540939331055, -56.07825469970703, -53.81110382080078, -51.543949127197266, -49.276798248291016, -47.0096435546875, -44.74249267578125, -42.475341796875, -40.20819091796875, -37.941036224365234, -35.673885345458984, -33.40673065185547, -31.13957977294922, -28.872426986694336, -26.605274200439453, -24.338119506835938, -22.070966720581055, -19.803813934326172, -17.536663055419922, -15.269509315490723, -13.00235652923584, -10.735204696655273, -8.46805191040039, -6.200899124145508, -3.933746576309204, -1.6665940284729004, 0.6005582809448242, 2.867711067199707, 5.13486385345459, 7.402015686035156, 9.669168472290039, 11.936317443847656, 14.203470230102539, 16.470623016357422, 18.737773895263672, 21.004928588867188, 23.272079467773438, 25.53923225402832, 27.806385040283203, 30.073537826538086, 32.34069061279297, 34.60784149169922, 36.874996185302734, 39.142147064208984, 41.4093017578125, 43.67645263671875, 45.943603515625, 48.210758209228516, 50.477909088134766, 52.74506378173828, 55.01221466064453, 57.27936935424805, 59.5465202331543, 61.81367492675781, 64.08082580566406, 66.34797668457031, 68.61512756347656, 70.88227844238281, 73.1494369506836, 75.41658782958984, 77.6837387084961, 79.95088958740234, 82.21804809570312, 84.48519897460938]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 13.0, 7.0, 9.0, 17.0, 25.0, 19.0, 24.0, 34.0, 30.0, 28.0, 34.0, 31.0, 46.0, 36.0, 42.0, 50.0, 37.0, 38.0, 39.0, 47.0, 51.0, 37.0, 43.0, 30.0, 35.0, 24.0, 32.0, 25.0, 18.0, 9.0, 10.0, 11.0, 7.0, 14.0, 13.0, 1.0, 5.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.631668090820312, -25.734140396118164, -24.836612701416016, -23.939083099365234, -23.041555404663086, -22.144027709960938, -21.24650001525879, -20.34897232055664, -19.45144271850586, -18.55391502380371, -17.656387329101562, -16.75885772705078, -15.861330032348633, -14.963802337646484, -14.066274642944336, -13.168746948242188, -12.271219253540039, -11.37369155883789, -10.476162910461426, -9.578635215759277, -8.681106567382812, -7.783578872680664, -6.886051177978516, -5.988523006439209, -5.090994834899902, -4.193466663360596, -3.295938730239868, -2.3984107971191406, -1.500882625579834, -0.6033544540405273, 0.2941732406616211, 1.1917014122009277, 2.0892295837402344, 2.986757755279541, 3.8842856884002686, 4.781813621520996, 5.679341793060303, 6.576869964599609, 7.474397659301758, 8.371925354003906, 9.269454002380371, 10.16698169708252, 11.064510345458984, 11.962038040161133, 12.859565734863281, 13.757094383239746, 14.654622077941895, 15.55215072631836, 16.449678421020508, 17.347206115722656, 18.244733810424805, 19.142261505126953, 20.039791107177734, 20.937318801879883, 21.83484649658203, 22.73237419128418, 23.629901885986328, 24.527429580688477, 25.424957275390625, 26.322486877441406, 27.220014572143555, 28.117542266845703, 29.01506996154785, 29.91259765625, 30.81012725830078]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 7.0, 8.0, 25.0, 24.0, 51.0, 112.0, 244.0, 533.0, 1711.0, 8902.0, 93079.0, 741358.0, 184277.0, 14511.0, 2447.0, 712.0, 278.0, 136.0, 73.0, 27.0, 16.0, 13.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.5009765625, -33.251953125, -32.0029296875, -30.75390625, -29.5048828125, -28.255859375, -27.0068359375, -25.7578125, -24.5087890625, -23.259765625, -22.0107421875, -20.76171875, -19.5126953125, -18.263671875, -17.0146484375, -15.765625, -14.5166015625, -13.267578125, -12.0185546875, -10.76953125, -9.5205078125, -8.271484375, -7.0224609375, -5.7734375, -4.5244140625, -3.275390625, -2.0263671875, -0.77734375, 0.4716796875, 1.720703125, 2.9697265625, 4.21875, 5.4677734375, 6.716796875, 7.9658203125, 9.21484375, 10.4638671875, 11.712890625, 12.9619140625, 14.2109375, 15.4599609375, 16.708984375, 17.9580078125, 19.20703125, 20.4560546875, 21.705078125, 22.9541015625, 24.203125, 25.4521484375, 26.701171875, 27.9501953125, 29.19921875, 30.4482421875, 31.697265625, 32.9462890625, 34.1953125, 35.4443359375, 36.693359375, 37.9423828125, 39.19140625, 40.4404296875, 41.689453125, 42.9384765625, 44.1875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 9.0, 12.0, 25.0, 28.0, 44.0, 45.0, 69.0, 80.0, 72.0, 82.0, 76.0, 85.0, 88.0, 67.0, 63.0, 34.0, 31.0, 39.0, 15.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.869140625, -3.696014404296875, -3.52288818359375, -3.349761962890625, -3.1766357421875, -3.003509521484375, -2.83038330078125, -2.657257080078125, -2.484130859375, -2.311004638671875, -2.13787841796875, -1.964752197265625, -1.7916259765625, -1.618499755859375, -1.44537353515625, -1.272247314453125, -1.09912109375, -0.925994873046875, -0.75286865234375, -0.579742431640625, -0.4066162109375, -0.233489990234375, -0.06036376953125, 0.112762451171875, 0.285888671875, 0.459014892578125, 0.63214111328125, 0.805267333984375, 0.9783935546875, 1.151519775390625, 1.32464599609375, 1.497772216796875, 1.6708984375, 1.844024658203125, 2.01715087890625, 2.190277099609375, 2.3634033203125, 2.536529541015625, 2.70965576171875, 2.882781982421875, 3.055908203125, 3.229034423828125, 3.40216064453125, 3.575286865234375, 3.7484130859375, 3.921539306640625, 4.09466552734375, 4.267791748046875, 4.44091796875, 4.614044189453125, 4.78717041015625, 4.960296630859375, 5.1334228515625, 5.306549072265625, 5.47967529296875, 5.652801513671875, 5.825927734375, 5.999053955078125, 6.17218017578125, 6.345306396484375, 6.5184326171875, 6.691558837890625, 6.86468505859375, 7.037811279296875, 7.2109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 2.0, 7.0, 7.0, 5.0, 15.0, 12.0, 27.0, 37.0, 53.0, 66.0, 105.0, 146.0, 174.0, 274.0, 369.0, 581.0, 927.0, 2007.0, 4952.0, 15885.0, 58169.0, 253198.0, 507997.0, 149640.0, 36077.0, 10459.0, 3540.0, 1474.0, 723.0, 488.0, 314.0, 228.0, 175.0, 129.0, 79.0, 61.0, 37.0, 35.0, 25.0, 17.0, 11.0, 7.0, 6.0, 4.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.109375, -16.580078125, -16.05078125, -15.521484375, -14.9921875, -14.462890625, -13.93359375, -13.404296875, -12.875, -12.345703125, -11.81640625, -11.287109375, -10.7578125, -10.228515625, -9.69921875, -9.169921875, -8.640625, -8.111328125, -7.58203125, -7.052734375, -6.5234375, -5.994140625, -5.46484375, -4.935546875, -4.40625, -3.876953125, -3.34765625, -2.818359375, -2.2890625, -1.759765625, -1.23046875, -0.701171875, -0.171875, 0.357421875, 0.88671875, 1.416015625, 1.9453125, 2.474609375, 3.00390625, 3.533203125, 4.0625, 4.591796875, 5.12109375, 5.650390625, 6.1796875, 6.708984375, 7.23828125, 7.767578125, 8.296875, 8.826171875, 9.35546875, 9.884765625, 10.4140625, 10.943359375, 11.47265625, 12.001953125, 12.53125, 13.060546875, 13.58984375, 14.119140625, 14.6484375, 15.177734375, 15.70703125, 16.236328125, 16.765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 11.0, 14.0, 13.0, 10.0, 17.0, 21.0, 21.0, 23.0, 40.0, 31.0, 38.0, 38.0, 44.0, 53.0, 45.0, 43.0, 47.0, 51.0, 50.0, 45.0, 43.0, 45.0, 35.0, 30.0, 24.0, 26.0, 24.0, 16.0, 20.0, 10.0, 9.0, 11.0, 7.0, 10.0, 2.0, 3.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.5, -12.02392578125, -11.5478515625, -11.07177734375, -10.595703125, -10.11962890625, -9.6435546875, -9.16748046875, -8.69140625, -8.21533203125, -7.7392578125, -7.26318359375, -6.787109375, -6.31103515625, -5.8349609375, -5.35888671875, -4.8828125, -4.40673828125, -3.9306640625, -3.45458984375, -2.978515625, -2.50244140625, -2.0263671875, -1.55029296875, -1.07421875, -0.59814453125, -0.1220703125, 0.35400390625, 0.830078125, 1.30615234375, 1.7822265625, 2.25830078125, 2.734375, 3.21044921875, 3.6865234375, 4.16259765625, 4.638671875, 5.11474609375, 5.5908203125, 6.06689453125, 6.54296875, 7.01904296875, 7.4951171875, 7.97119140625, 8.447265625, 8.92333984375, 9.3994140625, 9.87548828125, 10.3515625, 10.82763671875, 11.3037109375, 11.77978515625, 12.255859375, 12.73193359375, 13.2080078125, 13.68408203125, 14.16015625, 14.63623046875, 15.1123046875, 15.58837890625, 16.064453125, 16.54052734375, 17.0166015625, 17.49267578125, 17.96875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 9.0, 10.0, 10.0, 20.0, 32.0, 32.0, 75.0, 91.0, 164.0, 262.0, 471.0, 716.0, 1480.0, 3219.0, 8442.0, 26174.0, 92159.0, 302682.0, 402587.0, 147520.0, 40919.0, 12703.0, 4541.0, 1887.0, 955.0, 533.0, 309.0, 187.0, 97.0, 90.0, 56.0, 34.0, 26.0, 16.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.7265625, -6.52978515625, -6.3330078125, -6.13623046875, -5.939453125, -5.74267578125, -5.5458984375, -5.34912109375, -5.15234375, -4.95556640625, -4.7587890625, -4.56201171875, -4.365234375, -4.16845703125, -3.9716796875, -3.77490234375, -3.578125, -3.38134765625, -3.1845703125, -2.98779296875, -2.791015625, -2.59423828125, -2.3974609375, -2.20068359375, -2.00390625, -1.80712890625, -1.6103515625, -1.41357421875, -1.216796875, -1.02001953125, -0.8232421875, -0.62646484375, -0.4296875, -0.23291015625, -0.0361328125, 0.16064453125, 0.357421875, 0.55419921875, 0.7509765625, 0.94775390625, 1.14453125, 1.34130859375, 1.5380859375, 1.73486328125, 1.931640625, 2.12841796875, 2.3251953125, 2.52197265625, 2.71875, 2.91552734375, 3.1123046875, 3.30908203125, 3.505859375, 3.70263671875, 3.8994140625, 4.09619140625, 4.29296875, 4.48974609375, 4.6865234375, 4.88330078125, 5.080078125, 5.27685546875, 5.4736328125, 5.67041015625, 5.8671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 2.0, 3.0, 6.0, 6.0, 5.0, 3.0, 15.0, 14.0, 24.0, 16.0, 30.0, 38.0, 49.0, 58.0, 57.0, 75.0, 76.0, 78.0, 80.0, 62.0, 59.0, 52.0, 34.0, 33.0, 24.0, 21.0, 15.0, 16.0, 9.0, 7.0, 3.0, 3.0, 6.0, 2.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010242462158203125, -0.000990167260169983, -0.0009560883045196533, -0.0009220093488693237, -0.0008879303932189941, -0.0008538514375686646, -0.000819772481918335, -0.0007856935262680054, -0.0007516145706176758, -0.0007175356149673462, -0.0006834566593170166, -0.000649377703666687, -0.0006152987480163574, -0.0005812197923660278, -0.0005471408367156982, -0.0005130618810653687, -0.00047898292541503906, -0.00044490396976470947, -0.0004108250141143799, -0.0003767460584640503, -0.0003426671028137207, -0.0003085881471633911, -0.0002745091915130615, -0.00024043023586273193, -0.00020635128021240234, -0.00017227232456207275, -0.00013819336891174316, -0.00010411441326141357, -7.003545761108398e-05, -3.5956501960754395e-05, -1.8775463104248047e-06, 3.2201409339904785e-05, 6.628036499023438e-05, 0.00010035932064056396, 0.00013443827629089355, 0.00016851723194122314, 0.00020259618759155273, 0.00023667514324188232, 0.0002707540988922119, 0.0003048330545425415, 0.0003389120101928711, 0.0003729909658432007, 0.0004070699214935303, 0.00044114887714385986, 0.00047522783279418945, 0.000509306788444519, 0.0005433857440948486, 0.0005774646997451782, 0.0006115436553955078, 0.0006456226110458374, 0.000679701566696167, 0.0007137805223464966, 0.0007478594779968262, 0.0007819384336471558, 0.0008160173892974854, 0.0008500963449478149, 0.0008841753005981445, 0.0009182542562484741, 0.0009523332118988037, 0.0009864121675491333, 0.0010204911231994629, 0.0010545700788497925, 0.001088649034500122, 0.0011227279901504517, 0.0011568069458007812]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 16.0, 14.0, 37.0, 36.0, 53.0, 84.0, 151.0, 261.0, 540.0, 1024.0, 2664.0, 8394.0, 46387.0, 356135.0, 530507.0, 83280.0, 12713.0, 3457.0, 1295.0, 649.0, 341.0, 181.0, 104.0, 75.0, 46.0, 26.0, 23.0, 9.0, 11.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.53125, -12.19384765625, -11.8564453125, -11.51904296875, -11.181640625, -10.84423828125, -10.5068359375, -10.16943359375, -9.83203125, -9.49462890625, -9.1572265625, -8.81982421875, -8.482421875, -8.14501953125, -7.8076171875, -7.47021484375, -7.1328125, -6.79541015625, -6.4580078125, -6.12060546875, -5.783203125, -5.44580078125, -5.1083984375, -4.77099609375, -4.43359375, -4.09619140625, -3.7587890625, -3.42138671875, -3.083984375, -2.74658203125, -2.4091796875, -2.07177734375, -1.734375, -1.39697265625, -1.0595703125, -0.72216796875, -0.384765625, -0.04736328125, 0.2900390625, 0.62744140625, 0.96484375, 1.30224609375, 1.6396484375, 1.97705078125, 2.314453125, 2.65185546875, 2.9892578125, 3.32666015625, 3.6640625, 4.00146484375, 4.3388671875, 4.67626953125, 5.013671875, 5.35107421875, 5.6884765625, 6.02587890625, 6.36328125, 6.70068359375, 7.0380859375, 7.37548828125, 7.712890625, 8.05029296875, 8.3876953125, 8.72509765625, 9.0625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 15.0, 13.0, 17.0, 25.0, 38.0, 42.0, 53.0, 66.0, 80.0, 95.0, 93.0, 89.0, 88.0, 59.0, 68.0, 32.0, 20.0, 32.0, 18.0, 15.0, 7.0, 8.0, 2.0, 5.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.98681640625, -7.7548828125, -7.52294921875, -7.291015625, -7.05908203125, -6.8271484375, -6.59521484375, -6.36328125, -6.13134765625, -5.8994140625, -5.66748046875, -5.435546875, -5.20361328125, -4.9716796875, -4.73974609375, -4.5078125, -4.27587890625, -4.0439453125, -3.81201171875, -3.580078125, -3.34814453125, -3.1162109375, -2.88427734375, -2.65234375, -2.42041015625, -2.1884765625, -1.95654296875, -1.724609375, -1.49267578125, -1.2607421875, -1.02880859375, -0.796875, -0.56494140625, -0.3330078125, -0.10107421875, 0.130859375, 0.36279296875, 0.5947265625, 0.82666015625, 1.05859375, 1.29052734375, 1.5224609375, 1.75439453125, 1.986328125, 2.21826171875, 2.4501953125, 2.68212890625, 2.9140625, 3.14599609375, 3.3779296875, 3.60986328125, 3.841796875, 4.07373046875, 4.3056640625, 4.53759765625, 4.76953125, 5.00146484375, 5.2333984375, 5.46533203125, 5.697265625, 5.92919921875, 6.1611328125, 6.39306640625, 6.625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 13.0, 22.0, 50.0, 94.0, 163.0, 178.0, 186.0, 139.0, 83.0, 40.0, 22.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-277.1130065917969, -271.21820068359375, -265.3233642578125, -259.4285583496094, -253.53372192382812, -247.638916015625, -241.7440948486328, -235.84927368164062, -229.95445251464844, -224.05963134765625, -218.16481018066406, -212.26998901367188, -206.37518310546875, -200.48036193847656, -194.58554077148438, -188.6907196044922, -182.7958984375, -176.9010772705078, -171.00625610351562, -165.11143493652344, -159.21661376953125, -153.32180786132812, -147.42698669433594, -141.53216552734375, -135.63734436035156, -129.74252319335938, -123.84770202636719, -117.95288848876953, -112.05806732177734, -106.16324615478516, -100.2684326171875, -94.37361145019531, -88.47879028320312, -82.58396911621094, -76.68914794921875, -70.7943344116211, -64.8995132446289, -59.00469207763672, -53.1098747253418, -47.215057373046875, -41.32023620605469, -35.4254150390625, -29.530597686767578, -23.635778427124023, -17.74095916748047, -11.846139907836914, -5.951320648193359, -0.0565032958984375, 5.83831787109375, 11.733137130737305, 17.62795639038086, 23.522775650024414, 29.41759490966797, 35.312416076660156, 41.20723342895508, 47.10205078125, 52.99687194824219, 58.891693115234375, 64.78651428222656, 70.68132781982422, 76.5761489868164, 82.4709701538086, 88.36578369140625, 94.26060485839844, 100.15542602539062]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 0.0, 6.0, 4.0, 3.0, 8.0, 15.0, 9.0, 19.0, 14.0, 17.0, 15.0, 30.0, 30.0, 42.0, 42.0, 43.0, 37.0, 47.0, 53.0, 55.0, 61.0, 61.0, 49.0, 41.0, 38.0, 45.0, 32.0, 28.0, 38.0, 25.0, 19.0, 23.0, 6.0, 13.0, 6.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.02273559570312, -84.3149185180664, -81.60710906982422, -78.8992919921875, -76.19147491455078, -73.48365783691406, -70.77584838867188, -68.06803131103516, -65.36021423339844, -62.652400970458984, -59.944583892822266, -57.23677062988281, -54.528953552246094, -51.82114028930664, -49.11332702636719, -46.40550994873047, -43.69770050048828, -40.98988723754883, -38.28207015991211, -35.574256896972656, -32.86643981933594, -30.158626556396484, -27.45081329345703, -24.742998123168945, -22.03518295288086, -19.327367782592773, -16.619552612304688, -13.911739349365234, -11.203924179077148, -8.496109008789062, -5.788295745849609, -3.0804805755615234, -0.3726654052734375, 2.3351492881774902, 5.042963981628418, 7.7507781982421875, 10.458593368530273, 13.16640853881836, 15.874221801757812, 18.5820369720459, 21.289852142333984, 23.99766731262207, 26.705482482910156, 29.41329574584961, 32.12110900878906, 34.82892608642578, 37.536739349365234, 40.24455261230469, 42.952369689941406, 45.66018295288086, 48.36800003051758, 51.07581329345703, 53.78363037109375, 56.4914436340332, 59.199256896972656, 61.907073974609375, 64.61488342285156, 67.32270050048828, 70.03050994873047, 72.73832702636719, 75.4461441040039, 78.15396118164062, 80.86177062988281, 83.56958770751953, 86.27740478515625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 16.0, 37.0, 81.0, 129.0, 275.0, 667.0, 1962.0, 8350.0, 133038.0, 4029866.0, 15189.0, 3018.0, 907.0, 361.0, 147.0, 76.0, 40.0, 34.0, 19.0, 11.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.4609375, -61.546875, -59.6328125, -57.71875, -55.8046875, -53.890625, -51.9765625, -50.0625, -48.1484375, -46.234375, -44.3203125, -42.40625, -40.4921875, -38.578125, -36.6640625, -34.75, -32.8359375, -30.921875, -29.0078125, -27.09375, -25.1796875, -23.265625, -21.3515625, -19.4375, -17.5234375, -15.609375, -13.6953125, -11.78125, -9.8671875, -7.953125, -6.0390625, -4.125, -2.2109375, -0.296875, 1.6171875, 3.53125, 5.4453125, 7.359375, 9.2734375, 11.1875, 13.1015625, 15.015625, 16.9296875, 18.84375, 20.7578125, 22.671875, 24.5859375, 26.5, 28.4140625, 30.328125, 32.2421875, 34.15625, 36.0703125, 37.984375, 39.8984375, 41.8125, 43.7265625, 45.640625, 47.5546875, 49.46875, 51.3828125, 53.296875, 55.2109375, 57.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 9.0, 20.0, 22.0, 31.0, 34.0, 52.0, 63.0, 55.0, 59.0, 68.0, 69.0, 78.0, 71.0, 66.0, 62.0, 53.0, 41.0, 40.0, 25.0, 18.0, 20.0, 13.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.791015625, -3.6171875, -3.443359375, -3.26953125, -3.095703125, -2.921875, -2.748046875, -2.57421875, -2.400390625, -2.2265625, -2.052734375, -1.87890625, -1.705078125, -1.53125, -1.357421875, -1.18359375, -1.009765625, -0.8359375, -0.662109375, -0.48828125, -0.314453125, -0.140625, 0.033203125, 0.20703125, 0.380859375, 0.5546875, 0.728515625, 0.90234375, 1.076171875, 1.25, 1.423828125, 1.59765625, 1.771484375, 1.9453125, 2.119140625, 2.29296875, 2.466796875, 2.640625, 2.814453125, 2.98828125, 3.162109375, 3.3359375, 3.509765625, 3.68359375, 3.857421875, 4.03125, 4.205078125, 4.37890625, 4.552734375, 4.7265625, 4.900390625, 5.07421875, 5.248046875, 5.421875, 5.595703125, 5.76953125, 5.943359375, 6.1171875, 6.291015625, 6.46484375, 6.638671875, 6.8125, 6.986328125, 7.16015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 20.0, 25.0, 33.0, 63.0, 132.0, 197.0, 384.0, 670.0, 1308.0, 2635.0, 6319.0, 21173.0, 144911.0, 3936707.0, 58273.0, 12800.0, 4502.0, 1951.0, 986.0, 502.0, 275.0, 176.0, 89.0, 56.0, 40.0, 22.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.84375, -33.004150390625, -32.16455078125, -31.324951171875, -30.4853515625, -29.645751953125, -28.80615234375, -27.966552734375, -27.126953125, -26.287353515625, -25.44775390625, -24.608154296875, -23.7685546875, -22.928955078125, -22.08935546875, -21.249755859375, -20.41015625, -19.570556640625, -18.73095703125, -17.891357421875, -17.0517578125, -16.212158203125, -15.37255859375, -14.532958984375, -13.693359375, -12.853759765625, -12.01416015625, -11.174560546875, -10.3349609375, -9.495361328125, -8.65576171875, -7.816162109375, -6.9765625, -6.136962890625, -5.29736328125, -4.457763671875, -3.6181640625, -2.778564453125, -1.93896484375, -1.099365234375, -0.259765625, 0.579833984375, 1.41943359375, 2.259033203125, 3.0986328125, 3.938232421875, 4.77783203125, 5.617431640625, 6.45703125, 7.296630859375, 8.13623046875, 8.975830078125, 9.8154296875, 10.655029296875, 11.49462890625, 12.334228515625, 13.173828125, 14.013427734375, 14.85302734375, 15.692626953125, 16.5322265625, 17.371826171875, 18.21142578125, 19.051025390625, 19.890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 14.0, 7.0, 22.0, 33.0, 34.0, 79.0, 167.0, 3099.0, 320.0, 110.0, 52.0, 36.0, 21.0, 20.0, 12.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.074310302734375, -3.95330810546875, -3.832305908203125, -3.7113037109375, -3.590301513671875, -3.46929931640625, -3.348297119140625, -3.227294921875, -3.106292724609375, -2.98529052734375, -2.864288330078125, -2.7432861328125, -2.622283935546875, -2.50128173828125, -2.380279541015625, -2.25927734375, -2.138275146484375, -2.01727294921875, -1.896270751953125, -1.7752685546875, -1.654266357421875, -1.53326416015625, -1.412261962890625, -1.291259765625, -1.170257568359375, -1.04925537109375, -0.928253173828125, -0.8072509765625, -0.686248779296875, -0.56524658203125, -0.444244384765625, -0.3232421875, -0.202239990234375, -0.08123779296875, 0.039764404296875, 0.1607666015625, 0.281768798828125, 0.40277099609375, 0.523773193359375, 0.644775390625, 0.765777587890625, 0.88677978515625, 1.007781982421875, 1.1287841796875, 1.249786376953125, 1.37078857421875, 1.491790771484375, 1.61279296875, 1.733795166015625, 1.85479736328125, 1.975799560546875, 2.0968017578125, 2.217803955078125, 2.33880615234375, 2.459808349609375, 2.580810546875, 2.701812744140625, 2.82281494140625, 2.943817138671875, 3.0648193359375, 3.185821533203125, 3.30682373046875, 3.427825927734375, 3.548828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 10.0, 8.0, 12.0, 17.0, 33.0, 41.0, 62.0, 60.0, 76.0, 99.0, 91.0, 89.0, 96.0, 80.0, 67.0, 43.0, 37.0, 23.0, 11.0, 15.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.29732894897461, -18.775888442993164, -18.25444793701172, -17.733007431030273, -17.211566925048828, -16.690128326416016, -16.16868782043457, -15.647247314453125, -15.12580680847168, -14.604366302490234, -14.082925796508789, -13.56148624420166, -13.040045738220215, -12.51860523223877, -11.99716567993164, -11.475725173950195, -10.95428466796875, -10.432844161987305, -9.91140365600586, -9.38996410369873, -8.868523597717285, -8.34708309173584, -7.825643062591553, -7.304203033447266, -6.78276252746582, -6.261322021484375, -5.739881992340088, -5.218441963195801, -4.6970014572143555, -4.17556095123291, -3.654120922088623, -3.132680654525757, -2.6112422943115234, -2.0898020267486572, -1.568361759185791, -1.0469214916229248, -0.5254812240600586, -0.004040956497192383, 0.5173993110656738, 1.03883957862854, 1.5602798461914062, 2.0817201137542725, 2.6031603813171387, 3.124600648880005, 3.646040916442871, 4.167481422424316, 4.6889214515686035, 5.210361480712891, 5.731801986694336, 6.253242492675781, 6.774682521820068, 7.2961225509643555, 7.817563056945801, 8.339003562927246, 8.860443115234375, 9.38188362121582, 9.903324127197266, 10.424764633178711, 10.946205139160156, 11.467644691467285, 11.98908519744873, 12.510525703430176, 13.031965255737305, 13.55340576171875, 14.074846267700195]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 5.0, 12.0, 12.0, 13.0, 16.0, 16.0, 17.0, 27.0, 18.0, 32.0, 31.0, 44.0, 35.0, 41.0, 44.0, 45.0, 35.0, 44.0, 33.0, 48.0, 29.0, 36.0, 42.0, 29.0, 30.0, 35.0, 30.0, 24.0, 27.0, 25.0, 22.0, 14.0, 9.0, 14.0, 9.0, 11.0, 5.0, 6.0, 7.0, 3.0, 7.0, 1.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.998217582702637, -7.764782428741455, -7.531347274780273, -7.297912120819092, -7.06447696685791, -6.8310418128967285, -6.597606658935547, -6.364171504974365, -6.130736351013184, -5.897301197052002, -5.66386604309082, -5.430430889129639, -5.196995735168457, -4.963560581207275, -4.730125427246094, -4.496690273284912, -4.2632551193237305, -4.029819965362549, -3.796384811401367, -3.5629496574401855, -3.329514503479004, -3.0960793495178223, -2.8626441955566406, -2.629209041595459, -2.3957738876342773, -2.1623387336730957, -1.928903579711914, -1.6954684257507324, -1.4620332717895508, -1.2285981178283691, -0.9951629638671875, -0.7617278099060059, -0.5282926559448242, -0.2948575019836426, -0.06142234802246094, 0.1720128059387207, 0.40544795989990234, 0.638883113861084, 0.8723182678222656, 1.1057534217834473, 1.339188575744629, 1.5726237297058105, 1.8060588836669922, 2.039494037628174, 2.2729291915893555, 2.506364345550537, 2.7397994995117188, 2.9732346534729004, 3.206669807434082, 3.4401049613952637, 3.6735401153564453, 3.906975269317627, 4.140410423278809, 4.37384557723999, 4.607280731201172, 4.8407158851623535, 5.074151039123535, 5.307586193084717, 5.541021347045898, 5.77445650100708, 6.007891654968262, 6.241326808929443, 6.474761962890625, 6.708197116851807, 6.941632270812988]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 13.0, 33.0, 36.0, 68.0, 120.0, 245.0, 540.0, 1358.0, 4731.0, 22283.0, 121462.0, 574537.0, 265471.0, 45099.0, 8768.0, 2299.0, 779.0, 319.0, 159.0, 92.0, 39.0, 33.0, 26.0, 15.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.078125, -25.347900390625, -24.61767578125, -23.887451171875, -23.1572265625, -22.427001953125, -21.69677734375, -20.966552734375, -20.236328125, -19.506103515625, -18.77587890625, -18.045654296875, -17.3154296875, -16.585205078125, -15.85498046875, -15.124755859375, -14.39453125, -13.664306640625, -12.93408203125, -12.203857421875, -11.4736328125, -10.743408203125, -10.01318359375, -9.282958984375, -8.552734375, -7.822509765625, -7.09228515625, -6.362060546875, -5.6318359375, -4.901611328125, -4.17138671875, -3.441162109375, -2.7109375, -1.980712890625, -1.25048828125, -0.520263671875, 0.2099609375, 0.940185546875, 1.67041015625, 2.400634765625, 3.130859375, 3.861083984375, 4.59130859375, 5.321533203125, 6.0517578125, 6.781982421875, 7.51220703125, 8.242431640625, 8.97265625, 9.702880859375, 10.43310546875, 11.163330078125, 11.8935546875, 12.623779296875, 13.35400390625, 14.084228515625, 14.814453125, 15.544677734375, 16.27490234375, 17.005126953125, 17.7353515625, 18.465576171875, 19.19580078125, 19.926025390625, 20.65625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 3.0, 1.0, 4.0, 8.0, 16.0, 15.0, 20.0, 20.0, 28.0, 35.0, 48.0, 49.0, 47.0, 69.0, 52.0, 74.0, 75.0, 78.0, 55.0, 48.0, 53.0, 42.0, 45.0, 26.0, 23.0, 24.0, 18.0, 6.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.8719482421875, -3.697021484375, -3.5220947265625, -3.34716796875, -3.1722412109375, -2.997314453125, -2.8223876953125, -2.6474609375, -2.4725341796875, -2.297607421875, -2.1226806640625, -1.94775390625, -1.7728271484375, -1.597900390625, -1.4229736328125, -1.248046875, -1.0731201171875, -0.898193359375, -0.7232666015625, -0.54833984375, -0.3734130859375, -0.198486328125, -0.0235595703125, 0.1513671875, 0.3262939453125, 0.501220703125, 0.6761474609375, 0.85107421875, 1.0260009765625, 1.200927734375, 1.3758544921875, 1.55078125, 1.7257080078125, 1.900634765625, 2.0755615234375, 2.25048828125, 2.4254150390625, 2.600341796875, 2.7752685546875, 2.9501953125, 3.1251220703125, 3.300048828125, 3.4749755859375, 3.64990234375, 3.8248291015625, 3.999755859375, 4.1746826171875, 4.349609375, 4.5245361328125, 4.699462890625, 4.8743896484375, 5.04931640625, 5.2242431640625, 5.399169921875, 5.5740966796875, 5.7490234375, 5.9239501953125, 6.098876953125, 6.2738037109375, 6.44873046875, 6.6236572265625, 6.798583984375, 6.9735107421875, 7.1484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 15.0, 12.0, 16.0, 27.0, 38.0, 40.0, 67.0, 77.0, 126.0, 131.0, 199.0, 268.0, 433.0, 517.0, 883.0, 1542.0, 3660.0, 12252.0, 50825.0, 278105.0, 557140.0, 106926.0, 23340.0, 6212.0, 2208.0, 1081.0, 679.0, 486.0, 349.0, 233.0, 181.0, 138.0, 92.0, 66.0, 55.0, 41.0, 28.0, 16.0, 8.0, 13.0, 6.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.546875, -16.01708984375, -15.4873046875, -14.95751953125, -14.427734375, -13.89794921875, -13.3681640625, -12.83837890625, -12.30859375, -11.77880859375, -11.2490234375, -10.71923828125, -10.189453125, -9.65966796875, -9.1298828125, -8.60009765625, -8.0703125, -7.54052734375, -7.0107421875, -6.48095703125, -5.951171875, -5.42138671875, -4.8916015625, -4.36181640625, -3.83203125, -3.30224609375, -2.7724609375, -2.24267578125, -1.712890625, -1.18310546875, -0.6533203125, -0.12353515625, 0.40625, 0.93603515625, 1.4658203125, 1.99560546875, 2.525390625, 3.05517578125, 3.5849609375, 4.11474609375, 4.64453125, 5.17431640625, 5.7041015625, 6.23388671875, 6.763671875, 7.29345703125, 7.8232421875, 8.35302734375, 8.8828125, 9.41259765625, 9.9423828125, 10.47216796875, 11.001953125, 11.53173828125, 12.0615234375, 12.59130859375, 13.12109375, 13.65087890625, 14.1806640625, 14.71044921875, 15.240234375, 15.77001953125, 16.2998046875, 16.82958984375, 17.359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 4.0, 8.0, 18.0, 17.0, 21.0, 30.0, 27.0, 34.0, 38.0, 36.0, 44.0, 55.0, 44.0, 51.0, 56.0, 50.0, 58.0, 47.0, 50.0, 59.0, 39.0, 32.0, 33.0, 24.0, 20.0, 26.0, 16.0, 9.0, 11.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.171875, -20.55078125, -19.9296875, -19.30859375, -18.6875, -18.06640625, -17.4453125, -16.82421875, -16.203125, -15.58203125, -14.9609375, -14.33984375, -13.71875, -13.09765625, -12.4765625, -11.85546875, -11.234375, -10.61328125, -9.9921875, -9.37109375, -8.75, -8.12890625, -7.5078125, -6.88671875, -6.265625, -5.64453125, -5.0234375, -4.40234375, -3.78125, -3.16015625, -2.5390625, -1.91796875, -1.296875, -0.67578125, -0.0546875, 0.56640625, 1.1875, 1.80859375, 2.4296875, 3.05078125, 3.671875, 4.29296875, 4.9140625, 5.53515625, 6.15625, 6.77734375, 7.3984375, 8.01953125, 8.640625, 9.26171875, 9.8828125, 10.50390625, 11.125, 11.74609375, 12.3671875, 12.98828125, 13.609375, 14.23046875, 14.8515625, 15.47265625, 16.09375, 16.71484375, 17.3359375, 17.95703125, 18.578125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 16.0, 34.0, 40.0, 74.0, 107.0, 152.0, 228.0, 459.0, 854.0, 1898.0, 4350.0, 12983.0, 49121.0, 253997.0, 560317.0, 123151.0, 26998.0, 7969.0, 2928.0, 1268.0, 677.0, 339.0, 218.0, 123.0, 87.0, 45.0, 36.0, 20.0, 11.0, 7.0, 12.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.15716552734375, -6.9041748046875, -6.65118408203125, -6.398193359375, -6.14520263671875, -5.8922119140625, -5.63922119140625, -5.38623046875, -5.13323974609375, -4.8802490234375, -4.62725830078125, -4.374267578125, -4.12127685546875, -3.8682861328125, -3.61529541015625, -3.3623046875, -3.10931396484375, -2.8563232421875, -2.60333251953125, -2.350341796875, -2.09735107421875, -1.8443603515625, -1.59136962890625, -1.33837890625, -1.08538818359375, -0.8323974609375, -0.57940673828125, -0.326416015625, -0.07342529296875, 0.1795654296875, 0.43255615234375, 0.685546875, 0.93853759765625, 1.1915283203125, 1.44451904296875, 1.697509765625, 1.95050048828125, 2.2034912109375, 2.45648193359375, 2.70947265625, 2.96246337890625, 3.2154541015625, 3.46844482421875, 3.721435546875, 3.97442626953125, 4.2274169921875, 4.48040771484375, 4.7333984375, 4.98638916015625, 5.2393798828125, 5.49237060546875, 5.745361328125, 5.99835205078125, 6.2513427734375, 6.50433349609375, 6.75732421875, 7.01031494140625, 7.2633056640625, 7.51629638671875, 7.769287109375, 8.02227783203125, 8.2752685546875, 8.52825927734375, 8.78125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 5.0, 12.0, 14.0, 21.0, 13.0, 37.0, 34.0, 42.0, 58.0, 65.0, 73.0, 83.0, 81.0, 75.0, 82.0, 80.0, 48.0, 34.0, 27.0, 20.0, 17.0, 13.0, 7.0, 12.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0013275146484375, -0.0012937411665916443, -0.0012599676847457886, -0.0012261942028999329, -0.0011924207210540771, -0.0011586472392082214, -0.0011248737573623657, -0.00109110027551651, -0.0010573267936706543, -0.0010235533118247986, -0.0009897798299789429, -0.0009560063481330872, -0.0009222328662872314, -0.0008884593844413757, -0.00085468590259552, -0.0008209124207496643, -0.0007871389389038086, -0.0007533654570579529, -0.0007195919752120972, -0.0006858184933662415, -0.0006520450115203857, -0.00061827152967453, -0.0005844980478286743, -0.0005507245659828186, -0.0005169510841369629, -0.0004831776022911072, -0.00044940412044525146, -0.00041563063859939575, -0.00038185715675354004, -0.0003480836749076843, -0.0003143101930618286, -0.0002805367112159729, -0.0002467632293701172, -0.00021298974752426147, -0.00017921626567840576, -0.00014544278383255005, -0.00011166930198669434, -7.789582014083862e-05, -4.412233829498291e-05, -1.0348856449127197e-05, 2.3424625396728516e-05, 5.719810724258423e-05, 9.097158908843994e-05, 0.00012474507093429565, 0.00015851855278015137, 0.00019229203462600708, 0.0002260655164718628, 0.0002598389983177185, 0.0002936124801635742, 0.00032738596200942993, 0.00036115944385528564, 0.00039493292570114136, 0.00042870640754699707, 0.0004624798893928528, 0.0004962533712387085, 0.0005300268530845642, 0.0005638003349304199, 0.0005975738167762756, 0.0006313472986221313, 0.0006651207804679871, 0.0006988942623138428, 0.0007326677441596985, 0.0007664412260055542, 0.0008002147078514099, 0.0008339881896972656]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 13.0, 6.0, 17.0, 34.0, 54.0, 96.0, 142.0, 338.0, 696.0, 1820.0, 6689.0, 41693.0, 575256.0, 384428.0, 29143.0, 5301.0, 1583.0, 634.0, 271.0, 151.0, 67.0, 43.0, 28.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.4571533203125, -11.031494140625, -10.6058349609375, -10.18017578125, -9.7545166015625, -9.328857421875, -8.9031982421875, -8.4775390625, -8.0518798828125, -7.626220703125, -7.2005615234375, -6.77490234375, -6.3492431640625, -5.923583984375, -5.4979248046875, -5.072265625, -4.6466064453125, -4.220947265625, -3.7952880859375, -3.36962890625, -2.9439697265625, -2.518310546875, -2.0926513671875, -1.6669921875, -1.2413330078125, -0.815673828125, -0.3900146484375, 0.03564453125, 0.4613037109375, 0.886962890625, 1.3126220703125, 1.73828125, 2.1639404296875, 2.589599609375, 3.0152587890625, 3.44091796875, 3.8665771484375, 4.292236328125, 4.7178955078125, 5.1435546875, 5.5692138671875, 5.994873046875, 6.4205322265625, 6.84619140625, 7.2718505859375, 7.697509765625, 8.1231689453125, 8.548828125, 8.9744873046875, 9.400146484375, 9.8258056640625, 10.25146484375, 10.6771240234375, 11.102783203125, 11.5284423828125, 11.9541015625, 12.3797607421875, 12.805419921875, 13.2310791015625, 13.65673828125, 14.0823974609375, 14.508056640625, 14.9337158203125, 15.359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 13.0, 18.0, 25.0, 27.0, 39.0, 64.0, 92.0, 109.0, 114.0, 129.0, 95.0, 71.0, 61.0, 43.0, 28.0, 12.0, 18.0, 10.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.15435791015625, -5.8438720703125, -5.53338623046875, -5.222900390625, -4.91241455078125, -4.6019287109375, -4.29144287109375, -3.98095703125, -3.67047119140625, -3.3599853515625, -3.04949951171875, -2.739013671875, -2.42852783203125, -2.1180419921875, -1.80755615234375, -1.4970703125, -1.18658447265625, -0.8760986328125, -0.56561279296875, -0.255126953125, 0.05535888671875, 0.3658447265625, 0.67633056640625, 0.98681640625, 1.29730224609375, 1.6077880859375, 1.91827392578125, 2.228759765625, 2.53924560546875, 2.8497314453125, 3.16021728515625, 3.470703125, 3.78118896484375, 4.0916748046875, 4.40216064453125, 4.712646484375, 5.02313232421875, 5.3336181640625, 5.64410400390625, 5.95458984375, 6.26507568359375, 6.5755615234375, 6.88604736328125, 7.196533203125, 7.50701904296875, 7.8175048828125, 8.12799072265625, 8.4384765625, 8.74896240234375, 9.0594482421875, 9.36993408203125, 9.680419921875, 9.99090576171875, 10.3013916015625, 10.61187744140625, 10.92236328125, 11.23284912109375, 11.5433349609375, 11.85382080078125, 12.164306640625, 12.47479248046875, 12.7852783203125, 13.09576416015625, 13.40625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 12.0, 21.0, 43.0, 64.0, 121.0, 144.0, 165.0, 170.0, 109.0, 66.0, 44.0, 19.0, 15.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-171.34573364257812, -166.12405395507812, -160.90235900878906, -155.68067932128906, -150.45899963378906, -145.2373046875, -140.015625, -134.7939453125, -129.57225036621094, -124.3505630493164, -119.1288833618164, -113.90719604492188, -108.68550872802734, -103.46382141113281, -98.24214172363281, -93.02045440673828, -87.79877471923828, -82.57708740234375, -77.35540771484375, -72.13372039794922, -66.91203308105469, -61.69034957885742, -56.468666076660156, -51.246978759765625, -46.02529525756836, -40.803611755371094, -35.58192443847656, -30.360240936279297, -25.1385555267334, -19.9168701171875, -14.695186614990234, -9.473499298095703, -4.2518157958984375, 0.9698691368103027, 6.191554069519043, 11.413238525390625, 16.634923934936523, 21.856609344482422, 27.078292846679688, 32.29998016357422, 37.521663665771484, 42.74334716796875, 47.96503448486328, 53.18671798706055, 58.40840148925781, 63.630088806152344, 68.85177612304688, 74.07345581054688, 79.2951431274414, 84.51683044433594, 89.73851013183594, 94.96019744873047, 100.181884765625, 105.403564453125, 110.62525177001953, 115.84693908691406, 121.06861877441406, 126.2903060913086, 131.51199340820312, 136.73367309570312, 141.95535278320312, 147.1770477294922, 152.3987274169922, 157.62042236328125, 162.84210205078125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 9.0, 11.0, 9.0, 9.0, 15.0, 17.0, 16.0, 21.0, 26.0, 33.0, 36.0, 33.0, 38.0, 42.0, 34.0, 40.0, 50.0, 52.0, 49.0, 64.0, 42.0, 41.0, 43.0, 28.0, 46.0, 21.0, 25.0, 19.0, 16.0, 19.0, 12.0, 13.0, 10.0, 6.0, 5.0, 11.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.07047271728516, -75.499755859375, -72.92903137207031, -70.35831451416016, -67.78759765625, -65.21687316894531, -62.646156311035156, -60.075435638427734, -57.50471496582031, -54.93399429321289, -52.36327362060547, -49.79255676269531, -47.22183609008789, -44.65111541748047, -42.08039855957031, -39.50967788696289, -36.93895721435547, -34.36823654174805, -31.797517776489258, -29.22679901123047, -26.656078338623047, -24.085357666015625, -21.514638900756836, -18.943920135498047, -16.373199462890625, -13.80247974395752, -11.231760025024414, -8.661040306091309, -6.090320587158203, -3.5196008682250977, -0.9488811492919922, 1.6218376159667969, 4.1925506591796875, 6.763270378112793, 9.333990097045898, 11.904709815979004, 14.47542953491211, 17.04615020751953, 19.61686897277832, 22.18758773803711, 24.75830841064453, 27.329029083251953, 29.899747848510742, 32.47046661376953, 35.04118728637695, 37.611907958984375, 40.18262481689453, 42.75334548950195, 45.324066162109375, 47.8947868347168, 50.46550750732422, 53.036224365234375, 55.6069450378418, 58.17766571044922, 60.748382568359375, 63.3191032409668, 65.88982391357422, 68.46054077148438, 71.03126525878906, 73.60198211669922, 76.17269897460938, 78.74342346191406, 81.31414031982422, 83.88485717773438, 86.45558166503906]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 5.0, 9.0, 10.0, 20.0, 25.0, 54.0, 73.0, 153.0, 293.0, 679.0, 1806.0, 5839.0, 31804.0, 4001709.0, 133753.0, 12762.0, 3138.0, 1168.0, 471.0, 217.0, 112.0, 67.0, 30.0, 23.0, 14.0, 13.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.77685546875, -31.3974609375, -30.01806640625, -28.638671875, -27.25927734375, -25.8798828125, -24.50048828125, -23.12109375, -21.74169921875, -20.3623046875, -18.98291015625, -17.603515625, -16.22412109375, -14.8447265625, -13.46533203125, -12.0859375, -10.70654296875, -9.3271484375, -7.94775390625, -6.568359375, -5.18896484375, -3.8095703125, -2.43017578125, -1.05078125, 0.32861328125, 1.7080078125, 3.08740234375, 4.466796875, 5.84619140625, 7.2255859375, 8.60498046875, 9.984375, 11.36376953125, 12.7431640625, 14.12255859375, 15.501953125, 16.88134765625, 18.2607421875, 19.64013671875, 21.01953125, 22.39892578125, 23.7783203125, 25.15771484375, 26.537109375, 27.91650390625, 29.2958984375, 30.67529296875, 32.0546875, 33.43408203125, 34.8134765625, 36.19287109375, 37.572265625, 38.95166015625, 40.3310546875, 41.71044921875, 43.08984375, 44.46923828125, 45.8486328125, 47.22802734375, 48.607421875, 49.98681640625, 51.3662109375, 52.74560546875, 54.125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 14.0, 18.0, 21.0, 26.0, 25.0, 50.0, 51.0, 41.0, 61.0, 54.0, 74.0, 90.0, 64.0, 65.0, 68.0, 40.0, 55.0, 42.0, 28.0, 29.0, 20.0, 18.0, 12.0, 12.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982421875, -3.807342529296875, -3.63226318359375, -3.457183837890625, -3.2821044921875, -3.107025146484375, -2.93194580078125, -2.756866455078125, -2.581787109375, -2.406707763671875, -2.23162841796875, -2.056549072265625, -1.8814697265625, -1.706390380859375, -1.53131103515625, -1.356231689453125, -1.18115234375, -1.006072998046875, -0.83099365234375, -0.655914306640625, -0.4808349609375, -0.305755615234375, -0.13067626953125, 0.044403076171875, 0.219482421875, 0.394561767578125, 0.56964111328125, 0.744720458984375, 0.9197998046875, 1.094879150390625, 1.26995849609375, 1.445037841796875, 1.6201171875, 1.795196533203125, 1.97027587890625, 2.145355224609375, 2.3204345703125, 2.495513916015625, 2.67059326171875, 2.845672607421875, 3.020751953125, 3.195831298828125, 3.37091064453125, 3.545989990234375, 3.7210693359375, 3.896148681640625, 4.07122802734375, 4.246307373046875, 4.42138671875, 4.596466064453125, 4.77154541015625, 4.946624755859375, 5.1217041015625, 5.296783447265625, 5.47186279296875, 5.646942138671875, 5.822021484375, 5.997100830078125, 6.17218017578125, 6.347259521484375, 6.5223388671875, 6.697418212890625, 6.87249755859375, 7.047576904296875, 7.22265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 17.0, 16.0, 35.0, 47.0, 88.0, 99.0, 177.0, 248.0, 376.0, 615.0, 921.0, 1478.0, 2427.0, 4201.0, 7355.0, 14419.0, 31117.0, 84851.0, 2928091.0, 972600.0, 82682.0, 30531.0, 14092.0, 7220.0, 4162.0, 2380.0, 1423.0, 888.0, 577.0, 390.0, 252.0, 166.0, 109.0, 71.0, 46.0, 39.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.1920166015625, -10.805908203125, -10.4197998046875, -10.03369140625, -9.6475830078125, -9.261474609375, -8.8753662109375, -8.4892578125, -8.1031494140625, -7.717041015625, -7.3309326171875, -6.94482421875, -6.5587158203125, -6.172607421875, -5.7864990234375, -5.400390625, -5.0142822265625, -4.628173828125, -4.2420654296875, -3.85595703125, -3.4698486328125, -3.083740234375, -2.6976318359375, -2.3115234375, -1.9254150390625, -1.539306640625, -1.1531982421875, -0.76708984375, -0.3809814453125, 0.005126953125, 0.3912353515625, 0.77734375, 1.1634521484375, 1.549560546875, 1.9356689453125, 2.32177734375, 2.7078857421875, 3.093994140625, 3.4801025390625, 3.8662109375, 4.2523193359375, 4.638427734375, 5.0245361328125, 5.41064453125, 5.7967529296875, 6.182861328125, 6.5689697265625, 6.955078125, 7.3411865234375, 7.727294921875, 8.1134033203125, 8.49951171875, 8.8856201171875, 9.271728515625, 9.6578369140625, 10.0439453125, 10.4300537109375, 10.816162109375, 11.2022705078125, 11.58837890625, 11.9744873046875, 12.360595703125, 12.7467041015625, 13.1328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 9.0, 7.0, 11.0, 7.0, 20.0, 19.0, 30.0, 56.0, 49.0, 85.0, 184.0, 2544.0, 622.0, 162.0, 69.0, 45.0, 29.0, 21.0, 24.0, 11.0, 16.0, 12.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.672943115234375, -3.56463623046875, -3.456329345703125, -3.3480224609375, -3.239715576171875, -3.13140869140625, -3.023101806640625, -2.914794921875, -2.806488037109375, -2.69818115234375, -2.589874267578125, -2.4815673828125, -2.373260498046875, -2.26495361328125, -2.156646728515625, -2.04833984375, -1.940032958984375, -1.83172607421875, -1.723419189453125, -1.6151123046875, -1.506805419921875, -1.39849853515625, -1.290191650390625, -1.181884765625, -1.073577880859375, -0.96527099609375, -0.856964111328125, -0.7486572265625, -0.640350341796875, -0.53204345703125, -0.423736572265625, -0.3154296875, -0.207122802734375, -0.09881591796875, 0.009490966796875, 0.1177978515625, 0.226104736328125, 0.33441162109375, 0.442718505859375, 0.551025390625, 0.659332275390625, 0.76763916015625, 0.875946044921875, 0.9842529296875, 1.092559814453125, 1.20086669921875, 1.309173583984375, 1.41748046875, 1.525787353515625, 1.63409423828125, 1.742401123046875, 1.8507080078125, 1.959014892578125, 2.06732177734375, 2.175628662109375, 2.283935546875, 2.392242431640625, 2.50054931640625, 2.608856201171875, 2.7171630859375, 2.825469970703125, 2.93377685546875, 3.042083740234375, 3.150390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 14.0, 9.0, 22.0, 37.0, 42.0, 52.0, 64.0, 80.0, 92.0, 81.0, 96.0, 83.0, 74.0, 64.0, 63.0, 41.0, 28.0, 24.0, 14.0, 12.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78056526184082, -21.241167068481445, -20.701766967773438, -20.162368774414062, -19.622970581054688, -19.08357048034668, -18.544172286987305, -18.004772186279297, -17.465373992919922, -16.925975799560547, -16.38657569885254, -15.847177505493164, -15.307778358459473, -14.768379211425781, -14.228981018066406, -13.689581871032715, -13.150182723999023, -12.610783576965332, -12.07138442993164, -11.531986236572266, -10.992587089538574, -10.453187942504883, -9.913789749145508, -9.374390602111816, -8.834991455078125, -8.295592308044434, -7.7561936378479, -7.216794967651367, -6.677395820617676, -6.137996673583984, -5.598598003387451, -5.059199333190918, -4.519800186157227, -3.9804012775421143, -3.441002368927002, -2.9016034603118896, -2.3622045516967773, -1.822805643081665, -1.2834067344665527, -0.7440078258514404, -0.20460891723632812, 0.3347899913787842, 0.8741888999938965, 1.4135878086090088, 1.952986717224121, 2.4923856258392334, 3.0317845344543457, 3.571183443069458, 4.11058235168457, 4.649981498718262, 5.189380168914795, 5.728778839111328, 6.2681779861450195, 6.807577133178711, 7.346975803375244, 7.886374473571777, 8.425773620605469, 8.96517276763916, 9.504571914672852, 10.043970108032227, 10.583369255065918, 11.12276840209961, 11.662166595458984, 12.201565742492676, 12.740964889526367]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 6.0, 7.0, 9.0, 19.0, 23.0, 13.0, 14.0, 21.0, 19.0, 22.0, 32.0, 37.0, 29.0, 32.0, 41.0, 36.0, 46.0, 47.0, 45.0, 28.0, 47.0, 39.0, 35.0, 30.0, 33.0, 32.0, 23.0, 24.0, 27.0, 27.0, 26.0, 16.0, 12.0, 16.0, 8.0, 8.0, 10.0, 13.0, 4.0, 5.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.702902793884277, -8.4434814453125, -8.184060096740723, -7.924638748168945, -7.665217399597168, -7.405796051025391, -7.146374702453613, -6.886953353881836, -6.627532005310059, -6.368110656738281, -6.108689308166504, -5.849267959594727, -5.589846611022949, -5.330425262451172, -5.0710039138793945, -4.811582565307617, -4.552161693572998, -4.292740345001221, -4.033318996429443, -3.773897647857666, -3.5144762992858887, -3.2550549507141113, -2.995633840560913, -2.7362124919891357, -2.4767911434173584, -2.217369794845581, -1.9579484462738037, -1.698527216911316, -1.4391058683395386, -1.1796845197677612, -0.9202632904052734, -0.6608419418334961, -0.40142059326171875, -0.1419992744922638, 0.11742204427719116, 0.37684333324432373, 0.6362646818161011, 0.8956860303878784, 1.1551072597503662, 1.4145286083221436, 1.673949956893921, 1.9333713054656982, 2.1927926540374756, 2.452213764190674, 2.711635112762451, 2.9710564613342285, 3.230477809906006, 3.489899158477783, 3.7493205070495605, 4.008741855621338, 4.268163204193115, 4.527584552764893, 4.78700590133667, 5.046427249908447, 5.305848121643066, 5.565269470214844, 5.824690818786621, 6.084112167358398, 6.343533515930176, 6.602954864501953, 6.8623762130737305, 7.121797561645508, 7.381218910217285, 7.6406402587890625, 7.90006160736084]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 20.0, 25.0, 48.0, 70.0, 144.0, 271.0, 638.0, 1778.0, 5685.0, 23299.0, 128421.0, 511452.0, 304329.0, 55752.0, 11521.0, 3083.0, 1077.0, 437.0, 209.0, 141.0, 57.0, 29.0, 22.0, 18.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.4429931640625, -19.901611328125, -19.3602294921875, -18.81884765625, -18.2774658203125, -17.736083984375, -17.1947021484375, -16.6533203125, -16.1119384765625, -15.570556640625, -15.0291748046875, -14.48779296875, -13.9464111328125, -13.405029296875, -12.8636474609375, -12.322265625, -11.7808837890625, -11.239501953125, -10.6981201171875, -10.15673828125, -9.6153564453125, -9.073974609375, -8.5325927734375, -7.9912109375, -7.4498291015625, -6.908447265625, -6.3670654296875, -5.82568359375, -5.2843017578125, -4.742919921875, -4.2015380859375, -3.66015625, -3.1187744140625, -2.577392578125, -2.0360107421875, -1.49462890625, -0.9532470703125, -0.411865234375, 0.1295166015625, 0.6708984375, 1.2122802734375, 1.753662109375, 2.2950439453125, 2.83642578125, 3.3778076171875, 3.919189453125, 4.4605712890625, 5.001953125, 5.5433349609375, 6.084716796875, 6.6260986328125, 7.16748046875, 7.7088623046875, 8.250244140625, 8.7916259765625, 9.3330078125, 9.8743896484375, 10.415771484375, 10.9571533203125, 11.49853515625, 12.0399169921875, 12.581298828125, 13.1226806640625, 13.6640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 12.0, 18.0, 21.0, 23.0, 39.0, 39.0, 43.0, 47.0, 52.0, 57.0, 70.0, 74.0, 72.0, 57.0, 66.0, 50.0, 51.0, 38.0, 29.0, 25.0, 31.0, 14.0, 15.0, 17.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.84356689453125, -3.6676025390625, -3.49163818359375, -3.315673828125, -3.13970947265625, -2.9637451171875, -2.78778076171875, -2.61181640625, -2.43585205078125, -2.2598876953125, -2.08392333984375, -1.907958984375, -1.73199462890625, -1.5560302734375, -1.38006591796875, -1.2041015625, -1.02813720703125, -0.8521728515625, -0.67620849609375, -0.500244140625, -0.32427978515625, -0.1483154296875, 0.02764892578125, 0.20361328125, 0.37957763671875, 0.5555419921875, 0.73150634765625, 0.907470703125, 1.08343505859375, 1.2593994140625, 1.43536376953125, 1.611328125, 1.78729248046875, 1.9632568359375, 2.13922119140625, 2.315185546875, 2.49114990234375, 2.6671142578125, 2.84307861328125, 3.01904296875, 3.19500732421875, 3.3709716796875, 3.54693603515625, 3.722900390625, 3.89886474609375, 4.0748291015625, 4.25079345703125, 4.4267578125, 4.60272216796875, 4.7786865234375, 4.95465087890625, 5.130615234375, 5.30657958984375, 5.4825439453125, 5.65850830078125, 5.83447265625, 6.01043701171875, 6.1864013671875, 6.36236572265625, 6.538330078125, 6.71429443359375, 6.8902587890625, 7.06622314453125, 7.2421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 10.0, 10.0, 19.0, 42.0, 59.0, 129.0, 223.0, 364.0, 650.0, 1356.0, 4078.0, 38437.0, 773800.0, 214567.0, 10527.0, 2160.0, 948.0, 516.0, 290.0, 163.0, 84.0, 53.0, 34.0, 19.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.77099609375, -20.8544921875, -19.93798828125, -19.021484375, -18.10498046875, -17.1884765625, -16.27197265625, -15.35546875, -14.43896484375, -13.5224609375, -12.60595703125, -11.689453125, -10.77294921875, -9.8564453125, -8.93994140625, -8.0234375, -7.10693359375, -6.1904296875, -5.27392578125, -4.357421875, -3.44091796875, -2.5244140625, -1.60791015625, -0.69140625, 0.22509765625, 1.1416015625, 2.05810546875, 2.974609375, 3.89111328125, 4.8076171875, 5.72412109375, 6.640625, 7.55712890625, 8.4736328125, 9.39013671875, 10.306640625, 11.22314453125, 12.1396484375, 13.05615234375, 13.97265625, 14.88916015625, 15.8056640625, 16.72216796875, 17.638671875, 18.55517578125, 19.4716796875, 20.38818359375, 21.3046875, 22.22119140625, 23.1376953125, 24.05419921875, 24.970703125, 25.88720703125, 26.8037109375, 27.72021484375, 28.63671875, 29.55322265625, 30.4697265625, 31.38623046875, 32.302734375, 33.21923828125, 34.1357421875, 35.05224609375, 35.96875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 3.0, 7.0, 4.0, 7.0, 8.0, 17.0, 11.0, 15.0, 22.0, 22.0, 22.0, 37.0, 31.0, 32.0, 56.0, 29.0, 42.0, 43.0, 35.0, 45.0, 45.0, 30.0, 46.0, 56.0, 40.0, 40.0, 33.0, 31.0, 30.0, 27.0, 28.0, 16.0, 17.0, 14.0, 9.0, 11.0, 5.0, 8.0, 9.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.234375, -16.7138671875, -16.193359375, -15.6728515625, -15.15234375, -14.6318359375, -14.111328125, -13.5908203125, -13.0703125, -12.5498046875, -12.029296875, -11.5087890625, -10.98828125, -10.4677734375, -9.947265625, -9.4267578125, -8.90625, -8.3857421875, -7.865234375, -7.3447265625, -6.82421875, -6.3037109375, -5.783203125, -5.2626953125, -4.7421875, -4.2216796875, -3.701171875, -3.1806640625, -2.66015625, -2.1396484375, -1.619140625, -1.0986328125, -0.578125, -0.0576171875, 0.462890625, 0.9833984375, 1.50390625, 2.0244140625, 2.544921875, 3.0654296875, 3.5859375, 4.1064453125, 4.626953125, 5.1474609375, 5.66796875, 6.1884765625, 6.708984375, 7.2294921875, 7.75, 8.2705078125, 8.791015625, 9.3115234375, 9.83203125, 10.3525390625, 10.873046875, 11.3935546875, 11.9140625, 12.4345703125, 12.955078125, 13.4755859375, 13.99609375, 14.5166015625, 15.037109375, 15.5576171875, 16.078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 12.0, 17.0, 16.0, 21.0, 27.0, 33.0, 58.0, 85.0, 144.0, 235.0, 423.0, 870.0, 2120.0, 6913.0, 31118.0, 261956.0, 650603.0, 74148.0, 13251.0, 3680.0, 1295.0, 605.0, 313.0, 174.0, 114.0, 83.0, 57.0, 41.0, 24.0, 20.0, 16.0, 14.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-9.4921875, -9.20654296875, -8.9208984375, -8.63525390625, -8.349609375, -8.06396484375, -7.7783203125, -7.49267578125, -7.20703125, -6.92138671875, -6.6357421875, -6.35009765625, -6.064453125, -5.77880859375, -5.4931640625, -5.20751953125, -4.921875, -4.63623046875, -4.3505859375, -4.06494140625, -3.779296875, -3.49365234375, -3.2080078125, -2.92236328125, -2.63671875, -2.35107421875, -2.0654296875, -1.77978515625, -1.494140625, -1.20849609375, -0.9228515625, -0.63720703125, -0.3515625, -0.06591796875, 0.2197265625, 0.50537109375, 0.791015625, 1.07666015625, 1.3623046875, 1.64794921875, 1.93359375, 2.21923828125, 2.5048828125, 2.79052734375, 3.076171875, 3.36181640625, 3.6474609375, 3.93310546875, 4.21875, 4.50439453125, 4.7900390625, 5.07568359375, 5.361328125, 5.64697265625, 5.9326171875, 6.21826171875, 6.50390625, 6.78955078125, 7.0751953125, 7.36083984375, 7.646484375, 7.93212890625, 8.2177734375, 8.50341796875, 8.7890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 19.0, 30.0, 51.0, 83.0, 117.0, 168.0, 172.0, 127.0, 76.0, 39.0, 26.0, 16.0, 8.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001140594482421875, -0.001079946756362915, -0.001019299030303955, -0.0009586513042449951, -0.0008980035781860352, -0.0008373558521270752, -0.0007767081260681152, -0.0007160604000091553, -0.0006554126739501953, -0.0005947649478912354, -0.0005341172218322754, -0.00047346949577331543, -0.00041282176971435547, -0.0003521740436553955, -0.00029152631759643555, -0.00023087859153747559, -0.00017023086547851562, -0.00010958313941955566, -4.89354133605957e-05, 1.1712312698364258e-05, 7.236003875732422e-05, 0.00013300776481628418, 0.00019365549087524414, 0.0002543032169342041, 0.00031495094299316406, 0.000375598669052124, 0.000436246395111084, 0.0004968941211700439, 0.0005575418472290039, 0.0006181895732879639, 0.0006788372993469238, 0.0007394850254058838, 0.0008001327514648438, 0.0008607804775238037, 0.0009214282035827637, 0.0009820759296417236, 0.0010427236557006836, 0.0011033713817596436, 0.0011640191078186035, 0.0012246668338775635, 0.0012853145599365234, 0.0013459622859954834, 0.0014066100120544434, 0.0014672577381134033, 0.0015279054641723633, 0.0015885531902313232, 0.0016492009162902832, 0.0017098486423492432, 0.0017704963684082031, 0.001831144094467163, 0.001891791820526123, 0.001952439546585083, 0.002013087272644043, 0.002073734998703003, 0.002134382724761963, 0.002195030450820923, 0.002255678176879883, 0.0023163259029388428, 0.0023769736289978027, 0.0024376213550567627, 0.0024982690811157227, 0.0025589168071746826, 0.0026195645332336426, 0.0026802122592926025, 0.0027408599853515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 24.0, 36.0, 59.0, 94.0, 185.0, 305.0, 668.0, 2143.0, 10363.0, 150358.0, 823110.0, 52897.0, 5756.0, 1364.0, 546.0, 282.0, 146.0, 62.0, 34.0, 32.0, 20.0, 10.0, 10.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.328125, -15.8660888671875, -15.404052734375, -14.9420166015625, -14.47998046875, -14.0179443359375, -13.555908203125, -13.0938720703125, -12.6318359375, -12.1697998046875, -11.707763671875, -11.2457275390625, -10.78369140625, -10.3216552734375, -9.859619140625, -9.3975830078125, -8.935546875, -8.4735107421875, -8.011474609375, -7.5494384765625, -7.08740234375, -6.6253662109375, -6.163330078125, -5.7012939453125, -5.2392578125, -4.7772216796875, -4.315185546875, -3.8531494140625, -3.39111328125, -2.9290771484375, -2.467041015625, -2.0050048828125, -1.54296875, -1.0809326171875, -0.618896484375, -0.1568603515625, 0.30517578125, 0.7672119140625, 1.229248046875, 1.6912841796875, 2.1533203125, 2.6153564453125, 3.077392578125, 3.5394287109375, 4.00146484375, 4.4635009765625, 4.925537109375, 5.3875732421875, 5.849609375, 6.3116455078125, 6.773681640625, 7.2357177734375, 7.69775390625, 8.1597900390625, 8.621826171875, 9.0838623046875, 9.5458984375, 10.0079345703125, 10.469970703125, 10.9320068359375, 11.39404296875, 11.8560791015625, 12.318115234375, 12.7801513671875, 13.2421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 12.0, 12.0, 20.0, 28.0, 64.0, 93.0, 121.0, 142.0, 150.0, 101.0, 89.0, 53.0, 40.0, 22.0, 12.0, 4.0, 6.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-15.8359375, -15.4912109375, -15.146484375, -14.8017578125, -14.45703125, -14.1123046875, -13.767578125, -13.4228515625, -13.078125, -12.7333984375, -12.388671875, -12.0439453125, -11.69921875, -11.3544921875, -11.009765625, -10.6650390625, -10.3203125, -9.9755859375, -9.630859375, -9.2861328125, -8.94140625, -8.5966796875, -8.251953125, -7.9072265625, -7.5625, -7.2177734375, -6.873046875, -6.5283203125, -6.18359375, -5.8388671875, -5.494140625, -5.1494140625, -4.8046875, -4.4599609375, -4.115234375, -3.7705078125, -3.42578125, -3.0810546875, -2.736328125, -2.3916015625, -2.046875, -1.7021484375, -1.357421875, -1.0126953125, -0.66796875, -0.3232421875, 0.021484375, 0.3662109375, 0.7109375, 1.0556640625, 1.400390625, 1.7451171875, 2.08984375, 2.4345703125, 2.779296875, 3.1240234375, 3.46875, 3.8134765625, 4.158203125, 4.5029296875, 4.84765625, 5.1923828125, 5.537109375, 5.8818359375, 6.2265625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 9.0, 12.0, 27.0, 76.0, 104.0, 149.0, 171.0, 165.0, 133.0, 68.0, 40.0, 14.0, 18.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.68679809570312, -84.5965805053711, -79.50636291503906, -74.41615295410156, -69.32593536376953, -64.2357177734375, -59.145503997802734, -54.05529022216797, -48.96507263183594, -43.874855041503906, -38.78464126586914, -33.694427490234375, -28.604209899902344, -23.513994216918945, -18.423778533935547, -13.333564758300781, -8.24334716796875, -3.1531314849853516, 1.9370841979980469, 7.027299880981445, 12.117515563964844, 17.207731246948242, 22.29794692993164, 27.388160705566406, 32.47837829589844, 37.56859588623047, 42.658809661865234, 47.7490234375, 52.83924102783203, 57.92945861816406, 63.01967239379883, 68.1098861694336, 73.20008850097656, 78.2903060913086, 83.38052368164062, 88.47073364257812, 93.56095123291016, 98.65116882324219, 103.74137878417969, 108.83159637451172, 113.92181396484375, 119.01203155517578, 124.10224914550781, 129.1924591064453, 134.28268432617188, 139.37289428710938, 144.46310424804688, 149.55331420898438, 154.64353942871094, 159.73374938964844, 164.823974609375, 169.9141845703125, 175.00439453125, 180.09461975097656, 185.18482971191406, 190.27505493164062, 195.36526489257812, 200.45547485351562, 205.5457000732422, 210.6359100341797, 215.72613525390625, 220.81634521484375, 225.90655517578125, 230.99676513671875, 236.0869903564453]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 8.0, 9.0, 18.0, 23.0, 27.0, 22.0, 25.0, 32.0, 31.0, 54.0, 39.0, 50.0, 45.0, 46.0, 62.0, 48.0, 49.0, 47.0, 38.0, 49.0, 36.0, 31.0, 25.0, 29.0, 28.0, 15.0, 17.0, 15.0, 14.0, 6.0, 16.0, 8.0, 5.0, 3.0, 0.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.55218505859375, -72.94676971435547, -70.34136199951172, -67.73594665527344, -65.13053894042969, -62.525123596191406, -59.919708251953125, -57.31429672241211, -54.708885192871094, -52.10347366333008, -49.49806213378906, -46.89264678955078, -44.287235260009766, -41.68182373046875, -39.07640838623047, -36.47099685668945, -33.86558532714844, -31.260173797607422, -28.654760360717773, -26.049346923828125, -23.44393539428711, -20.838523864746094, -18.233110427856445, -15.627696990966797, -13.022285461425781, -10.41687297821045, -7.811460494995117, -5.206048011779785, -2.600635528564453, 0.004776954650878906, 2.610189437866211, 5.215602874755859, 7.821014404296875, 10.426426887512207, 13.031839370727539, 15.637251853942871, 18.242664337158203, 20.84807586669922, 23.453489303588867, 26.058902740478516, 28.66431427001953, 31.269725799560547, 33.87513732910156, 36.480552673339844, 39.08596420288086, 41.691375732421875, 44.296791076660156, 46.90220260620117, 49.50761413574219, 52.1130256652832, 54.71843719482422, 57.3238525390625, 59.929264068603516, 62.53467559814453, 65.14009094238281, 67.74549865722656, 70.35091400146484, 72.95632934570312, 75.56173706054688, 78.16715240478516, 80.77256774902344, 83.37797546386719, 85.98339080810547, 88.58880615234375, 91.1942138671875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 8.0, 13.0, 21.0, 41.0, 58.0, 78.0, 127.0, 253.0, 521.0, 1080.0, 2553.0, 6606.0, 24020.0, 4024467.0, 111675.0, 14509.0, 4673.0, 1831.0, 839.0, 406.0, 200.0, 112.0, 70.0, 32.0, 16.0, 19.0, 7.0, 12.0, 8.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-33.8125, -32.841552734375, -31.87060546875, -30.899658203125, -29.9287109375, -28.957763671875, -27.98681640625, -27.015869140625, -26.044921875, -25.073974609375, -24.10302734375, -23.132080078125, -22.1611328125, -21.190185546875, -20.21923828125, -19.248291015625, -18.27734375, -17.306396484375, -16.33544921875, -15.364501953125, -14.3935546875, -13.422607421875, -12.45166015625, -11.480712890625, -10.509765625, -9.538818359375, -8.56787109375, -7.596923828125, -6.6259765625, -5.655029296875, -4.68408203125, -3.713134765625, -2.7421875, -1.771240234375, -0.80029296875, 0.170654296875, 1.1416015625, 2.112548828125, 3.08349609375, 4.054443359375, 5.025390625, 5.996337890625, 6.96728515625, 7.938232421875, 8.9091796875, 9.880126953125, 10.85107421875, 11.822021484375, 12.79296875, 13.763916015625, 14.73486328125, 15.705810546875, 16.6767578125, 17.647705078125, 18.61865234375, 19.589599609375, 20.560546875, 21.531494140625, 22.50244140625, 23.473388671875, 24.4443359375, 25.415283203125, 26.38623046875, 27.357177734375, 28.328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 14.0, 19.0, 16.0, 17.0, 27.0, 24.0, 38.0, 48.0, 44.0, 53.0, 53.0, 73.0, 76.0, 58.0, 50.0, 53.0, 71.0, 46.0, 33.0, 36.0, 37.0, 15.0, 24.0, 14.0, 9.0, 5.0, 13.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.824127197265625, -3.65020751953125, -3.476287841796875, -3.3023681640625, -3.128448486328125, -2.95452880859375, -2.780609130859375, -2.606689453125, -2.432769775390625, -2.25885009765625, -2.084930419921875, -1.9110107421875, -1.737091064453125, -1.56317138671875, -1.389251708984375, -1.21533203125, -1.041412353515625, -0.86749267578125, -0.693572998046875, -0.5196533203125, -0.345733642578125, -0.17181396484375, 0.002105712890625, 0.176025390625, 0.349945068359375, 0.52386474609375, 0.697784423828125, 0.8717041015625, 1.045623779296875, 1.21954345703125, 1.393463134765625, 1.5673828125, 1.741302490234375, 1.91522216796875, 2.089141845703125, 2.2630615234375, 2.436981201171875, 2.61090087890625, 2.784820556640625, 2.958740234375, 3.132659912109375, 3.30657958984375, 3.480499267578125, 3.6544189453125, 3.828338623046875, 4.00225830078125, 4.176177978515625, 4.35009765625, 4.524017333984375, 4.69793701171875, 4.871856689453125, 5.0457763671875, 5.219696044921875, 5.39361572265625, 5.567535400390625, 5.741455078125, 5.915374755859375, 6.08929443359375, 6.263214111328125, 6.4371337890625, 6.611053466796875, 6.78497314453125, 6.958892822265625, 7.1328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 16.0, 21.0, 32.0, 43.0, 98.0, 107.0, 204.0, 362.0, 608.0, 1099.0, 2037.0, 4160.0, 9508.0, 29304.0, 3782421.0, 321699.0, 25664.0, 8701.0, 3837.0, 1900.0, 1010.0, 579.0, 347.0, 191.0, 107.0, 74.0, 54.0, 40.0, 18.0, 12.0, 6.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-27.59375, -26.88525390625, -26.1767578125, -25.46826171875, -24.759765625, -24.05126953125, -23.3427734375, -22.63427734375, -21.92578125, -21.21728515625, -20.5087890625, -19.80029296875, -19.091796875, -18.38330078125, -17.6748046875, -16.96630859375, -16.2578125, -15.54931640625, -14.8408203125, -14.13232421875, -13.423828125, -12.71533203125, -12.0068359375, -11.29833984375, -10.58984375, -9.88134765625, -9.1728515625, -8.46435546875, -7.755859375, -7.04736328125, -6.3388671875, -5.63037109375, -4.921875, -4.21337890625, -3.5048828125, -2.79638671875, -2.087890625, -1.37939453125, -0.6708984375, 0.03759765625, 0.74609375, 1.45458984375, 2.1630859375, 2.87158203125, 3.580078125, 4.28857421875, 4.9970703125, 5.70556640625, 6.4140625, 7.12255859375, 7.8310546875, 8.53955078125, 9.248046875, 9.95654296875, 10.6650390625, 11.37353515625, 12.08203125, 12.79052734375, 13.4990234375, 14.20751953125, 14.916015625, 15.62451171875, 16.3330078125, 17.04150390625, 17.75]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 3.0, 12.0, 20.0, 17.0, 26.0, 79.0, 645.0, 3027.0, 82.0, 40.0, 21.0, 23.0, 14.0, 13.0, 4.0, 4.0, 7.0, 5.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.0562744140625, -3.921142578125, -3.7860107421875, -3.65087890625, -3.5157470703125, -3.380615234375, -3.2454833984375, -3.1103515625, -2.9752197265625, -2.840087890625, -2.7049560546875, -2.56982421875, -2.4346923828125, -2.299560546875, -2.1644287109375, -2.029296875, -1.8941650390625, -1.759033203125, -1.6239013671875, -1.48876953125, -1.3536376953125, -1.218505859375, -1.0833740234375, -0.9482421875, -0.8131103515625, -0.677978515625, -0.5428466796875, -0.40771484375, -0.2725830078125, -0.137451171875, -0.0023193359375, 0.1328125, 0.2679443359375, 0.403076171875, 0.5382080078125, 0.67333984375, 0.8084716796875, 0.943603515625, 1.0787353515625, 1.2138671875, 1.3489990234375, 1.484130859375, 1.6192626953125, 1.75439453125, 1.8895263671875, 2.024658203125, 2.1597900390625, 2.294921875, 2.4300537109375, 2.565185546875, 2.7003173828125, 2.83544921875, 2.9705810546875, 3.105712890625, 3.2408447265625, 3.3759765625, 3.5111083984375, 3.646240234375, 3.7813720703125, 3.91650390625, 4.0516357421875, 4.186767578125, 4.3218994140625, 4.45703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 14.0, 15.0, 33.0, 37.0, 61.0, 52.0, 85.0, 92.0, 111.0, 124.0, 91.0, 74.0, 55.0, 40.0, 34.0, 31.0, 14.0, 7.0, 9.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.199918746948242, -17.660322189331055, -17.1207275390625, -16.581130981445312, -16.041534423828125, -15.50193977355957, -14.962343215942383, -14.422747611999512, -13.88315200805664, -13.34355640411377, -12.803960800170898, -12.264364242553711, -11.72476863861084, -11.185173034667969, -10.645576477050781, -10.10598087310791, -9.566385269165039, -9.026789665222168, -8.487194061279297, -7.947597503662109, -7.408001899719238, -6.868406295776367, -6.328810214996338, -5.789214134216309, -5.2496185302734375, -4.710022926330566, -4.170426845550537, -3.630831003189087, -3.0912351608276367, -2.5516393184661865, -2.0120434761047363, -1.4724476337432861, -0.9328498840332031, -0.39325404167175293, 0.14634180068969727, 0.6859376430511475, 1.2255334854125977, 1.7651293277740479, 2.304725170135498, 2.8443210124969482, 3.3839168548583984, 3.9235126972198486, 4.463108539581299, 5.002704620361328, 5.542300224304199, 6.08189582824707, 6.6214919090271, 7.161087989807129, 7.70068359375, 8.240279197692871, 8.779874801635742, 9.31947135925293, 9.8590669631958, 10.398662567138672, 10.93825912475586, 11.47785472869873, 12.017450332641602, 12.557045936584473, 13.096641540527344, 13.636238098144531, 14.175833702087402, 14.715429306030273, 15.255025863647461, 15.794621467590332, 16.334217071533203]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 9.0, 8.0, 9.0, 9.0, 7.0, 16.0, 21.0, 21.0, 24.0, 22.0, 24.0, 25.0, 30.0, 44.0, 34.0, 40.0, 40.0, 41.0, 32.0, 37.0, 45.0, 37.0, 29.0, 40.0, 32.0, 37.0, 28.0, 34.0, 32.0, 28.0, 25.0, 23.0, 12.0, 16.0, 13.0, 8.0, 5.0, 10.0, 6.0, 6.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.987802505493164, -7.732031345367432, -7.476259708404541, -7.220488548278809, -6.964717388153076, -6.708946228027344, -6.453174591064453, -6.197403430938721, -5.941632270812988, -5.685861110687256, -5.430089473724365, -5.174318313598633, -4.9185471534729, -4.662775993347168, -4.407004356384277, -4.151233196258545, -3.8954615592956543, -3.6396901607513428, -3.3839190006256104, -3.128147602081299, -2.8723764419555664, -2.616605043411255, -2.3608336448669434, -2.105062484741211, -1.8492910861968994, -1.5935198068618774, -1.3377485275268555, -1.081977128982544, -0.826205849647522, -0.5704345703125, -0.3146631717681885, -0.058891892433166504, 0.19687938690185547, 0.45265069603919983, 0.7084220051765442, 0.9641933441162109, 1.219964623451233, 1.4757359027862549, 1.7315073013305664, 1.9872785806655884, 2.2430498600006104, 2.498821258544922, 2.7545924186706543, 3.010363817214966, 3.2661352157592773, 3.5219063758850098, 3.7776777744293213, 4.033449172973633, 4.289220333099365, 4.544991493225098, 4.800763130187988, 5.056534290313721, 5.312305450439453, 5.568077087402344, 5.823848247528076, 6.079619407653809, 6.335391044616699, 6.591162204742432, 6.846933841705322, 7.102705001831055, 7.358476161956787, 7.6142473220825195, 7.87001895904541, 8.1257905960083, 8.381561279296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 21.0, 35.0, 55.0, 95.0, 139.0, 260.0, 477.0, 1126.0, 2731.0, 7795.0, 25658.0, 93392.0, 314884.0, 404607.0, 140615.0, 38772.0, 11315.0, 3691.0, 1432.0, 643.0, 367.0, 154.0, 102.0, 59.0, 49.0, 18.0, 15.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.8792724609375, -10.492919921875, -10.1065673828125, -9.72021484375, -9.3338623046875, -8.947509765625, -8.5611572265625, -8.1748046875, -7.7884521484375, -7.402099609375, -7.0157470703125, -6.62939453125, -6.2430419921875, -5.856689453125, -5.4703369140625, -5.083984375, -4.6976318359375, -4.311279296875, -3.9249267578125, -3.53857421875, -3.1522216796875, -2.765869140625, -2.3795166015625, -1.9931640625, -1.6068115234375, -1.220458984375, -0.8341064453125, -0.44775390625, -0.0614013671875, 0.324951171875, 0.7113037109375, 1.09765625, 1.4840087890625, 1.870361328125, 2.2567138671875, 2.64306640625, 3.0294189453125, 3.415771484375, 3.8021240234375, 4.1884765625, 4.5748291015625, 4.961181640625, 5.3475341796875, 5.73388671875, 6.1202392578125, 6.506591796875, 6.8929443359375, 7.279296875, 7.6656494140625, 8.052001953125, 8.4383544921875, 8.82470703125, 9.2110595703125, 9.597412109375, 9.9837646484375, 10.3701171875, 10.7564697265625, 11.142822265625, 11.5291748046875, 11.91552734375, 12.3018798828125, 12.688232421875, 13.0745849609375, 13.4609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 9.0, 11.0, 16.0, 19.0, 14.0, 21.0, 27.0, 30.0, 41.0, 39.0, 44.0, 51.0, 57.0, 67.0, 62.0, 62.0, 57.0, 58.0, 42.0, 60.0, 40.0, 24.0, 29.0, 21.0, 30.0, 15.0, 11.0, 8.0, 6.0, 7.0, 8.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0347900390625, -3.858642578125, -3.6824951171875, -3.50634765625, -3.3302001953125, -3.154052734375, -2.9779052734375, -2.8017578125, -2.6256103515625, -2.449462890625, -2.2733154296875, -2.09716796875, -1.9210205078125, -1.744873046875, -1.5687255859375, -1.392578125, -1.2164306640625, -1.040283203125, -0.8641357421875, -0.68798828125, -0.5118408203125, -0.335693359375, -0.1595458984375, 0.0166015625, 0.1927490234375, 0.368896484375, 0.5450439453125, 0.72119140625, 0.8973388671875, 1.073486328125, 1.2496337890625, 1.42578125, 1.6019287109375, 1.778076171875, 1.9542236328125, 2.13037109375, 2.3065185546875, 2.482666015625, 2.6588134765625, 2.8349609375, 3.0111083984375, 3.187255859375, 3.3634033203125, 3.53955078125, 3.7156982421875, 3.891845703125, 4.0679931640625, 4.244140625, 4.4202880859375, 4.596435546875, 4.7725830078125, 4.94873046875, 5.1248779296875, 5.301025390625, 5.4771728515625, 5.6533203125, 5.8294677734375, 6.005615234375, 6.1817626953125, 6.35791015625, 6.5340576171875, 6.710205078125, 6.8863525390625, 7.0625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 8.0, 20.0, 16.0, 24.0, 29.0, 56.0, 63.0, 108.0, 162.0, 209.0, 295.0, 423.0, 733.0, 1113.0, 2581.0, 10957.0, 101474.0, 746283.0, 161853.0, 15421.0, 3157.0, 1297.0, 675.0, 482.0, 339.0, 206.0, 163.0, 124.0, 76.0, 60.0, 33.0, 34.0, 19.0, 18.0, 9.0, 8.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.296875, -17.69873046875, -17.1005859375, -16.50244140625, -15.904296875, -15.30615234375, -14.7080078125, -14.10986328125, -13.51171875, -12.91357421875, -12.3154296875, -11.71728515625, -11.119140625, -10.52099609375, -9.9228515625, -9.32470703125, -8.7265625, -8.12841796875, -7.5302734375, -6.93212890625, -6.333984375, -5.73583984375, -5.1376953125, -4.53955078125, -3.94140625, -3.34326171875, -2.7451171875, -2.14697265625, -1.548828125, -0.95068359375, -0.3525390625, 0.24560546875, 0.84375, 1.44189453125, 2.0400390625, 2.63818359375, 3.236328125, 3.83447265625, 4.4326171875, 5.03076171875, 5.62890625, 6.22705078125, 6.8251953125, 7.42333984375, 8.021484375, 8.61962890625, 9.2177734375, 9.81591796875, 10.4140625, 11.01220703125, 11.6103515625, 12.20849609375, 12.806640625, 13.40478515625, 14.0029296875, 14.60107421875, 15.19921875, 15.79736328125, 16.3955078125, 16.99365234375, 17.591796875, 18.18994140625, 18.7880859375, 19.38623046875, 19.984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 5.0, 10.0, 14.0, 16.0, 26.0, 23.0, 18.0, 29.0, 37.0, 43.0, 53.0, 40.0, 43.0, 54.0, 59.0, 50.0, 48.0, 55.0, 43.0, 46.0, 42.0, 30.0, 25.0, 29.0, 28.0, 25.0, 11.0, 17.0, 21.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.59375, -21.927490234375, -21.26123046875, -20.594970703125, -19.9287109375, -19.262451171875, -18.59619140625, -17.929931640625, -17.263671875, -16.597412109375, -15.93115234375, -15.264892578125, -14.5986328125, -13.932373046875, -13.26611328125, -12.599853515625, -11.93359375, -11.267333984375, -10.60107421875, -9.934814453125, -9.2685546875, -8.602294921875, -7.93603515625, -7.269775390625, -6.603515625, -5.937255859375, -5.27099609375, -4.604736328125, -3.9384765625, -3.272216796875, -2.60595703125, -1.939697265625, -1.2734375, -0.607177734375, 0.05908203125, 0.725341796875, 1.3916015625, 2.057861328125, 2.72412109375, 3.390380859375, 4.056640625, 4.722900390625, 5.38916015625, 6.055419921875, 6.7216796875, 7.387939453125, 8.05419921875, 8.720458984375, 9.38671875, 10.052978515625, 10.71923828125, 11.385498046875, 12.0517578125, 12.718017578125, 13.38427734375, 14.050537109375, 14.716796875, 15.383056640625, 16.04931640625, 16.715576171875, 17.3818359375, 18.048095703125, 18.71435546875, 19.380615234375, 20.046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 12.0, 7.0, 14.0, 15.0, 24.0, 46.0, 59.0, 106.0, 160.0, 247.0, 516.0, 1272.0, 4753.0, 34527.0, 590646.0, 385539.0, 24693.0, 3766.0, 1076.0, 434.0, 232.0, 125.0, 95.0, 61.0, 41.0, 19.0, 17.0, 13.0, 10.0, 3.0, 10.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.1015625, -9.7640380859375, -9.426513671875, -9.0889892578125, -8.75146484375, -8.4139404296875, -8.076416015625, -7.7388916015625, -7.4013671875, -7.0638427734375, -6.726318359375, -6.3887939453125, -6.05126953125, -5.7137451171875, -5.376220703125, -5.0386962890625, -4.701171875, -4.3636474609375, -4.026123046875, -3.6885986328125, -3.35107421875, -3.0135498046875, -2.676025390625, -2.3385009765625, -2.0009765625, -1.6634521484375, -1.325927734375, -0.9884033203125, -0.65087890625, -0.3133544921875, 0.024169921875, 0.3616943359375, 0.69921875, 1.0367431640625, 1.374267578125, 1.7117919921875, 2.04931640625, 2.3868408203125, 2.724365234375, 3.0618896484375, 3.3994140625, 3.7369384765625, 4.074462890625, 4.4119873046875, 4.74951171875, 5.0870361328125, 5.424560546875, 5.7620849609375, 6.099609375, 6.4371337890625, 6.774658203125, 7.1121826171875, 7.44970703125, 7.7872314453125, 8.124755859375, 8.4622802734375, 8.7998046875, 9.1373291015625, 9.474853515625, 9.8123779296875, 10.14990234375, 10.4874267578125, 10.824951171875, 11.1624755859375, 11.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 11.0, 14.0, 13.0, 15.0, 29.0, 41.0, 57.0, 56.0, 100.0, 131.0, 117.0, 91.0, 74.0, 60.0, 41.0, 35.0, 23.0, 17.0, 16.0, 12.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010431110858917236, -0.0010085701942443848, -0.0009740293025970459, -0.000939488410949707, -0.0009049475193023682, -0.0008704066276550293, -0.0008358657360076904, -0.0008013248443603516, -0.0007667839527130127, -0.0007322430610656738, -0.000697702169418335, -0.0006631612777709961, -0.0006286203861236572, -0.0005940794944763184, -0.0005595386028289795, -0.0005249977111816406, -0.0004904568195343018, -0.0004559159278869629, -0.000421375036239624, -0.00038683414459228516, -0.0003522932529449463, -0.0003177523612976074, -0.00028321146965026855, -0.0002486705780029297, -0.00021412968635559082, -0.00017958879470825195, -0.00014504790306091309, -0.00011050701141357422, -7.596611976623535e-05, -4.1425228118896484e-05, -6.884336471557617e-06, 2.765655517578125e-05, 6.219744682312012e-05, 9.673833847045898e-05, 0.00013127923011779785, 0.00016582012176513672, 0.00020036101341247559, 0.00023490190505981445, 0.0002694427967071533, 0.0003039836883544922, 0.00033852458000183105, 0.0003730654716491699, 0.0004076063632965088, 0.00044214725494384766, 0.0004766881465911865, 0.0005112290382385254, 0.0005457699298858643, 0.0005803108215332031, 0.000614851713180542, 0.0006493926048278809, 0.0006839334964752197, 0.0007184743881225586, 0.0007530152797698975, 0.0007875561714172363, 0.0008220970630645752, 0.0008566379547119141, 0.0008911788463592529, 0.0009257197380065918, 0.0009602606296539307, 0.0009948015213012695, 0.0010293424129486084, 0.0010638833045959473, 0.0010984241962432861, 0.001132965087890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 13.0, 15.0, 36.0, 55.0, 101.0, 155.0, 338.0, 718.0, 2007.0, 8034.0, 89338.0, 827586.0, 107431.0, 9055.0, 2100.0, 765.0, 345.0, 176.0, 102.0, 61.0, 42.0, 29.0, 11.0, 8.0, 8.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.375, -7.967041015625, -7.55908203125, -7.151123046875, -6.7431640625, -6.335205078125, -5.92724609375, -5.519287109375, -5.111328125, -4.703369140625, -4.29541015625, -3.887451171875, -3.4794921875, -3.071533203125, -2.66357421875, -2.255615234375, -1.84765625, -1.439697265625, -1.03173828125, -0.623779296875, -0.2158203125, 0.192138671875, 0.60009765625, 1.008056640625, 1.416015625, 1.823974609375, 2.23193359375, 2.639892578125, 3.0478515625, 3.455810546875, 3.86376953125, 4.271728515625, 4.6796875, 5.087646484375, 5.49560546875, 5.903564453125, 6.3115234375, 6.719482421875, 7.12744140625, 7.535400390625, 7.943359375, 8.351318359375, 8.75927734375, 9.167236328125, 9.5751953125, 9.983154296875, 10.39111328125, 10.799072265625, 11.20703125, 11.614990234375, 12.02294921875, 12.430908203125, 12.8388671875, 13.246826171875, 13.65478515625, 14.062744140625, 14.470703125, 14.878662109375, 15.28662109375, 15.694580078125, 16.1025390625, 16.510498046875, 16.91845703125, 17.326416015625, 17.734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 9.0, 13.0, 21.0, 15.0, 29.0, 33.0, 48.0, 60.0, 70.0, 98.0, 95.0, 84.0, 92.0, 69.0, 54.0, 38.0, 42.0, 32.0, 23.0, 19.0, 10.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.23858642578125, -4.9888916015625, -4.73919677734375, -4.489501953125, -4.23980712890625, -3.9901123046875, -3.74041748046875, -3.49072265625, -3.24102783203125, -2.9913330078125, -2.74163818359375, -2.491943359375, -2.24224853515625, -1.9925537109375, -1.74285888671875, -1.4931640625, -1.24346923828125, -0.9937744140625, -0.74407958984375, -0.494384765625, -0.24468994140625, 0.0050048828125, 0.25469970703125, 0.50439453125, 0.75408935546875, 1.0037841796875, 1.25347900390625, 1.503173828125, 1.75286865234375, 2.0025634765625, 2.25225830078125, 2.501953125, 2.75164794921875, 3.0013427734375, 3.25103759765625, 3.500732421875, 3.75042724609375, 4.0001220703125, 4.24981689453125, 4.49951171875, 4.74920654296875, 4.9989013671875, 5.24859619140625, 5.498291015625, 5.74798583984375, 5.9976806640625, 6.24737548828125, 6.4970703125, 6.74676513671875, 6.9964599609375, 7.24615478515625, 7.495849609375, 7.74554443359375, 7.9952392578125, 8.24493408203125, 8.49462890625, 8.74432373046875, 8.9940185546875, 9.24371337890625, 9.493408203125, 9.74310302734375, 9.9927978515625, 10.24249267578125, 10.4921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 58.0, 378.0, 467.0, 81.0, 20.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-569.9039916992188, -554.0897216796875, -538.2754516601562, -522.461181640625, -506.6469421386719, -490.83270263671875, -475.0184326171875, -459.20416259765625, -443.389892578125, -427.57562255859375, -411.7613830566406, -395.9471130371094, -380.1328430175781, -364.318603515625, -348.50433349609375, -332.6900634765625, -316.87579345703125, -301.0615234375, -285.2472839355469, -269.4330139160156, -253.61874389648438, -237.8044891357422, -221.990234375, -206.17596435546875, -190.36172485351562, -174.54747009277344, -158.7332000732422, -142.9189453125, -127.10467529296875, -111.29042053222656, -95.47615814208984, -79.66189575195312, -63.847625732421875, -48.033363342285156, -32.21910095214844, -16.404842376708984, -0.5905799865722656, 15.223678588867188, 31.037940979003906, 46.852203369140625, 62.666465759277344, 78.48072814941406, 94.29499053955078, 110.1092529296875, 125.92350769042969, 141.73776245117188, 157.55203247070312, 173.36630249023438, 189.18055725097656, 204.99481201171875, 220.80908203125, 236.6233367919922, 252.43760681152344, 268.2518615722656, 284.0661315917969, 299.88037109375, 315.69464111328125, 331.5089111328125, 347.3231506347656, 363.1374206542969, 378.9516906738281, 394.76593017578125, 410.5802001953125, 426.39447021484375, 442.208740234375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 5.0, 10.0, 20.0, 21.0, 20.0, 22.0, 22.0, 23.0, 33.0, 29.0, 27.0, 41.0, 44.0, 55.0, 40.0, 50.0, 49.0, 34.0, 48.0, 34.0, 48.0, 41.0, 39.0, 30.0, 33.0, 27.0, 15.0, 22.0, 20.0, 20.0, 15.0, 10.0, 10.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.88735961914062, -79.22712707519531, -76.56689453125, -73.90666198730469, -71.2464370727539, -68.5862045288086, -65.92597198486328, -63.26573944091797, -60.605506896972656, -57.945274353027344, -55.2850456237793, -52.624813079833984, -49.96458053588867, -47.304351806640625, -44.64411926269531, -41.98388671875, -39.32365798950195, -36.66342544555664, -34.003196716308594, -31.34296417236328, -28.68273162841797, -26.02250099182129, -23.36227035522461, -20.702037811279297, -18.041807174682617, -15.381575584411621, -12.721343994140625, -10.061113357543945, -7.400881767272949, -4.740650177001953, -2.0804195404052734, 0.5798130035400391, 3.2400436401367188, 5.900275230407715, 8.560506820678711, 11.22073745727539, 13.880969047546387, 16.541200637817383, 19.201431274414062, 21.861663818359375, 24.521894454956055, 27.182125091552734, 29.842357635498047, 32.502586364746094, 35.162818908691406, 37.82305145263672, 40.48328399658203, 43.143516540527344, 45.80374526977539, 48.4639778137207, 51.12420654296875, 53.78443908691406, 56.444671630859375, 59.10490417480469, 61.765132904052734, 64.42536926269531, 67.0855941772461, 69.7458267211914, 72.40605926513672, 75.0662841796875, 77.72651672363281, 80.38674926757812, 83.04698181152344, 85.70721435546875, 88.36744689941406]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 5.0, 12.0, 10.0, 24.0, 49.0, 91.0, 141.0, 287.0, 628.0, 1324.0, 4011.0, 14591.0, 135207.0, 3992015.0, 34687.0, 7312.0, 2214.0, 836.0, 396.0, 192.0, 116.0, 42.0, 36.0, 15.0, 16.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.75, -21.88330078125, -21.0166015625, -20.14990234375, -19.283203125, -18.41650390625, -17.5498046875, -16.68310546875, -15.81640625, -14.94970703125, -14.0830078125, -13.21630859375, -12.349609375, -11.48291015625, -10.6162109375, -9.74951171875, -8.8828125, -8.01611328125, -7.1494140625, -6.28271484375, -5.416015625, -4.54931640625, -3.6826171875, -2.81591796875, -1.94921875, -1.08251953125, -0.2158203125, 0.65087890625, 1.517578125, 2.38427734375, 3.2509765625, 4.11767578125, 4.984375, 5.85107421875, 6.7177734375, 7.58447265625, 8.451171875, 9.31787109375, 10.1845703125, 11.05126953125, 11.91796875, 12.78466796875, 13.6513671875, 14.51806640625, 15.384765625, 16.25146484375, 17.1181640625, 17.98486328125, 18.8515625, 19.71826171875, 20.5849609375, 21.45166015625, 22.318359375, 23.18505859375, 24.0517578125, 24.91845703125, 25.78515625, 26.65185546875, 27.5185546875, 28.38525390625, 29.251953125, 30.11865234375, 30.9853515625, 31.85205078125, 32.71875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 9.0, 14.0, 16.0, 18.0, 22.0, 25.0, 40.0, 48.0, 47.0, 65.0, 56.0, 64.0, 73.0, 63.0, 74.0, 55.0, 51.0, 37.0, 44.0, 35.0, 26.0, 26.0, 13.0, 14.0, 5.0, 15.0, 5.0, 13.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.3380126953125, -4.156494140625, -3.9749755859375, -3.79345703125, -3.6119384765625, -3.430419921875, -3.2489013671875, -3.0673828125, -2.8858642578125, -2.704345703125, -2.5228271484375, -2.34130859375, -2.1597900390625, -1.978271484375, -1.7967529296875, -1.615234375, -1.4337158203125, -1.252197265625, -1.0706787109375, -0.88916015625, -0.7076416015625, -0.526123046875, -0.3446044921875, -0.1630859375, 0.0184326171875, 0.199951171875, 0.3814697265625, 0.56298828125, 0.7445068359375, 0.926025390625, 1.1075439453125, 1.2890625, 1.4705810546875, 1.652099609375, 1.8336181640625, 2.01513671875, 2.1966552734375, 2.378173828125, 2.5596923828125, 2.7412109375, 2.9227294921875, 3.104248046875, 3.2857666015625, 3.46728515625, 3.6488037109375, 3.830322265625, 4.0118408203125, 4.193359375, 4.3748779296875, 4.556396484375, 4.7379150390625, 4.91943359375, 5.1009521484375, 5.282470703125, 5.4639892578125, 5.6455078125, 5.8270263671875, 6.008544921875, 6.1900634765625, 6.37158203125, 6.5531005859375, 6.734619140625, 6.9161376953125, 7.09765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 16.0, 21.0, 22.0, 41.0, 51.0, 83.0, 135.0, 228.0, 445.0, 873.0, 1727.0, 4537.0, 13553.0, 78514.0, 3971090.0, 98426.0, 15538.0, 4905.0, 2017.0, 924.0, 487.0, 239.0, 134.0, 88.0, 46.0, 31.0, 30.0, 15.0, 25.0, 12.0, 3.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0], "bins": [-27.765625, -27.0972900390625, -26.428955078125, -25.7606201171875, -25.09228515625, -24.4239501953125, -23.755615234375, -23.0872802734375, -22.4189453125, -21.7506103515625, -21.082275390625, -20.4139404296875, -19.74560546875, -19.0772705078125, -18.408935546875, -17.7406005859375, -17.072265625, -16.4039306640625, -15.735595703125, -15.0672607421875, -14.39892578125, -13.7305908203125, -13.062255859375, -12.3939208984375, -11.7255859375, -11.0572509765625, -10.388916015625, -9.7205810546875, -9.05224609375, -8.3839111328125, -7.715576171875, -7.0472412109375, -6.37890625, -5.7105712890625, -5.042236328125, -4.3739013671875, -3.70556640625, -3.0372314453125, -2.368896484375, -1.7005615234375, -1.0322265625, -0.3638916015625, 0.304443359375, 0.9727783203125, 1.64111328125, 2.3094482421875, 2.977783203125, 3.6461181640625, 4.314453125, 4.9827880859375, 5.651123046875, 6.3194580078125, 6.98779296875, 7.6561279296875, 8.324462890625, 8.9927978515625, 9.6611328125, 10.3294677734375, 10.997802734375, 11.6661376953125, 12.33447265625, 13.0028076171875, 13.671142578125, 14.3394775390625, 15.0078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 14.0, 14.0, 22.0, 25.0, 56.0, 117.0, 328.0, 3038.0, 233.0, 88.0, 44.0, 22.0, 15.0, 12.0, 14.0, 2.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.68414306640625, -7.4542236328125, -7.22430419921875, -6.994384765625, -6.76446533203125, -6.5345458984375, -6.30462646484375, -6.07470703125, -5.84478759765625, -5.6148681640625, -5.38494873046875, -5.155029296875, -4.92510986328125, -4.6951904296875, -4.46527099609375, -4.2353515625, -4.00543212890625, -3.7755126953125, -3.54559326171875, -3.315673828125, -3.08575439453125, -2.8558349609375, -2.62591552734375, -2.39599609375, -2.16607666015625, -1.9361572265625, -1.70623779296875, -1.476318359375, -1.24639892578125, -1.0164794921875, -0.78656005859375, -0.556640625, -0.32672119140625, -0.0968017578125, 0.13311767578125, 0.363037109375, 0.59295654296875, 0.8228759765625, 1.05279541015625, 1.28271484375, 1.51263427734375, 1.7425537109375, 1.97247314453125, 2.202392578125, 2.43231201171875, 2.6622314453125, 2.89215087890625, 3.1220703125, 3.35198974609375, 3.5819091796875, 3.81182861328125, 4.041748046875, 4.27166748046875, 4.5015869140625, 4.73150634765625, 4.96142578125, 5.19134521484375, 5.4212646484375, 5.65118408203125, 5.881103515625, 6.11102294921875, 6.3409423828125, 6.57086181640625, 6.80078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 17.0, 31.0, 61.0, 108.0, 148.0, 141.0, 164.0, 127.0, 74.0, 55.0, 28.0, 17.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-61.56011962890625, -60.20906448364258, -58.85800552368164, -57.50695037841797, -56.1558952331543, -54.80483627319336, -53.45378112792969, -52.10272216796875, -50.75166702270508, -49.400611877441406, -48.04955291748047, -46.6984977722168, -45.347442626953125, -43.99638366699219, -42.645328521728516, -41.294273376464844, -39.943214416503906, -38.592159271240234, -37.2411003112793, -35.890045166015625, -34.53899002075195, -33.187931060791016, -31.836875915527344, -30.48581886291504, -29.134765625, -27.783708572387695, -26.432653427124023, -25.08159637451172, -23.730539321899414, -22.37948226928711, -21.028427124023438, -19.677370071411133, -18.326311111450195, -16.97525405883789, -15.624197959899902, -14.273141860961914, -12.92208480834961, -11.571028709411621, -10.219972610473633, -8.868915557861328, -7.51785945892334, -6.166802883148193, -4.815746307373047, -3.4646902084350586, -2.113633632659912, -0.7625770568847656, 0.5884790420532227, 1.9395360946655273, 3.2905921936035156, 4.641648769378662, 5.992705345153809, 7.343761444091797, 8.694818496704102, 10.04587459564209, 11.396930694580078, 12.747987747192383, 14.099043846130371, 15.45009994506836, 16.801156997680664, 18.15221405029297, 19.50326919555664, 20.854326248168945, 22.20538330078125, 23.556438446044922, 24.907495498657227]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 14.0, 16.0, 20.0, 22.0, 24.0, 21.0, 26.0, 29.0, 43.0, 36.0, 34.0, 45.0, 39.0, 57.0, 43.0, 44.0, 41.0, 56.0, 39.0, 41.0, 49.0, 32.0, 37.0, 31.0, 27.0, 19.0, 20.0, 21.0, 16.0, 6.0, 11.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.312578201293945, -15.806832313537598, -15.301087379455566, -14.795341491699219, -14.289596557617188, -13.78385066986084, -13.278104782104492, -12.772359848022461, -12.266613960266113, -11.760868072509766, -11.255123138427734, -10.749377250671387, -10.243631362915039, -9.737886428833008, -9.23214054107666, -8.726394653320312, -8.220649719238281, -7.714904308319092, -7.209158897399902, -6.703413009643555, -6.197667598724365, -5.691922187805176, -5.186176300048828, -4.680430889129639, -4.174685478210449, -3.6689400672912598, -3.163194417953491, -2.6574487686157227, -2.151703357696533, -1.6459579467773438, -1.1402122974395752, -0.6344666481018066, -0.12871932983398438, 0.37702620029449463, 0.8827717304229736, 1.3885172605514526, 1.8942627906799316, 2.400008201599121, 2.9057538509368896, 3.411499500274658, 3.9172449111938477, 4.422990322113037, 4.928735733032227, 5.434481620788574, 5.940227031707764, 6.445972442626953, 6.951718330383301, 7.45746374130249, 7.96320915222168, 8.468955039978027, 8.974699974060059, 9.480445861816406, 9.986190795898438, 10.491936683654785, 10.997682571411133, 11.503427505493164, 12.009173393249512, 12.51491928100586, 13.02066421508789, 13.526410102844238, 14.032155990600586, 14.537900924682617, 15.043646812438965, 15.549392700195312, 16.055137634277344]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 16.0, 24.0, 47.0, 78.0, 142.0, 249.0, 489.0, 1050.0, 2452.0, 7092.0, 23054.0, 88408.0, 341679.0, 425838.0, 114107.0, 29894.0, 8500.0, 3019.0, 1151.0, 575.0, 290.0, 140.0, 89.0, 58.0, 36.0, 16.0, 9.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-24.921875, -24.30029296875, -23.6787109375, -23.05712890625, -22.435546875, -21.81396484375, -21.1923828125, -20.57080078125, -19.94921875, -19.32763671875, -18.7060546875, -18.08447265625, -17.462890625, -16.84130859375, -16.2197265625, -15.59814453125, -14.9765625, -14.35498046875, -13.7333984375, -13.11181640625, -12.490234375, -11.86865234375, -11.2470703125, -10.62548828125, -10.00390625, -9.38232421875, -8.7607421875, -8.13916015625, -7.517578125, -6.89599609375, -6.2744140625, -5.65283203125, -5.03125, -4.40966796875, -3.7880859375, -3.16650390625, -2.544921875, -1.92333984375, -1.3017578125, -0.68017578125, -0.05859375, 0.56298828125, 1.1845703125, 1.80615234375, 2.427734375, 3.04931640625, 3.6708984375, 4.29248046875, 4.9140625, 5.53564453125, 6.1572265625, 6.77880859375, 7.400390625, 8.02197265625, 8.6435546875, 9.26513671875, 9.88671875, 10.50830078125, 11.1298828125, 11.75146484375, 12.373046875, 12.99462890625, 13.6162109375, 14.23779296875, 14.859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 6.0, 10.0, 6.0, 11.0, 15.0, 15.0, 18.0, 27.0, 26.0, 42.0, 41.0, 39.0, 65.0, 73.0, 52.0, 79.0, 71.0, 55.0, 65.0, 48.0, 42.0, 28.0, 37.0, 24.0, 26.0, 14.0, 13.0, 14.0, 14.0, 10.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.92645263671875, -4.7357177734375, -4.54498291015625, -4.354248046875, -4.16351318359375, -3.9727783203125, -3.78204345703125, -3.59130859375, -3.40057373046875, -3.2098388671875, -3.01910400390625, -2.828369140625, -2.63763427734375, -2.4468994140625, -2.25616455078125, -2.0654296875, -1.87469482421875, -1.6839599609375, -1.49322509765625, -1.302490234375, -1.11175537109375, -0.9210205078125, -0.73028564453125, -0.53955078125, -0.34881591796875, -0.1580810546875, 0.03265380859375, 0.223388671875, 0.41412353515625, 0.6048583984375, 0.79559326171875, 0.986328125, 1.17706298828125, 1.3677978515625, 1.55853271484375, 1.749267578125, 1.94000244140625, 2.1307373046875, 2.32147216796875, 2.51220703125, 2.70294189453125, 2.8936767578125, 3.08441162109375, 3.275146484375, 3.46588134765625, 3.6566162109375, 3.84735107421875, 4.0380859375, 4.22882080078125, 4.4195556640625, 4.61029052734375, 4.801025390625, 4.99176025390625, 5.1824951171875, 5.37322998046875, 5.56396484375, 5.75469970703125, 5.9454345703125, 6.13616943359375, 6.326904296875, 6.51763916015625, 6.7083740234375, 6.89910888671875, 7.08984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 9.0, 9.0, 21.0, 40.0, 61.0, 106.0, 179.0, 309.0, 584.0, 1327.0, 4097.0, 39276.0, 790051.0, 197810.0, 10656.0, 2162.0, 825.0, 428.0, 248.0, 116.0, 89.0, 55.0, 32.0, 21.0, 11.0, 12.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5, -36.388671875, -35.27734375, -34.166015625, -33.0546875, -31.943359375, -30.83203125, -29.720703125, -28.609375, -27.498046875, -26.38671875, -25.275390625, -24.1640625, -23.052734375, -21.94140625, -20.830078125, -19.71875, -18.607421875, -17.49609375, -16.384765625, -15.2734375, -14.162109375, -13.05078125, -11.939453125, -10.828125, -9.716796875, -8.60546875, -7.494140625, -6.3828125, -5.271484375, -4.16015625, -3.048828125, -1.9375, -0.826171875, 0.28515625, 1.396484375, 2.5078125, 3.619140625, 4.73046875, 5.841796875, 6.953125, 8.064453125, 9.17578125, 10.287109375, 11.3984375, 12.509765625, 13.62109375, 14.732421875, 15.84375, 16.955078125, 18.06640625, 19.177734375, 20.2890625, 21.400390625, 22.51171875, 23.623046875, 24.734375, 25.845703125, 26.95703125, 28.068359375, 29.1796875, 30.291015625, 31.40234375, 32.513671875, 33.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 11.0, 10.0, 15.0, 12.0, 22.0, 23.0, 29.0, 25.0, 28.0, 35.0, 32.0, 44.0, 37.0, 42.0, 38.0, 40.0, 45.0, 38.0, 39.0, 42.0, 24.0, 33.0, 37.0, 36.0, 29.0, 25.0, 28.0, 22.0, 18.0, 23.0, 14.0, 12.0, 12.0, 10.0, 6.0, 5.0, 3.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.9296875, -14.4205322265625, -13.911376953125, -13.4022216796875, -12.89306640625, -12.3839111328125, -11.874755859375, -11.3656005859375, -10.8564453125, -10.3472900390625, -9.838134765625, -9.3289794921875, -8.81982421875, -8.3106689453125, -7.801513671875, -7.2923583984375, -6.783203125, -6.2740478515625, -5.764892578125, -5.2557373046875, -4.74658203125, -4.2374267578125, -3.728271484375, -3.2191162109375, -2.7099609375, -2.2008056640625, -1.691650390625, -1.1824951171875, -0.67333984375, -0.1641845703125, 0.344970703125, 0.8541259765625, 1.36328125, 1.8724365234375, 2.381591796875, 2.8907470703125, 3.39990234375, 3.9090576171875, 4.418212890625, 4.9273681640625, 5.4365234375, 5.9456787109375, 6.454833984375, 6.9639892578125, 7.47314453125, 7.9822998046875, 8.491455078125, 9.0006103515625, 9.509765625, 10.0189208984375, 10.528076171875, 11.0372314453125, 11.54638671875, 12.0555419921875, 12.564697265625, 13.0738525390625, 13.5830078125, 14.0921630859375, 14.601318359375, 15.1104736328125, 15.61962890625, 16.1287841796875, 16.637939453125, 17.1470947265625, 17.65625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 14.0, 25.0, 31.0, 48.0, 62.0, 101.0, 197.0, 366.0, 687.0, 1518.0, 3737.0, 11686.0, 55358.0, 404600.0, 486311.0, 63347.0, 13206.0, 4095.0, 1555.0, 714.0, 387.0, 186.0, 121.0, 64.0, 45.0, 22.0, 10.0, 15.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6953125, -7.45513916015625, -7.2149658203125, -6.97479248046875, -6.734619140625, -6.49444580078125, -6.2542724609375, -6.01409912109375, -5.77392578125, -5.53375244140625, -5.2935791015625, -5.05340576171875, -4.813232421875, -4.57305908203125, -4.3328857421875, -4.09271240234375, -3.8525390625, -3.61236572265625, -3.3721923828125, -3.13201904296875, -2.891845703125, -2.65167236328125, -2.4114990234375, -2.17132568359375, -1.93115234375, -1.69097900390625, -1.4508056640625, -1.21063232421875, -0.970458984375, -0.73028564453125, -0.4901123046875, -0.24993896484375, -0.009765625, 0.23040771484375, 0.4705810546875, 0.71075439453125, 0.950927734375, 1.19110107421875, 1.4312744140625, 1.67144775390625, 1.91162109375, 2.15179443359375, 2.3919677734375, 2.63214111328125, 2.872314453125, 3.11248779296875, 3.3526611328125, 3.59283447265625, 3.8330078125, 4.07318115234375, 4.3133544921875, 4.55352783203125, 4.793701171875, 5.03387451171875, 5.2740478515625, 5.51422119140625, 5.75439453125, 5.99456787109375, 6.2347412109375, 6.47491455078125, 6.715087890625, 6.95526123046875, 7.1954345703125, 7.43560791015625, 7.67578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 13.0, 14.0, 10.0, 10.0, 15.0, 24.0, 26.0, 18.0, 37.0, 40.0, 41.0, 70.0, 83.0, 103.0, 110.0, 81.0, 54.0, 44.0, 34.0, 34.0, 27.0, 25.0, 11.0, 19.0, 8.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.001495361328125, -0.0014546513557434082, -0.0014139413833618164, -0.0013732314109802246, -0.0013325214385986328, -0.001291811466217041, -0.0012511014938354492, -0.0012103915214538574, -0.0011696815490722656, -0.0011289715766906738, -0.001088261604309082, -0.0010475516319274902, -0.0010068416595458984, -0.0009661316871643066, -0.0009254217147827148, -0.000884711742401123, -0.0008440017700195312, -0.0008032917976379395, -0.0007625818252563477, -0.0007218718528747559, -0.0006811618804931641, -0.0006404519081115723, -0.0005997419357299805, -0.0005590319633483887, -0.0005183219909667969, -0.0004776120185852051, -0.0004369020462036133, -0.0003961920738220215, -0.0003554821014404297, -0.0003147721290588379, -0.0002740621566772461, -0.0002333521842956543, -0.0001926422119140625, -0.0001519322395324707, -0.0001112222671508789, -7.051229476928711e-05, -2.9802322387695312e-05, 1.0907649993896484e-05, 5.161762237548828e-05, 9.232759475708008e-05, 0.00013303756713867188, 0.00017374753952026367, 0.00021445751190185547, 0.00025516748428344727, 0.00029587745666503906, 0.00033658742904663086, 0.00037729740142822266, 0.00041800737380981445, 0.00045871734619140625, 0.000499427318572998, 0.0005401372909545898, 0.0005808472633361816, 0.0006215572357177734, 0.0006622672080993652, 0.000702977180480957, 0.0007436871528625488, 0.0007843971252441406, 0.0008251070976257324, 0.0008658170700073242, 0.000906527042388916, 0.0009472370147705078, 0.0009879469871520996, 0.0010286569595336914, 0.0010693669319152832, 0.001110076904296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 6.0, 20.0, 12.0, 23.0, 36.0, 38.0, 47.0, 72.0, 114.0, 189.0, 330.0, 563.0, 1121.0, 2534.0, 7517.0, 34216.0, 283265.0, 618654.0, 78887.0, 13560.0, 4000.0, 1531.0, 747.0, 374.0, 230.0, 123.0, 89.0, 59.0, 42.0, 35.0, 30.0, 24.0, 16.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9765625, -8.706298828125, -8.43603515625, -8.165771484375, -7.8955078125, -7.625244140625, -7.35498046875, -7.084716796875, -6.814453125, -6.544189453125, -6.27392578125, -6.003662109375, -5.7333984375, -5.463134765625, -5.19287109375, -4.922607421875, -4.65234375, -4.382080078125, -4.11181640625, -3.841552734375, -3.5712890625, -3.301025390625, -3.03076171875, -2.760498046875, -2.490234375, -2.219970703125, -1.94970703125, -1.679443359375, -1.4091796875, -1.138916015625, -0.86865234375, -0.598388671875, -0.328125, -0.057861328125, 0.21240234375, 0.482666015625, 0.7529296875, 1.023193359375, 1.29345703125, 1.563720703125, 1.833984375, 2.104248046875, 2.37451171875, 2.644775390625, 2.9150390625, 3.185302734375, 3.45556640625, 3.725830078125, 3.99609375, 4.266357421875, 4.53662109375, 4.806884765625, 5.0771484375, 5.347412109375, 5.61767578125, 5.887939453125, 6.158203125, 6.428466796875, 6.69873046875, 6.968994140625, 7.2392578125, 7.509521484375, 7.77978515625, 8.050048828125, 8.3203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 7.0, 13.0, 12.0, 12.0, 12.0, 23.0, 30.0, 34.0, 32.0, 50.0, 48.0, 72.0, 67.0, 61.0, 64.0, 56.0, 75.0, 69.0, 48.0, 38.0, 28.0, 25.0, 16.0, 18.0, 14.0, 8.0, 18.0, 8.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.55126953125, -4.3837890625, -4.21630859375, -4.048828125, -3.88134765625, -3.7138671875, -3.54638671875, -3.37890625, -3.21142578125, -3.0439453125, -2.87646484375, -2.708984375, -2.54150390625, -2.3740234375, -2.20654296875, -2.0390625, -1.87158203125, -1.7041015625, -1.53662109375, -1.369140625, -1.20166015625, -1.0341796875, -0.86669921875, -0.69921875, -0.53173828125, -0.3642578125, -0.19677734375, -0.029296875, 0.13818359375, 0.3056640625, 0.47314453125, 0.640625, 0.80810546875, 0.9755859375, 1.14306640625, 1.310546875, 1.47802734375, 1.6455078125, 1.81298828125, 1.98046875, 2.14794921875, 2.3154296875, 2.48291015625, 2.650390625, 2.81787109375, 2.9853515625, 3.15283203125, 3.3203125, 3.48779296875, 3.6552734375, 3.82275390625, 3.990234375, 4.15771484375, 4.3251953125, 4.49267578125, 4.66015625, 4.82763671875, 4.9951171875, 5.16259765625, 5.330078125, 5.49755859375, 5.6650390625, 5.83251953125, 6.0]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 14.0, 28.0, 67.0, 117.0, 202.0, 208.0, 163.0, 114.0, 38.0, 25.0, 10.0, 7.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.2626953125, -342.99365234375, -335.724609375, -328.45556640625, -321.1864929199219, -313.9174499511719, -306.6484069824219, -299.3793640136719, -292.1103210449219, -284.8412780761719, -277.5722351074219, -270.30316162109375, -263.03411865234375, -255.76507568359375, -248.49603271484375, -241.22698974609375, -233.9579315185547, -226.6888885498047, -219.41983032226562, -212.15078735351562, -204.88174438476562, -197.61270141601562, -190.34364318847656, -183.07460021972656, -175.8055419921875, -168.5364990234375, -161.26744079589844, -153.99839782714844, -146.72935485839844, -139.46029663085938, -132.19125366210938, -124.92221069335938, -117.65316009521484, -110.38410949707031, -103.11506652832031, -95.84601593017578, -88.57696533203125, -81.30792236328125, -74.03887176513672, -66.76982116699219, -59.50077819824219, -52.23173141479492, -44.962684631347656, -37.693634033203125, -30.42458724975586, -23.155540466308594, -15.886489868164062, -8.617443084716797, -1.3483963012695312, 5.920651435852051, 13.189699172973633, 20.45874786376953, 27.727794647216797, 34.99684143066406, 42.265892028808594, 49.53493881225586, 56.803985595703125, 64.07303619384766, 71.34207916259766, 78.61112976074219, 85.88017272949219, 93.14922332763672, 100.41827392578125, 107.68731689453125, 114.95636749267578]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 17.0, 8.0, 16.0, 17.0, 18.0, 15.0, 24.0, 34.0, 35.0, 41.0, 44.0, 53.0, 44.0, 52.0, 58.0, 48.0, 59.0, 53.0, 46.0, 36.0, 30.0, 38.0, 28.0, 28.0, 34.0, 23.0, 15.0, 17.0, 16.0, 7.0, 5.0, 4.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-83.4207763671875, -80.5611801147461, -77.70158386230469, -74.84198760986328, -71.98239135742188, -69.12278747558594, -66.26319885253906, -63.403594970703125, -60.54399871826172, -57.68440246582031, -54.824806213378906, -51.9652099609375, -49.10560989379883, -46.24601364135742, -43.386417388916016, -40.526817321777344, -37.6672248840332, -34.8076286315918, -31.948030471801758, -29.08843421936035, -26.228836059570312, -23.369239807128906, -20.5096435546875, -17.65004539489746, -14.790449142456055, -11.930851936340332, -9.07125473022461, -6.211658477783203, -3.3520612716674805, -0.4924640655517578, 2.3671321868896484, 5.2267303466796875, 8.086326599121094, 10.945923805236816, 13.805521011352539, 16.665117263793945, 19.524715423583984, 22.38431167602539, 25.243907928466797, 28.103506088256836, 30.963102340698242, 33.82270050048828, 36.68229675292969, 39.541893005371094, 42.4014892578125, 45.261085510253906, 48.12068176269531, 50.980281829833984, 53.83987808227539, 56.6994743347168, 59.5590705871582, 62.418670654296875, 65.27826690673828, 68.13786315917969, 70.9974594116211, 73.8570556640625, 76.7166519165039, 79.57624816894531, 82.43584442138672, 85.29544067382812, 88.15503692626953, 91.01463317871094, 93.87423706054688, 96.73383331298828, 99.59342956542969]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 5.0, 6.0, 10.0, 15.0, 21.0, 19.0, 40.0, 62.0, 94.0, 158.0, 218.0, 413.0, 669.0, 1240.0, 2376.0, 4768.0, 10230.0, 23543.0, 64721.0, 259439.0, 2578862.0, 1032371.0, 141509.0, 42068.0, 16479.0, 7227.0, 3536.0, 1791.0, 883.0, 568.0, 300.0, 205.0, 132.0, 81.0, 52.0, 54.0, 32.0, 21.0, 13.0, 15.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.92401123046875, -6.6331787109375, -6.34234619140625, -6.051513671875, -5.76068115234375, -5.4698486328125, -5.17901611328125, -4.88818359375, -4.59735107421875, -4.3065185546875, -4.01568603515625, -3.724853515625, -3.43402099609375, -3.1431884765625, -2.85235595703125, -2.5615234375, -2.27069091796875, -1.9798583984375, -1.68902587890625, -1.398193359375, -1.10736083984375, -0.8165283203125, -0.52569580078125, -0.23486328125, 0.05596923828125, 0.3468017578125, 0.63763427734375, 0.928466796875, 1.21929931640625, 1.5101318359375, 1.80096435546875, 2.091796875, 2.38262939453125, 2.6734619140625, 2.96429443359375, 3.255126953125, 3.54595947265625, 3.8367919921875, 4.12762451171875, 4.41845703125, 4.70928955078125, 5.0001220703125, 5.29095458984375, 5.581787109375, 5.87261962890625, 6.1634521484375, 6.45428466796875, 6.7451171875, 7.03594970703125, 7.3267822265625, 7.61761474609375, 7.908447265625, 8.19927978515625, 8.4901123046875, 8.78094482421875, 9.07177734375, 9.36260986328125, 9.6534423828125, 9.94427490234375, 10.235107421875, 10.52593994140625, 10.8167724609375, 11.10760498046875, 11.3984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 7.0, 8.0, 5.0, 13.0, 18.0, 24.0, 26.0, 34.0, 32.0, 41.0, 53.0, 46.0, 46.0, 77.0, 57.0, 68.0, 56.0, 61.0, 41.0, 50.0, 49.0, 31.0, 30.0, 27.0, 20.0, 26.0, 13.0, 15.0, 8.0, 4.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.34375, -4.16455078125, -3.9853515625, -3.80615234375, -3.626953125, -3.44775390625, -3.2685546875, -3.08935546875, -2.91015625, -2.73095703125, -2.5517578125, -2.37255859375, -2.193359375, -2.01416015625, -1.8349609375, -1.65576171875, -1.4765625, -1.29736328125, -1.1181640625, -0.93896484375, -0.759765625, -0.58056640625, -0.4013671875, -0.22216796875, -0.04296875, 0.13623046875, 0.3154296875, 0.49462890625, 0.673828125, 0.85302734375, 1.0322265625, 1.21142578125, 1.390625, 1.56982421875, 1.7490234375, 1.92822265625, 2.107421875, 2.28662109375, 2.4658203125, 2.64501953125, 2.82421875, 3.00341796875, 3.1826171875, 3.36181640625, 3.541015625, 3.72021484375, 3.8994140625, 4.07861328125, 4.2578125, 4.43701171875, 4.6162109375, 4.79541015625, 4.974609375, 5.15380859375, 5.3330078125, 5.51220703125, 5.69140625, 5.87060546875, 6.0498046875, 6.22900390625, 6.408203125, 6.58740234375, 6.7666015625, 6.94580078125, 7.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 24.0, 28.0, 47.0, 95.0, 200.0, 375.0, 1060.0, 3148.0, 11401.0, 54108.0, 597135.0, 3340933.0, 151927.0, 24324.0, 6180.0, 1964.0, 697.0, 266.0, 128.0, 77.0, 46.0, 20.0, 16.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.5848388671875, -19.044677734375, -18.5045166015625, -17.96435546875, -17.4241943359375, -16.884033203125, -16.3438720703125, -15.8037109375, -15.2635498046875, -14.723388671875, -14.1832275390625, -13.64306640625, -13.1029052734375, -12.562744140625, -12.0225830078125, -11.482421875, -10.9422607421875, -10.402099609375, -9.8619384765625, -9.32177734375, -8.7816162109375, -8.241455078125, -7.7012939453125, -7.1611328125, -6.6209716796875, -6.080810546875, -5.5406494140625, -5.00048828125, -4.4603271484375, -3.920166015625, -3.3800048828125, -2.83984375, -2.2996826171875, -1.759521484375, -1.2193603515625, -0.67919921875, -0.1390380859375, 0.401123046875, 0.9412841796875, 1.4814453125, 2.0216064453125, 2.561767578125, 3.1019287109375, 3.64208984375, 4.1822509765625, 4.722412109375, 5.2625732421875, 5.802734375, 6.3428955078125, 6.883056640625, 7.4232177734375, 7.96337890625, 8.5035400390625, 9.043701171875, 9.5838623046875, 10.1240234375, 10.6641845703125, 11.204345703125, 11.7445068359375, 12.28466796875, 12.8248291015625, 13.364990234375, 13.9051513671875, 14.4453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 17.0, 20.0, 30.0, 31.0, 51.0, 82.0, 117.0, 190.0, 267.0, 567.0, 947.0, 679.0, 358.0, 213.0, 144.0, 82.0, 56.0, 44.0, 28.0, 24.0, 13.0, 13.0, 13.0, 13.0, 10.0, 4.0, 10.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.2421875, -11.8553466796875, -11.468505859375, -11.0816650390625, -10.69482421875, -10.3079833984375, -9.921142578125, -9.5343017578125, -9.1474609375, -8.7606201171875, -8.373779296875, -7.9869384765625, -7.60009765625, -7.2132568359375, -6.826416015625, -6.4395751953125, -6.052734375, -5.6658935546875, -5.279052734375, -4.8922119140625, -4.50537109375, -4.1185302734375, -3.731689453125, -3.3448486328125, -2.9580078125, -2.5711669921875, -2.184326171875, -1.7974853515625, -1.41064453125, -1.0238037109375, -0.636962890625, -0.2501220703125, 0.13671875, 0.5235595703125, 0.910400390625, 1.2972412109375, 1.68408203125, 2.0709228515625, 2.457763671875, 2.8446044921875, 3.2314453125, 3.6182861328125, 4.005126953125, 4.3919677734375, 4.77880859375, 5.1656494140625, 5.552490234375, 5.9393310546875, 6.326171875, 6.7130126953125, 7.099853515625, 7.4866943359375, 7.87353515625, 8.2603759765625, 8.647216796875, 9.0340576171875, 9.4208984375, 9.8077392578125, 10.194580078125, 10.5814208984375, 10.96826171875, 11.3551025390625, 11.741943359375, 12.1287841796875, 12.515625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 12.0, 24.0, 37.0, 95.0, 216.0, 271.0, 193.0, 72.0, 34.0, 19.0, 5.0, 11.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.68299865722656, -107.0890121459961, -100.49502563476562, -93.90104675292969, -87.30706024169922, -80.71307373046875, -74.11909484863281, -67.52510833740234, -60.931121826171875, -54.337135314941406, -47.7431526184082, -41.149169921875, -34.55518341064453, -27.961196899414062, -21.36721420288086, -14.773231506347656, -8.179244995117188, -1.5852603912353516, 5.008724212646484, 11.60270881652832, 18.196693420410156, 24.790679931640625, 31.384662628173828, 37.97864532470703, 44.5726318359375, 51.16661834716797, 57.76060104370117, 64.35458374023438, 70.94857025146484, 77.54255676269531, 84.13653564453125, 90.73052215576172, 97.32452392578125, 103.91851043701172, 110.51249694824219, 117.10647583007812, 123.7004623413086, 130.29444885253906, 136.888427734375, 143.482421875, 150.07640075683594, 156.67037963867188, 163.26437377929688, 169.8583526611328, 176.45233154296875, 183.04632568359375, 189.6403045654297, 196.23428344726562, 202.82827758789062, 209.42225646972656, 216.01625061035156, 222.6102294921875, 229.2042236328125, 235.79820251464844, 242.39218139648438, 248.98617553710938, 255.5801544189453, 262.17413330078125, 268.76812744140625, 275.36212158203125, 281.9560852050781, 288.5500793457031, 295.1440734863281, 301.738037109375, 308.33203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 13.0, 5.0, 8.0, 14.0, 10.0, 18.0, 22.0, 25.0, 22.0, 25.0, 32.0, 34.0, 37.0, 37.0, 41.0, 36.0, 43.0, 52.0, 50.0, 43.0, 45.0, 46.0, 42.0, 30.0, 31.0, 53.0, 28.0, 18.0, 16.0, 27.0, 16.0, 11.0, 20.0, 11.0, 5.0, 7.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.31375122070312, -68.34270477294922, -66.37165832519531, -64.4006118774414, -62.429569244384766, -60.45852279663086, -58.48748016357422, -56.51643371582031, -54.545387268066406, -52.5743408203125, -50.603294372558594, -48.63225173950195, -46.66120529174805, -44.69015884399414, -42.7191162109375, -40.748069763183594, -38.77702331542969, -36.80597686767578, -34.834930419921875, -32.863887786865234, -30.892841339111328, -28.921794891357422, -26.95075035095215, -24.979705810546875, -23.00865936279297, -21.037612915039062, -19.06656837463379, -17.095523834228516, -15.12447738647461, -13.15343189239502, -11.18238639831543, -9.21134090423584, -7.24029541015625, -5.26924991607666, -3.2982044219970703, -1.3271589279174805, 0.6438865661621094, 2.614932060241699, 4.585977554321289, 6.557023048400879, 8.528068542480469, 10.499114036560059, 12.470159530639648, 14.441205024719238, 16.412250518798828, 18.383296966552734, 20.354341506958008, 22.32538604736328, 24.296432495117188, 26.267478942871094, 28.238523483276367, 30.20956802368164, 32.18061447143555, 34.15166091918945, 36.122703552246094, 38.09375, 40.064796447753906, 42.03584289550781, 44.00688934326172, 45.97793197631836, 47.948978424072266, 49.92002487182617, 51.89106750488281, 53.86211395263672, 55.833160400390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 10.0, 15.0, 17.0, 26.0, 38.0, 81.0, 150.0, 213.0, 401.0, 770.0, 1499.0, 3062.0, 7076.0, 17537.0, 49133.0, 147556.0, 454754.0, 247304.0, 74369.0, 25992.0, 10026.0, 4299.0, 2026.0, 998.0, 504.0, 271.0, 163.0, 104.0, 57.0, 30.0, 21.0, 10.0, 11.0, 5.0, 3.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.664794921875, -11.24365234375, -10.822509765625, -10.4013671875, -9.980224609375, -9.55908203125, -9.137939453125, -8.716796875, -8.295654296875, -7.87451171875, -7.453369140625, -7.0322265625, -6.611083984375, -6.18994140625, -5.768798828125, -5.34765625, -4.926513671875, -4.50537109375, -4.084228515625, -3.6630859375, -3.241943359375, -2.82080078125, -2.399658203125, -1.978515625, -1.557373046875, -1.13623046875, -0.715087890625, -0.2939453125, 0.127197265625, 0.54833984375, 0.969482421875, 1.390625, 1.811767578125, 2.23291015625, 2.654052734375, 3.0751953125, 3.496337890625, 3.91748046875, 4.338623046875, 4.759765625, 5.180908203125, 5.60205078125, 6.023193359375, 6.4443359375, 6.865478515625, 7.28662109375, 7.707763671875, 8.12890625, 8.550048828125, 8.97119140625, 9.392333984375, 9.8134765625, 10.234619140625, 10.65576171875, 11.076904296875, 11.498046875, 11.919189453125, 12.34033203125, 12.761474609375, 13.1826171875, 13.603759765625, 14.02490234375, 14.446044921875, 14.8671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 7.0, 9.0, 5.0, 8.0, 21.0, 22.0, 24.0, 29.0, 42.0, 33.0, 39.0, 55.0, 50.0, 53.0, 57.0, 66.0, 72.0, 54.0, 52.0, 53.0, 41.0, 53.0, 35.0, 20.0, 17.0, 25.0, 21.0, 12.0, 14.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.27947998046875, -4.0980224609375, -3.91656494140625, -3.735107421875, -3.55364990234375, -3.3721923828125, -3.19073486328125, -3.00927734375, -2.82781982421875, -2.6463623046875, -2.46490478515625, -2.283447265625, -2.10198974609375, -1.9205322265625, -1.73907470703125, -1.5576171875, -1.37615966796875, -1.1947021484375, -1.01324462890625, -0.831787109375, -0.65032958984375, -0.4688720703125, -0.28741455078125, -0.10595703125, 0.07550048828125, 0.2569580078125, 0.43841552734375, 0.619873046875, 0.80133056640625, 0.9827880859375, 1.16424560546875, 1.345703125, 1.52716064453125, 1.7086181640625, 1.89007568359375, 2.071533203125, 2.25299072265625, 2.4344482421875, 2.61590576171875, 2.79736328125, 2.97882080078125, 3.1602783203125, 3.34173583984375, 3.523193359375, 3.70465087890625, 3.8861083984375, 4.06756591796875, 4.2490234375, 4.43048095703125, 4.6119384765625, 4.79339599609375, 4.974853515625, 5.15631103515625, 5.3377685546875, 5.51922607421875, 5.70068359375, 5.88214111328125, 6.0635986328125, 6.24505615234375, 6.426513671875, 6.60797119140625, 6.7894287109375, 6.97088623046875, 7.15234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 11.0, 18.0, 23.0, 30.0, 57.0, 67.0, 99.0, 127.0, 248.0, 375.0, 737.0, 1498.0, 3860.0, 19586.0, 253895.0, 715485.0, 42105.0, 6228.0, 1935.0, 895.0, 427.0, 290.0, 195.0, 108.0, 65.0, 49.0, 36.0, 32.0, 23.0, 12.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.078125, -21.234619140625, -20.39111328125, -19.547607421875, -18.7041015625, -17.860595703125, -17.01708984375, -16.173583984375, -15.330078125, -14.486572265625, -13.64306640625, -12.799560546875, -11.9560546875, -11.112548828125, -10.26904296875, -9.425537109375, -8.58203125, -7.738525390625, -6.89501953125, -6.051513671875, -5.2080078125, -4.364501953125, -3.52099609375, -2.677490234375, -1.833984375, -0.990478515625, -0.14697265625, 0.696533203125, 1.5400390625, 2.383544921875, 3.22705078125, 4.070556640625, 4.9140625, 5.757568359375, 6.60107421875, 7.444580078125, 8.2880859375, 9.131591796875, 9.97509765625, 10.818603515625, 11.662109375, 12.505615234375, 13.34912109375, 14.192626953125, 15.0361328125, 15.879638671875, 16.72314453125, 17.566650390625, 18.41015625, 19.253662109375, 20.09716796875, 20.940673828125, 21.7841796875, 22.627685546875, 23.47119140625, 24.314697265625, 25.158203125, 26.001708984375, 26.84521484375, 27.688720703125, 28.5322265625, 29.375732421875, 30.21923828125, 31.062744140625, 31.90625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 4.0, 9.0, 7.0, 9.0, 12.0, 16.0, 27.0, 20.0, 28.0, 38.0, 34.0, 41.0, 66.0, 40.0, 65.0, 49.0, 56.0, 53.0, 56.0, 58.0, 49.0, 41.0, 37.0, 41.0, 32.0, 21.0, 18.0, 17.0, 9.0, 9.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-29.78125, -29.025146484375, -28.26904296875, -27.512939453125, -26.7568359375, -26.000732421875, -25.24462890625, -24.488525390625, -23.732421875, -22.976318359375, -22.22021484375, -21.464111328125, -20.7080078125, -19.951904296875, -19.19580078125, -18.439697265625, -17.68359375, -16.927490234375, -16.17138671875, -15.415283203125, -14.6591796875, -13.903076171875, -13.14697265625, -12.390869140625, -11.634765625, -10.878662109375, -10.12255859375, -9.366455078125, -8.6103515625, -7.854248046875, -7.09814453125, -6.342041015625, -5.5859375, -4.829833984375, -4.07373046875, -3.317626953125, -2.5615234375, -1.805419921875, -1.04931640625, -0.293212890625, 0.462890625, 1.218994140625, 1.97509765625, 2.731201171875, 3.4873046875, 4.243408203125, 4.99951171875, 5.755615234375, 6.51171875, 7.267822265625, 8.02392578125, 8.780029296875, 9.5361328125, 10.292236328125, 11.04833984375, 11.804443359375, 12.560546875, 13.316650390625, 14.07275390625, 14.828857421875, 15.5849609375, 16.341064453125, 17.09716796875, 17.853271484375, 18.609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 15.0, 14.0, 23.0, 30.0, 50.0, 105.0, 166.0, 413.0, 1158.0, 4823.0, 40159.0, 811002.0, 174596.0, 12510.0, 2237.0, 639.0, 294.0, 136.0, 66.0, 27.0, 29.0, 20.0, 7.0, 7.0, 6.0, 4.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.0, -14.6026611328125, -14.205322265625, -13.8079833984375, -13.41064453125, -13.0133056640625, -12.615966796875, -12.2186279296875, -11.8212890625, -11.4239501953125, -11.026611328125, -10.6292724609375, -10.23193359375, -9.8345947265625, -9.437255859375, -9.0399169921875, -8.642578125, -8.2452392578125, -7.847900390625, -7.4505615234375, -7.05322265625, -6.6558837890625, -6.258544921875, -5.8612060546875, -5.4638671875, -5.0665283203125, -4.669189453125, -4.2718505859375, -3.87451171875, -3.4771728515625, -3.079833984375, -2.6824951171875, -2.28515625, -1.8878173828125, -1.490478515625, -1.0931396484375, -0.69580078125, -0.2984619140625, 0.098876953125, 0.4962158203125, 0.8935546875, 1.2908935546875, 1.688232421875, 2.0855712890625, 2.48291015625, 2.8802490234375, 3.277587890625, 3.6749267578125, 4.072265625, 4.4696044921875, 4.866943359375, 5.2642822265625, 5.66162109375, 6.0589599609375, 6.456298828125, 6.8536376953125, 7.2509765625, 7.6483154296875, 8.045654296875, 8.4429931640625, 8.84033203125, 9.2376708984375, 9.635009765625, 10.0323486328125, 10.4296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 3.0, 6.0, 3.0, 4.0, 8.0, 14.0, 11.0, 19.0, 14.0, 12.0, 18.0, 31.0, 37.0, 74.0, 106.0, 173.0, 150.0, 84.0, 49.0, 39.0, 28.0, 24.0, 18.0, 14.0, 15.0, 9.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013780593872070312, -0.0013283789157867432, -0.001278698444366455, -0.001229017972946167, -0.001179337501525879, -0.0011296570301055908, -0.0010799765586853027, -0.0010302960872650146, -0.0009806156158447266, -0.0009309351444244385, -0.0008812546730041504, -0.0008315742015838623, -0.0007818937301635742, -0.0007322132587432861, -0.000682532787322998, -0.00063285231590271, -0.0005831718444824219, -0.0005334913730621338, -0.0004838109016418457, -0.0004341304302215576, -0.00038444995880126953, -0.00033476948738098145, -0.00028508901596069336, -0.00023540854454040527, -0.0001857280731201172, -0.0001360476016998291, -8.636713027954102e-05, -3.668665885925293e-05, 1.2993812561035156e-05, 6.267428398132324e-05, 0.00011235475540161133, 0.00016203522682189941, 0.0002117156982421875, 0.0002613961696624756, 0.00031107664108276367, 0.00036075711250305176, 0.00041043758392333984, 0.00046011805534362793, 0.000509798526763916, 0.0005594789981842041, 0.0006091594696044922, 0.0006588399410247803, 0.0007085204124450684, 0.0007582008838653564, 0.0008078813552856445, 0.0008575618267059326, 0.0009072422981262207, 0.0009569227695465088, 0.0010066032409667969, 0.001056283712387085, 0.001105964183807373, 0.0011556446552276611, 0.0012053251266479492, 0.0012550055980682373, 0.0013046860694885254, 0.0013543665409088135, 0.0014040470123291016, 0.0014537274837493896, 0.0015034079551696777, 0.0015530884265899658, 0.001602768898010254, 0.001652449369430542, 0.00170212984085083, 0.0017518103122711182, 0.0018014907836914062]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 15.0, 22.0, 26.0, 34.0, 54.0, 105.0, 115.0, 164.0, 299.0, 585.0, 1031.0, 2349.0, 7500.0, 40156.0, 487434.0, 457646.0, 38768.0, 7431.0, 2373.0, 1014.0, 519.0, 330.0, 190.0, 120.0, 71.0, 54.0, 32.0, 28.0, 17.0, 10.0, 10.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5859375, -8.2996826171875, -8.013427734375, -7.7271728515625, -7.44091796875, -7.1546630859375, -6.868408203125, -6.5821533203125, -6.2958984375, -6.0096435546875, -5.723388671875, -5.4371337890625, -5.15087890625, -4.8646240234375, -4.578369140625, -4.2921142578125, -4.005859375, -3.7196044921875, -3.433349609375, -3.1470947265625, -2.86083984375, -2.5745849609375, -2.288330078125, -2.0020751953125, -1.7158203125, -1.4295654296875, -1.143310546875, -0.8570556640625, -0.57080078125, -0.2845458984375, 0.001708984375, 0.2879638671875, 0.57421875, 0.8604736328125, 1.146728515625, 1.4329833984375, 1.71923828125, 2.0054931640625, 2.291748046875, 2.5780029296875, 2.8642578125, 3.1505126953125, 3.436767578125, 3.7230224609375, 4.00927734375, 4.2955322265625, 4.581787109375, 4.8680419921875, 5.154296875, 5.4405517578125, 5.726806640625, 6.0130615234375, 6.29931640625, 6.5855712890625, 6.871826171875, 7.1580810546875, 7.4443359375, 7.7305908203125, 8.016845703125, 8.3031005859375, 8.58935546875, 8.8756103515625, 9.161865234375, 9.4481201171875, 9.734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 5.0, 8.0, 22.0, 12.0, 12.0, 18.0, 17.0, 22.0, 30.0, 33.0, 48.0, 56.0, 57.0, 55.0, 56.0, 83.0, 70.0, 70.0, 53.0, 35.0, 38.0, 37.0, 25.0, 21.0, 13.0, 11.0, 8.0, 16.0, 9.0, 7.0, 5.0, 2.0, 5.0, 4.0, 6.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4715576171875, -4.310302734375, -4.1490478515625, -3.98779296875, -3.8265380859375, -3.665283203125, -3.5040283203125, -3.3427734375, -3.1815185546875, -3.020263671875, -2.8590087890625, -2.69775390625, -2.5364990234375, -2.375244140625, -2.2139892578125, -2.052734375, -1.8914794921875, -1.730224609375, -1.5689697265625, -1.40771484375, -1.2464599609375, -1.085205078125, -0.9239501953125, -0.7626953125, -0.6014404296875, -0.440185546875, -0.2789306640625, -0.11767578125, 0.0435791015625, 0.204833984375, 0.3660888671875, 0.52734375, 0.6885986328125, 0.849853515625, 1.0111083984375, 1.17236328125, 1.3336181640625, 1.494873046875, 1.6561279296875, 1.8173828125, 1.9786376953125, 2.139892578125, 2.3011474609375, 2.46240234375, 2.6236572265625, 2.784912109375, 2.9461669921875, 3.107421875, 3.2686767578125, 3.429931640625, 3.5911865234375, 3.75244140625, 3.9136962890625, 4.074951171875, 4.2362060546875, 4.3974609375, 4.5587158203125, 4.719970703125, 4.8812255859375, 5.04248046875, 5.2037353515625, 5.364990234375, 5.5262451171875, 5.6875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 31.0, 64.0, 118.0, 228.0, 228.0, 147.0, 95.0, 38.0, 17.0, 13.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.19520568847656, -146.1154327392578, -140.03565979003906, -133.95590209960938, -127.87612915039062, -121.79635620117188, -115.71658325195312, -109.63681030273438, -103.55704498291016, -97.4772720336914, -91.39750671386719, -85.31773376464844, -79.23796081542969, -73.15819549560547, -67.07842254638672, -60.998653411865234, -54.91888427734375, -48.839115142822266, -42.75934600830078, -36.67957305908203, -30.599803924560547, -24.520034790039062, -18.440261840820312, -12.360492706298828, -6.280723571777344, -0.20095348358154297, 5.878816604614258, 11.958587646484375, 18.03835678100586, 24.118125915527344, 30.197898864746094, 36.27766799926758, 42.35743713378906, 48.43720626831055, 54.51697540283203, 60.59674835205078, 66.676513671875, 72.75628662109375, 78.8360595703125, 84.91583251953125, 90.99559783935547, 97.07537078857422, 103.15513610839844, 109.23490905761719, 115.31468200683594, 121.39444732666016, 127.4742202758789, 133.55398559570312, 139.63375854492188, 145.71353149414062, 151.79330444335938, 157.87307739257812, 163.9528350830078, 170.03260803222656, 176.1123809814453, 182.19215393066406, 188.27191162109375, 194.3516845703125, 200.43145751953125, 206.51123046875, 212.5909881591797, 218.67076110839844, 224.7505340576172, 230.83030700683594, 236.9100799560547]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 15.0, 16.0, 11.0, 23.0, 20.0, 13.0, 21.0, 28.0, 29.0, 40.0, 29.0, 48.0, 42.0, 48.0, 63.0, 55.0, 65.0, 47.0, 47.0, 45.0, 36.0, 31.0, 30.0, 32.0, 26.0, 13.0, 27.0, 21.0, 15.0, 14.0, 13.0, 9.0, 1.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.97138977050781, -68.39381408691406, -65.81623840332031, -63.2386589050293, -60.66108322143555, -58.0835075378418, -55.50592803955078, -52.92835235595703, -50.35077667236328, -47.77320098876953, -45.19562530517578, -42.618045806884766, -40.040470123291016, -37.462894439697266, -34.88531494140625, -32.3077392578125, -29.73016357421875, -27.152587890625, -24.575010299682617, -21.997432708740234, -19.419857025146484, -16.842281341552734, -14.264703750610352, -11.687126159667969, -9.109550476074219, -6.531973838806152, -3.954397201538086, -1.3768205642700195, 1.2007560729980469, 3.7783327102661133, 6.35590934753418, 8.933486938476562, 11.511062622070312, 14.088639259338379, 16.666215896606445, 19.243793487548828, 21.821369171142578, 24.398944854736328, 26.97652244567871, 29.554100036621094, 32.131675720214844, 34.709251403808594, 37.286827087402344, 39.86440658569336, 42.44198226928711, 45.01955795288086, 47.597137451171875, 50.174713134765625, 52.752288818359375, 55.329864501953125, 57.907440185546875, 60.48501968383789, 63.06259536743164, 65.64017486572266, 68.2177505493164, 70.79532623291016, 73.3729019165039, 75.95047760009766, 78.5280532836914, 81.10562896728516, 83.68321228027344, 86.26078796386719, 88.83836364746094, 91.41593933105469, 93.99351501464844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 9.0, 9.0, 12.0, 17.0, 32.0, 30.0, 32.0, 54.0, 72.0, 85.0, 135.0, 162.0, 329.0, 1231.0, 11079.0, 2270857.0, 1897233.0, 10674.0, 1200.0, 335.0, 173.0, 135.0, 93.0, 60.0, 67.0, 43.0, 29.0, 14.0, 26.0, 12.0, 10.0, 6.0, 5.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-42.25, -41.137939453125, -40.02587890625, -38.913818359375, -37.8017578125, -36.689697265625, -35.57763671875, -34.465576171875, -33.353515625, -32.241455078125, -31.12939453125, -30.017333984375, -28.9052734375, -27.793212890625, -26.68115234375, -25.569091796875, -24.45703125, -23.344970703125, -22.23291015625, -21.120849609375, -20.0087890625, -18.896728515625, -17.78466796875, -16.672607421875, -15.560546875, -14.448486328125, -13.33642578125, -12.224365234375, -11.1123046875, -10.000244140625, -8.88818359375, -7.776123046875, -6.6640625, -5.552001953125, -4.43994140625, -3.327880859375, -2.2158203125, -1.103759765625, 0.00830078125, 1.120361328125, 2.232421875, 3.344482421875, 4.45654296875, 5.568603515625, 6.6806640625, 7.792724609375, 8.90478515625, 10.016845703125, 11.12890625, 12.240966796875, 13.35302734375, 14.465087890625, 15.5771484375, 16.689208984375, 17.80126953125, 18.913330078125, 20.025390625, 21.137451171875, 22.24951171875, 23.361572265625, 24.4736328125, 25.585693359375, 26.69775390625, 27.809814453125, 28.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 22.0, 33.0, 55.0, 57.0, 87.0, 113.0, 137.0, 137.0, 107.0, 88.0, 63.0, 42.0, 21.0, 14.0, 6.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.9405517578125, -11.576416015625, -11.2122802734375, -10.84814453125, -10.4840087890625, -10.119873046875, -9.7557373046875, -9.3916015625, -9.0274658203125, -8.663330078125, -8.2991943359375, -7.93505859375, -7.5709228515625, -7.206787109375, -6.8426513671875, -6.478515625, -6.1143798828125, -5.750244140625, -5.3861083984375, -5.02197265625, -4.6578369140625, -4.293701171875, -3.9295654296875, -3.5654296875, -3.2012939453125, -2.837158203125, -2.4730224609375, -2.10888671875, -1.7447509765625, -1.380615234375, -1.0164794921875, -0.65234375, -0.2882080078125, 0.075927734375, 0.4400634765625, 0.80419921875, 1.1683349609375, 1.532470703125, 1.8966064453125, 2.2607421875, 2.6248779296875, 2.989013671875, 3.3531494140625, 3.71728515625, 4.0814208984375, 4.445556640625, 4.8096923828125, 5.173828125, 5.5379638671875, 5.902099609375, 6.2662353515625, 6.63037109375, 6.9945068359375, 7.358642578125, 7.7227783203125, 8.0869140625, 8.4510498046875, 8.815185546875, 9.1793212890625, 9.54345703125, 9.9075927734375, 10.271728515625, 10.6358642578125, 11.0]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 20.0, 17.0, 30.0, 49.0, 95.0, 138.0, 261.0, 590.0, 1285.0, 3463.0, 11894.0, 56687.0, 924001.0, 3068882.0, 102290.0, 17233.0, 4519.0, 1510.0, 623.0, 264.0, 168.0, 103.0, 67.0, 35.0, 14.0, 18.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.439208984375, -14.90966796875, -14.380126953125, -13.8505859375, -13.321044921875, -12.79150390625, -12.261962890625, -11.732421875, -11.202880859375, -10.67333984375, -10.143798828125, -9.6142578125, -9.084716796875, -8.55517578125, -8.025634765625, -7.49609375, -6.966552734375, -6.43701171875, -5.907470703125, -5.3779296875, -4.848388671875, -4.31884765625, -3.789306640625, -3.259765625, -2.730224609375, -2.20068359375, -1.671142578125, -1.1416015625, -0.612060546875, -0.08251953125, 0.447021484375, 0.9765625, 1.506103515625, 2.03564453125, 2.565185546875, 3.0947265625, 3.624267578125, 4.15380859375, 4.683349609375, 5.212890625, 5.742431640625, 6.27197265625, 6.801513671875, 7.3310546875, 7.860595703125, 8.39013671875, 8.919677734375, 9.44921875, 9.978759765625, 10.50830078125, 11.037841796875, 11.5673828125, 12.096923828125, 12.62646484375, 13.156005859375, 13.685546875, 14.215087890625, 14.74462890625, 15.274169921875, 15.8037109375, 16.333251953125, 16.86279296875, 17.392333984375, 17.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 27.0, 32.0, 28.0, 52.0, 77.0, 114.0, 189.0, 337.0, 588.0, 952.0, 703.0, 382.0, 194.0, 123.0, 57.0, 50.0, 24.0, 27.0, 18.0, 12.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.4609375, -13.0926513671875, -12.724365234375, -12.3560791015625, -11.98779296875, -11.6195068359375, -11.251220703125, -10.8829345703125, -10.5146484375, -10.1463623046875, -9.778076171875, -9.4097900390625, -9.04150390625, -8.6732177734375, -8.304931640625, -7.9366455078125, -7.568359375, -7.2000732421875, -6.831787109375, -6.4635009765625, -6.09521484375, -5.7269287109375, -5.358642578125, -4.9903564453125, -4.6220703125, -4.2537841796875, -3.885498046875, -3.5172119140625, -3.14892578125, -2.7806396484375, -2.412353515625, -2.0440673828125, -1.67578125, -1.3074951171875, -0.939208984375, -0.5709228515625, -0.20263671875, 0.1656494140625, 0.533935546875, 0.9022216796875, 1.2705078125, 1.6387939453125, 2.007080078125, 2.3753662109375, 2.74365234375, 3.1119384765625, 3.480224609375, 3.8485107421875, 4.216796875, 4.5850830078125, 4.953369140625, 5.3216552734375, 5.68994140625, 6.0582275390625, 6.426513671875, 6.7947998046875, 7.1630859375, 7.5313720703125, 7.899658203125, 8.2679443359375, 8.63623046875, 9.0045166015625, 9.372802734375, 9.7410888671875, 10.109375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 6.0, 11.0, 11.0, 19.0, 33.0, 43.0, 76.0, 137.0, 165.0, 168.0, 123.0, 105.0, 53.0, 22.0, 14.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.77225494384766, -112.29562377929688, -108.81898498535156, -105.34235382080078, -101.86572265625, -98.38908386230469, -94.9124526977539, -91.43582153320312, -87.95918273925781, -84.48255157470703, -81.00591278076172, -77.52928161621094, -74.05265045166016, -70.57601928710938, -67.09938049316406, -63.62274932861328, -60.1461181640625, -56.66948318481445, -53.19285202026367, -49.716217041015625, -46.239585876464844, -42.7629508972168, -39.28631591796875, -35.80968475341797, -32.33304977416992, -28.856416702270508, -25.379783630371094, -21.903148651123047, -18.426515579223633, -14.949882507324219, -11.473247528076172, -7.996614456176758, -4.519989013671875, -1.0433554649353027, 2.4332780838012695, 5.909912109375, 9.386545181274414, 12.863178253173828, 16.339813232421875, 19.81644630432129, 23.293079376220703, 26.769712448120117, 30.24634552001953, 33.72298049926758, 37.199615478515625, 40.676246643066406, 44.15288162231445, 47.6295166015625, 51.10614776611328, 54.58278274536133, 58.05941390991211, 61.536048889160156, 65.01268005371094, 68.48931884765625, 71.96595001220703, 75.44258117675781, 78.91921997070312, 82.3958511352539, 85.87248992919922, 89.34912109375, 92.82575225830078, 96.30238342285156, 99.77902221679688, 103.25565338134766, 106.73228454589844]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 4.0, 7.0, 12.0, 16.0, 19.0, 14.0, 15.0, 31.0, 26.0, 34.0, 43.0, 55.0, 36.0, 38.0, 46.0, 53.0, 52.0, 54.0, 51.0, 57.0, 49.0, 45.0, 30.0, 29.0, 36.0, 26.0, 25.0, 21.0, 22.0, 14.0, 1.0, 12.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.971282958984375, -41.211490631103516, -39.45170211791992, -37.69190979003906, -35.93212127685547, -34.17232894897461, -32.412540435791016, -30.652748107910156, -28.892959594726562, -27.133169174194336, -25.37337875366211, -23.613588333129883, -21.853797912597656, -20.094005584716797, -18.334217071533203, -16.574424743652344, -14.814634323120117, -13.05484390258789, -11.295053482055664, -9.535263061523438, -7.775472164154053, -6.015681266784668, -4.255890846252441, -2.496100425720215, -0.7363100051879883, 1.0234805345535278, 2.783271074295044, 4.54306173324585, 6.302852153778076, 8.062643051147461, 9.822433471679688, 11.582223892211914, 13.34201431274414, 15.101804733276367, 16.861595153808594, 18.62138557434082, 20.381175994873047, 22.140968322753906, 23.9007568359375, 25.66054916381836, 27.420337677001953, 29.18012809753418, 30.939918518066406, 32.699710845947266, 34.45949935913086, 36.21929168701172, 37.97908020019531, 39.73887252807617, 41.49866485595703, 43.25845718383789, 45.018245697021484, 46.778038024902344, 48.53782653808594, 50.2976188659668, 52.05740737915039, 53.81719970703125, 55.576988220214844, 57.3367805480957, 59.0965690612793, 60.856361389160156, 62.61614990234375, 64.37593841552734, 66.13573455810547, 67.89552307128906, 69.65531158447266]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 6.0, 7.0, 22.0, 16.0, 20.0, 38.0, 70.0, 87.0, 152.0, 251.0, 501.0, 909.0, 1790.0, 3482.0, 7497.0, 16720.0, 40533.0, 112881.0, 354989.0, 334298.0, 106091.0, 38324.0, 15772.0, 7121.0, 3334.0, 1666.0, 843.0, 456.0, 271.0, 152.0, 85.0, 61.0, 22.0, 31.0, 6.0, 14.0, 9.0, 9.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-11.640625, -11.3077392578125, -10.974853515625, -10.6419677734375, -10.30908203125, -9.9761962890625, -9.643310546875, -9.3104248046875, -8.9775390625, -8.6446533203125, -8.311767578125, -7.9788818359375, -7.64599609375, -7.3131103515625, -6.980224609375, -6.6473388671875, -6.314453125, -5.9815673828125, -5.648681640625, -5.3157958984375, -4.98291015625, -4.6500244140625, -4.317138671875, -3.9842529296875, -3.6513671875, -3.3184814453125, -2.985595703125, -2.6527099609375, -2.31982421875, -1.9869384765625, -1.654052734375, -1.3211669921875, -0.98828125, -0.6553955078125, -0.322509765625, 0.0103759765625, 0.34326171875, 0.6761474609375, 1.009033203125, 1.3419189453125, 1.6748046875, 2.0076904296875, 2.340576171875, 2.6734619140625, 3.00634765625, 3.3392333984375, 3.672119140625, 4.0050048828125, 4.337890625, 4.6707763671875, 5.003662109375, 5.3365478515625, 5.66943359375, 6.0023193359375, 6.335205078125, 6.6680908203125, 7.0009765625, 7.3338623046875, 7.666748046875, 7.9996337890625, 8.33251953125, 8.6654052734375, 8.998291015625, 9.3311767578125, 9.6640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 4.0, 6.0, 8.0, 16.0, 15.0, 17.0, 25.0, 33.0, 33.0, 31.0, 48.0, 56.0, 56.0, 65.0, 56.0, 67.0, 65.0, 52.0, 62.0, 60.0, 39.0, 33.0, 24.0, 38.0, 24.0, 17.0, 12.0, 11.0, 11.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.67578125, -4.49151611328125, -4.3072509765625, -4.12298583984375, -3.938720703125, -3.75445556640625, -3.5701904296875, -3.38592529296875, -3.20166015625, -3.01739501953125, -2.8331298828125, -2.64886474609375, -2.464599609375, -2.28033447265625, -2.0960693359375, -1.91180419921875, -1.7275390625, -1.54327392578125, -1.3590087890625, -1.17474365234375, -0.990478515625, -0.80621337890625, -0.6219482421875, -0.43768310546875, -0.25341796875, -0.06915283203125, 0.1151123046875, 0.29937744140625, 0.483642578125, 0.66790771484375, 0.8521728515625, 1.03643798828125, 1.220703125, 1.40496826171875, 1.5892333984375, 1.77349853515625, 1.957763671875, 2.14202880859375, 2.3262939453125, 2.51055908203125, 2.69482421875, 2.87908935546875, 3.0633544921875, 3.24761962890625, 3.431884765625, 3.61614990234375, 3.8004150390625, 3.98468017578125, 4.1689453125, 4.35321044921875, 4.5374755859375, 4.72174072265625, 4.906005859375, 5.09027099609375, 5.2745361328125, 5.45880126953125, 5.64306640625, 5.82733154296875, 6.0115966796875, 6.19586181640625, 6.380126953125, 6.56439208984375, 6.7486572265625, 6.93292236328125, 7.1171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 10.0, 11.0, 12.0, 15.0, 28.0, 49.0, 66.0, 84.0, 165.0, 256.0, 376.0, 829.0, 1993.0, 6077.0, 28055.0, 215884.0, 697328.0, 77747.0, 13213.0, 3561.0, 1280.0, 642.0, 305.0, 190.0, 114.0, 85.0, 51.0, 36.0, 27.0, 20.0, 15.0, 9.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.212646484375, -16.58154296875, -15.950439453125, -15.3193359375, -14.688232421875, -14.05712890625, -13.426025390625, -12.794921875, -12.163818359375, -11.53271484375, -10.901611328125, -10.2705078125, -9.639404296875, -9.00830078125, -8.377197265625, -7.74609375, -7.114990234375, -6.48388671875, -5.852783203125, -5.2216796875, -4.590576171875, -3.95947265625, -3.328369140625, -2.697265625, -2.066162109375, -1.43505859375, -0.803955078125, -0.1728515625, 0.458251953125, 1.08935546875, 1.720458984375, 2.3515625, 2.982666015625, 3.61376953125, 4.244873046875, 4.8759765625, 5.507080078125, 6.13818359375, 6.769287109375, 7.400390625, 8.031494140625, 8.66259765625, 9.293701171875, 9.9248046875, 10.555908203125, 11.18701171875, 11.818115234375, 12.44921875, 13.080322265625, 13.71142578125, 14.342529296875, 14.9736328125, 15.604736328125, 16.23583984375, 16.866943359375, 17.498046875, 18.129150390625, 18.76025390625, 19.391357421875, 20.0224609375, 20.653564453125, 21.28466796875, 21.915771484375, 22.546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 12.0, 11.0, 9.0, 22.0, 20.0, 25.0, 27.0, 26.0, 33.0, 41.0, 38.0, 43.0, 31.0, 61.0, 44.0, 46.0, 55.0, 52.0, 35.0, 57.0, 46.0, 40.0, 30.0, 33.0, 27.0, 19.0, 18.0, 18.0, 10.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.421875, -16.849609375, -16.27734375, -15.705078125, -15.1328125, -14.560546875, -13.98828125, -13.416015625, -12.84375, -12.271484375, -11.69921875, -11.126953125, -10.5546875, -9.982421875, -9.41015625, -8.837890625, -8.265625, -7.693359375, -7.12109375, -6.548828125, -5.9765625, -5.404296875, -4.83203125, -4.259765625, -3.6875, -3.115234375, -2.54296875, -1.970703125, -1.3984375, -0.826171875, -0.25390625, 0.318359375, 0.890625, 1.462890625, 2.03515625, 2.607421875, 3.1796875, 3.751953125, 4.32421875, 4.896484375, 5.46875, 6.041015625, 6.61328125, 7.185546875, 7.7578125, 8.330078125, 8.90234375, 9.474609375, 10.046875, 10.619140625, 11.19140625, 11.763671875, 12.3359375, 12.908203125, 13.48046875, 14.052734375, 14.625, 15.197265625, 15.76953125, 16.341796875, 16.9140625, 17.486328125, 18.05859375, 18.630859375, 19.203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 18.0, 25.0, 32.0, 67.0, 140.0, 293.0, 685.0, 3259.0, 26242.0, 719726.0, 281572.0, 13345.0, 2070.0, 541.0, 233.0, 104.0, 54.0, 32.0, 21.0, 15.0, 11.0, 8.0, 7.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.8985595703125, -9.515869140625, -9.1331787109375, -8.75048828125, -8.3677978515625, -7.985107421875, -7.6024169921875, -7.2197265625, -6.8370361328125, -6.454345703125, -6.0716552734375, -5.68896484375, -5.3062744140625, -4.923583984375, -4.5408935546875, -4.158203125, -3.7755126953125, -3.392822265625, -3.0101318359375, -2.62744140625, -2.2447509765625, -1.862060546875, -1.4793701171875, -1.0966796875, -0.7139892578125, -0.331298828125, 0.0513916015625, 0.43408203125, 0.8167724609375, 1.199462890625, 1.5821533203125, 1.96484375, 2.3475341796875, 2.730224609375, 3.1129150390625, 3.49560546875, 3.8782958984375, 4.260986328125, 4.6436767578125, 5.0263671875, 5.4090576171875, 5.791748046875, 6.1744384765625, 6.55712890625, 6.9398193359375, 7.322509765625, 7.7052001953125, 8.087890625, 8.4705810546875, 8.853271484375, 9.2359619140625, 9.61865234375, 10.0013427734375, 10.384033203125, 10.7667236328125, 11.1494140625, 11.5321044921875, 11.914794921875, 12.2974853515625, 12.68017578125, 13.0628662109375, 13.445556640625, 13.8282470703125, 14.2109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 13.0, 12.0, 20.0, 48.0, 114.0, 262.0, 291.0, 114.0, 54.0, 30.0, 18.0, 6.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003963470458984375, -0.0038565993309020996, -0.0037497282028198242, -0.003642857074737549, -0.0035359859466552734, -0.003429114818572998, -0.0033222436904907227, -0.0032153725624084473, -0.003108501434326172, -0.0030016303062438965, -0.002894759178161621, -0.0027878880500793457, -0.0026810169219970703, -0.002574145793914795, -0.0024672746658325195, -0.002360403537750244, -0.0022535324096679688, -0.0021466612815856934, -0.002039790153503418, -0.0019329190254211426, -0.0018260478973388672, -0.0017191767692565918, -0.0016123056411743164, -0.001505434513092041, -0.0013985633850097656, -0.0012916922569274902, -0.0011848211288452148, -0.0010779500007629395, -0.0009710788726806641, -0.0008642077445983887, -0.0007573366165161133, -0.0006504654884338379, -0.0005435943603515625, -0.0004367232322692871, -0.0003298521041870117, -0.00022298097610473633, -0.00011610984802246094, -9.238719940185547e-06, 9.763240814208984e-05, 0.00020450353622436523, 0.0003113746643066406, 0.000418245792388916, 0.0005251169204711914, 0.0006319880485534668, 0.0007388591766357422, 0.0008457303047180176, 0.000952601432800293, 0.0010594725608825684, 0.0011663436889648438, 0.0012732148170471191, 0.0013800859451293945, 0.00148695707321167, 0.0015938282012939453, 0.0017006993293762207, 0.001807570457458496, 0.0019144415855407715, 0.002021312713623047, 0.0021281838417053223, 0.0022350549697875977, 0.002341926097869873, 0.0024487972259521484, 0.002555668354034424, 0.0026625394821166992, 0.0027694106101989746, 0.00287628173828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 11.0, 18.0, 29.0, 50.0, 82.0, 164.0, 268.0, 651.0, 1603.0, 5396.0, 33723.0, 617344.0, 359321.0, 23113.0, 4306.0, 1334.0, 531.0, 282.0, 125.0, 67.0, 48.0, 25.0, 13.0, 13.0, 12.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1749267578125, -8.857666015625, -8.5404052734375, -8.22314453125, -7.9058837890625, -7.588623046875, -7.2713623046875, -6.9541015625, -6.6368408203125, -6.319580078125, -6.0023193359375, -5.68505859375, -5.3677978515625, -5.050537109375, -4.7332763671875, -4.416015625, -4.0987548828125, -3.781494140625, -3.4642333984375, -3.14697265625, -2.8297119140625, -2.512451171875, -2.1951904296875, -1.8779296875, -1.5606689453125, -1.243408203125, -0.9261474609375, -0.60888671875, -0.2916259765625, 0.025634765625, 0.3428955078125, 0.66015625, 0.9774169921875, 1.294677734375, 1.6119384765625, 1.92919921875, 2.2464599609375, 2.563720703125, 2.8809814453125, 3.1982421875, 3.5155029296875, 3.832763671875, 4.1500244140625, 4.46728515625, 4.7845458984375, 5.101806640625, 5.4190673828125, 5.736328125, 6.0535888671875, 6.370849609375, 6.6881103515625, 7.00537109375, 7.3226318359375, 7.639892578125, 7.9571533203125, 8.2744140625, 8.5916748046875, 8.908935546875, 9.2261962890625, 9.54345703125, 9.8607177734375, 10.177978515625, 10.4952392578125, 10.8125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 3.0, 4.0, 9.0, 12.0, 17.0, 19.0, 21.0, 29.0, 45.0, 68.0, 69.0, 85.0, 97.0, 87.0, 88.0, 85.0, 66.0, 55.0, 34.0, 30.0, 24.0, 14.0, 8.0, 5.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9454345703125, -5.750244140625, -5.5550537109375, -5.35986328125, -5.1646728515625, -4.969482421875, -4.7742919921875, -4.5791015625, -4.3839111328125, -4.188720703125, -3.9935302734375, -3.79833984375, -3.6031494140625, -3.407958984375, -3.2127685546875, -3.017578125, -2.8223876953125, -2.627197265625, -2.4320068359375, -2.23681640625, -2.0416259765625, -1.846435546875, -1.6512451171875, -1.4560546875, -1.2608642578125, -1.065673828125, -0.8704833984375, -0.67529296875, -0.4801025390625, -0.284912109375, -0.0897216796875, 0.10546875, 0.3006591796875, 0.495849609375, 0.6910400390625, 0.88623046875, 1.0814208984375, 1.276611328125, 1.4718017578125, 1.6669921875, 1.8621826171875, 2.057373046875, 2.2525634765625, 2.44775390625, 2.6429443359375, 2.838134765625, 3.0333251953125, 3.228515625, 3.4237060546875, 3.618896484375, 3.8140869140625, 4.00927734375, 4.2044677734375, 4.399658203125, 4.5948486328125, 4.7900390625, 4.9852294921875, 5.180419921875, 5.3756103515625, 5.57080078125, 5.7659912109375, 5.961181640625, 6.1563720703125, 6.3515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 4.0, 7.0, 20.0, 37.0, 61.0, 95.0, 124.0, 175.0, 169.0, 114.0, 66.0, 39.0, 38.0, 12.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-131.46990966796875, -127.91560363769531, -124.3613052368164, -120.80699920654297, -117.25269317626953, -113.69839477539062, -110.14408874511719, -106.58978271484375, -103.03548431396484, -99.4811782836914, -95.9268798828125, -92.37257385253906, -88.81826782226562, -85.26396942138672, -81.70966339111328, -78.15536499023438, -74.60105895996094, -71.0467529296875, -67.4924545288086, -63.938148498535156, -60.383846282958984, -56.82954406738281, -53.275238037109375, -49.7209358215332, -46.1666259765625, -42.61232376098633, -39.05801773071289, -35.50371551513672, -31.949413299560547, -28.395109176635742, -24.840805053710938, -21.286502838134766, -17.732200622558594, -14.177897453308105, -10.623594284057617, -7.0692901611328125, -3.514986991882324, 0.03931617736816406, 3.5936203002929688, 7.147922515869141, 10.702226638793945, 14.256529808044434, 17.810832977294922, 21.365137100219727, 24.91944122314453, 28.473743438720703, 32.028045654296875, 35.58235168457031, 39.136653900146484, 42.690956115722656, 46.245262145996094, 49.799564361572266, 53.35386657714844, 56.908172607421875, 60.46247482299805, 64.01677703857422, 67.57108306884766, 71.1253890991211, 74.6796875, 78.23399353027344, 81.78829956054688, 85.34259796142578, 88.89690399169922, 92.45120239257812, 96.00550842285156]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 9.0, 6.0, 13.0, 12.0, 16.0, 13.0, 19.0, 24.0, 25.0, 31.0, 32.0, 35.0, 35.0, 49.0, 48.0, 30.0, 57.0, 63.0, 55.0, 50.0, 52.0, 43.0, 37.0, 36.0, 28.0, 17.0, 30.0, 16.0, 23.0, 16.0, 11.0, 11.0, 10.0, 12.0, 6.0, 4.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-77.99589538574219, -75.7314224243164, -73.46694946289062, -71.20246887207031, -68.93799591064453, -66.67352294921875, -64.40904235839844, -62.144569396972656, -59.880096435546875, -57.615623474121094, -55.35114669799805, -53.086669921875, -50.82219696044922, -48.55772399902344, -46.29324722290039, -44.028770446777344, -41.76429748535156, -39.49982452392578, -37.235347747802734, -34.97087097167969, -32.706398010253906, -30.441923141479492, -28.177448272705078, -25.912973403930664, -23.64849853515625, -21.384023666381836, -19.119548797607422, -16.855073928833008, -14.590599060058594, -12.32612419128418, -10.061649322509766, -7.797174453735352, -5.5326995849609375, -3.2682247161865234, -1.0037498474121094, 1.2607250213623047, 3.5251998901367188, 5.789674758911133, 8.054149627685547, 10.318624496459961, 12.583099365234375, 14.847574234008789, 17.112049102783203, 19.376523971557617, 21.64099884033203, 23.905473709106445, 26.16994857788086, 28.434423446655273, 30.698898315429688, 32.96337127685547, 35.227848052978516, 37.49232482910156, 39.756797790527344, 42.021270751953125, 44.28574752807617, 46.55022430419922, 48.814697265625, 51.07917022705078, 53.34364700317383, 55.608123779296875, 57.872596740722656, 60.13706970214844, 62.401546478271484, 64.66602325439453, 66.93049621582031]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 18.0, 14.0, 20.0, 34.0, 64.0, 92.0, 167.0, 352.0, 658.0, 1399.0, 3503.0, 9308.0, 30035.0, 134144.0, 1286222.0, 2404793.0, 255695.0, 46486.0, 13141.0, 4636.0, 1785.0, 829.0, 383.0, 180.0, 117.0, 67.0, 46.0, 31.0, 20.0, 9.0, 18.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.109375, -9.829833984375, -9.55029296875, -9.270751953125, -8.9912109375, -8.711669921875, -8.43212890625, -8.152587890625, -7.873046875, -7.593505859375, -7.31396484375, -7.034423828125, -6.7548828125, -6.475341796875, -6.19580078125, -5.916259765625, -5.63671875, -5.357177734375, -5.07763671875, -4.798095703125, -4.5185546875, -4.239013671875, -3.95947265625, -3.679931640625, -3.400390625, -3.120849609375, -2.84130859375, -2.561767578125, -2.2822265625, -2.002685546875, -1.72314453125, -1.443603515625, -1.1640625, -0.884521484375, -0.60498046875, -0.325439453125, -0.0458984375, 0.233642578125, 0.51318359375, 0.792724609375, 1.072265625, 1.351806640625, 1.63134765625, 1.910888671875, 2.1904296875, 2.469970703125, 2.74951171875, 3.029052734375, 3.30859375, 3.588134765625, 3.86767578125, 4.147216796875, 4.4267578125, 4.706298828125, 4.98583984375, 5.265380859375, 5.544921875, 5.824462890625, 6.10400390625, 6.383544921875, 6.6630859375, 6.942626953125, 7.22216796875, 7.501708984375, 7.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 4.0, 7.0, 11.0, 8.0, 18.0, 27.0, 24.0, 28.0, 39.0, 54.0, 59.0, 57.0, 75.0, 74.0, 63.0, 77.0, 55.0, 64.0, 52.0, 40.0, 29.0, 29.0, 28.0, 21.0, 11.0, 11.0, 12.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.561767578125, -4.37353515625, -4.185302734375, -3.9970703125, -3.808837890625, -3.62060546875, -3.432373046875, -3.244140625, -3.055908203125, -2.86767578125, -2.679443359375, -2.4912109375, -2.302978515625, -2.11474609375, -1.926513671875, -1.73828125, -1.550048828125, -1.36181640625, -1.173583984375, -0.9853515625, -0.797119140625, -0.60888671875, -0.420654296875, -0.232421875, -0.044189453125, 0.14404296875, 0.332275390625, 0.5205078125, 0.708740234375, 0.89697265625, 1.085205078125, 1.2734375, 1.461669921875, 1.64990234375, 1.838134765625, 2.0263671875, 2.214599609375, 2.40283203125, 2.591064453125, 2.779296875, 2.967529296875, 3.15576171875, 3.343994140625, 3.5322265625, 3.720458984375, 3.90869140625, 4.096923828125, 4.28515625, 4.473388671875, 4.66162109375, 4.849853515625, 5.0380859375, 5.226318359375, 5.41455078125, 5.602783203125, 5.791015625, 5.979248046875, 6.16748046875, 6.355712890625, 6.5439453125, 6.732177734375, 6.92041015625, 7.108642578125, 7.296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 10.0, 6.0, 26.0, 26.0, 48.0, 62.0, 91.0, 150.0, 336.0, 656.0, 1671.0, 5573.0, 25266.0, 177935.0, 3167089.0, 741605.0, 58363.0, 10596.0, 2745.0, 950.0, 453.0, 228.0, 132.0, 79.0, 46.0, 37.0, 21.0, 18.0, 15.0, 12.0, 11.0, 13.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.75, -17.2918701171875, -16.833740234375, -16.3756103515625, -15.91748046875, -15.4593505859375, -15.001220703125, -14.5430908203125, -14.0849609375, -13.6268310546875, -13.168701171875, -12.7105712890625, -12.25244140625, -11.7943115234375, -11.336181640625, -10.8780517578125, -10.419921875, -9.9617919921875, -9.503662109375, -9.0455322265625, -8.58740234375, -8.1292724609375, -7.671142578125, -7.2130126953125, -6.7548828125, -6.2967529296875, -5.838623046875, -5.3804931640625, -4.92236328125, -4.4642333984375, -4.006103515625, -3.5479736328125, -3.08984375, -2.6317138671875, -2.173583984375, -1.7154541015625, -1.25732421875, -0.7991943359375, -0.341064453125, 0.1170654296875, 0.5751953125, 1.0333251953125, 1.491455078125, 1.9495849609375, 2.40771484375, 2.8658447265625, 3.323974609375, 3.7821044921875, 4.240234375, 4.6983642578125, 5.156494140625, 5.6146240234375, 6.07275390625, 6.5308837890625, 6.989013671875, 7.4471435546875, 7.9052734375, 8.3634033203125, 8.821533203125, 9.2796630859375, 9.73779296875, 10.1959228515625, 10.654052734375, 11.1121826171875, 11.5703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 17.0, 16.0, 32.0, 37.0, 68.0, 80.0, 143.0, 238.0, 393.0, 697.0, 800.0, 623.0, 328.0, 206.0, 111.0, 80.0, 48.0, 45.0, 25.0, 16.0, 16.0, 5.0, 8.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.9241943359375, -13.465576171875, -13.0069580078125, -12.54833984375, -12.0897216796875, -11.631103515625, -11.1724853515625, -10.7138671875, -10.2552490234375, -9.796630859375, -9.3380126953125, -8.87939453125, -8.4207763671875, -7.962158203125, -7.5035400390625, -7.044921875, -6.5863037109375, -6.127685546875, -5.6690673828125, -5.21044921875, -4.7518310546875, -4.293212890625, -3.8345947265625, -3.3759765625, -2.9173583984375, -2.458740234375, -2.0001220703125, -1.54150390625, -1.0828857421875, -0.624267578125, -0.1656494140625, 0.29296875, 0.7515869140625, 1.210205078125, 1.6688232421875, 2.12744140625, 2.5860595703125, 3.044677734375, 3.5032958984375, 3.9619140625, 4.4205322265625, 4.879150390625, 5.3377685546875, 5.79638671875, 6.2550048828125, 6.713623046875, 7.1722412109375, 7.630859375, 8.0894775390625, 8.548095703125, 9.0067138671875, 9.46533203125, 9.9239501953125, 10.382568359375, 10.8411865234375, 11.2998046875, 11.7584228515625, 12.217041015625, 12.6756591796875, 13.13427734375, 13.5928955078125, 14.051513671875, 14.5101318359375, 14.96875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 0.0, 4.0, 4.0, 12.0, 8.0, 17.0, 54.0, 97.0, 181.0, 196.0, 204.0, 121.0, 50.0, 25.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.23287963867188, -143.41714477539062, -138.60140991210938, -133.7856903076172, -128.96995544433594, -124.15422058105469, -119.33848571777344, -114.52275848388672, -109.70703125, -104.89129638671875, -100.07556915283203, -95.25983428955078, -90.44410705566406, -85.62837219238281, -80.81263732910156, -75.99691009521484, -71.1811752319336, -66.36544036865234, -61.549713134765625, -56.733978271484375, -51.918251037597656, -47.102516174316406, -42.28678512573242, -37.47105407714844, -32.65532302856445, -27.83959197998047, -23.023860931396484, -18.208127975463867, -13.392396926879883, -8.576665878295898, -3.7609329223632812, 1.0547981262207031, 5.8705291748046875, 10.686260223388672, 15.501992225646973, 20.317724227905273, 25.133455276489258, 29.949186325073242, 34.76491928100586, 39.580650329589844, 44.39638137817383, 49.21211242675781, 54.0278434753418, 58.84357452392578, 63.65930938720703, 68.47503662109375, 73.290771484375, 78.10650634765625, 82.92223358154297, 87.73796844482422, 92.55369567871094, 97.36943054199219, 102.1851577758789, 107.00089263916016, 111.81661987304688, 116.63235473632812, 121.44808959960938, 126.26382446289062, 131.07955932617188, 135.89527893066406, 140.7110137939453, 145.52674865722656, 150.3424835205078, 155.158203125, 159.97393798828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 17.0, 8.0, 11.0, 16.0, 16.0, 21.0, 15.0, 20.0, 32.0, 32.0, 29.0, 45.0, 30.0, 37.0, 38.0, 49.0, 53.0, 47.0, 56.0, 42.0, 34.0, 46.0, 32.0, 35.0, 39.0, 28.0, 37.0, 20.0, 12.0, 22.0, 16.0, 15.0, 12.0, 8.0, 2.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-58.22266387939453, -56.405364990234375, -54.588069915771484, -52.77077102661133, -50.95347213745117, -49.13617706298828, -47.318878173828125, -45.50157928466797, -43.68428039550781, -41.866981506347656, -40.049686431884766, -38.23238754272461, -36.41508865356445, -34.59779357910156, -32.780494689941406, -30.96319580078125, -29.14590072631836, -27.328603744506836, -25.51130485534668, -23.694007873535156, -21.876708984375, -20.059412002563477, -18.242115020751953, -16.424816131591797, -14.607519149780273, -12.790221214294434, -10.972923278808594, -9.15562629699707, -7.3383283615112305, -5.521030426025391, -3.703733444213867, -1.8864355087280273, -0.06914138793945312, 1.7481563091278076, 3.5654540061950684, 5.38275146484375, 7.20004940032959, 9.01734733581543, 10.834644317626953, 12.651942253112793, 14.469240188598633, 16.286537170410156, 18.103836059570312, 19.921133041381836, 21.73843002319336, 23.555728912353516, 25.37302589416504, 27.190322875976562, 29.00762176513672, 30.824918746948242, 32.642215728759766, 34.45951461791992, 36.27681350708008, 38.09410858154297, 39.911407470703125, 41.72870635986328, 43.54600524902344, 45.363304138183594, 47.180599212646484, 48.99789810180664, 50.8151969909668, 52.63249206542969, 54.449790954589844, 56.26708984375, 58.08438491821289]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 11.0, 9.0, 20.0, 24.0, 54.0, 82.0, 170.0, 290.0, 610.0, 1227.0, 2749.0, 7017.0, 19361.0, 56583.0, 170553.0, 420677.0, 244526.0, 80988.0, 27186.0, 9573.0, 3744.0, 1550.0, 722.0, 381.0, 185.0, 109.0, 65.0, 28.0, 33.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.295654296875, -10.92724609375, -10.558837890625, -10.1904296875, -9.822021484375, -9.45361328125, -9.085205078125, -8.716796875, -8.348388671875, -7.97998046875, -7.611572265625, -7.2431640625, -6.874755859375, -6.50634765625, -6.137939453125, -5.76953125, -5.401123046875, -5.03271484375, -4.664306640625, -4.2958984375, -3.927490234375, -3.55908203125, -3.190673828125, -2.822265625, -2.453857421875, -2.08544921875, -1.717041015625, -1.3486328125, -0.980224609375, -0.61181640625, -0.243408203125, 0.125, 0.493408203125, 0.86181640625, 1.230224609375, 1.5986328125, 1.967041015625, 2.33544921875, 2.703857421875, 3.072265625, 3.440673828125, 3.80908203125, 4.177490234375, 4.5458984375, 4.914306640625, 5.28271484375, 5.651123046875, 6.01953125, 6.387939453125, 6.75634765625, 7.124755859375, 7.4931640625, 7.861572265625, 8.22998046875, 8.598388671875, 8.966796875, 9.335205078125, 9.70361328125, 10.072021484375, 10.4404296875, 10.808837890625, 11.17724609375, 11.545654296875, 11.9140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 10.0, 20.0, 21.0, 32.0, 27.0, 33.0, 46.0, 65.0, 64.0, 78.0, 65.0, 82.0, 62.0, 66.0, 60.0, 47.0, 58.0, 28.0, 27.0, 20.0, 15.0, 13.0, 13.0, 10.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.92987060546875, -4.7347412109375, -4.53961181640625, -4.344482421875, -4.14935302734375, -3.9542236328125, -3.75909423828125, -3.56396484375, -3.36883544921875, -3.1737060546875, -2.97857666015625, -2.783447265625, -2.58831787109375, -2.3931884765625, -2.19805908203125, -2.0029296875, -1.80780029296875, -1.6126708984375, -1.41754150390625, -1.222412109375, -1.02728271484375, -0.8321533203125, -0.63702392578125, -0.44189453125, -0.24676513671875, -0.0516357421875, 0.14349365234375, 0.338623046875, 0.53375244140625, 0.7288818359375, 0.92401123046875, 1.119140625, 1.31427001953125, 1.5093994140625, 1.70452880859375, 1.899658203125, 2.09478759765625, 2.2899169921875, 2.48504638671875, 2.68017578125, 2.87530517578125, 3.0704345703125, 3.26556396484375, 3.460693359375, 3.65582275390625, 3.8509521484375, 4.04608154296875, 4.2412109375, 4.43634033203125, 4.6314697265625, 4.82659912109375, 5.021728515625, 5.21685791015625, 5.4119873046875, 5.60711669921875, 5.80224609375, 5.99737548828125, 6.1925048828125, 6.38763427734375, 6.582763671875, 6.77789306640625, 6.9730224609375, 7.16815185546875, 7.36328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 9.0, 10.0, 18.0, 22.0, 21.0, 54.0, 64.0, 75.0, 117.0, 135.0, 223.0, 320.0, 470.0, 756.0, 1179.0, 2176.0, 5019.0, 20113.0, 142659.0, 725063.0, 121917.0, 17944.0, 4689.0, 2055.0, 1135.0, 726.0, 454.0, 329.0, 234.0, 151.0, 123.0, 88.0, 57.0, 36.0, 25.0, 24.0, 15.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.359375, -19.7509765625, -19.142578125, -18.5341796875, -17.92578125, -17.3173828125, -16.708984375, -16.1005859375, -15.4921875, -14.8837890625, -14.275390625, -13.6669921875, -13.05859375, -12.4501953125, -11.841796875, -11.2333984375, -10.625, -10.0166015625, -9.408203125, -8.7998046875, -8.19140625, -7.5830078125, -6.974609375, -6.3662109375, -5.7578125, -5.1494140625, -4.541015625, -3.9326171875, -3.32421875, -2.7158203125, -2.107421875, -1.4990234375, -0.890625, -0.2822265625, 0.326171875, 0.9345703125, 1.54296875, 2.1513671875, 2.759765625, 3.3681640625, 3.9765625, 4.5849609375, 5.193359375, 5.8017578125, 6.41015625, 7.0185546875, 7.626953125, 8.2353515625, 8.84375, 9.4521484375, 10.060546875, 10.6689453125, 11.27734375, 11.8857421875, 12.494140625, 13.1025390625, 13.7109375, 14.3193359375, 14.927734375, 15.5361328125, 16.14453125, 16.7529296875, 17.361328125, 17.9697265625, 18.578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 9.0, 6.0, 13.0, 17.0, 6.0, 29.0, 29.0, 25.0, 32.0, 25.0, 43.0, 40.0, 36.0, 53.0, 55.0, 45.0, 55.0, 51.0, 32.0, 47.0, 40.0, 37.0, 36.0, 25.0, 33.0, 24.0, 22.0, 14.0, 21.0, 14.0, 13.0, 11.0, 3.0, 5.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.585205078125, -16.98291015625, -16.380615234375, -15.7783203125, -15.176025390625, -14.57373046875, -13.971435546875, -13.369140625, -12.766845703125, -12.16455078125, -11.562255859375, -10.9599609375, -10.357666015625, -9.75537109375, -9.153076171875, -8.55078125, -7.948486328125, -7.34619140625, -6.743896484375, -6.1416015625, -5.539306640625, -4.93701171875, -4.334716796875, -3.732421875, -3.130126953125, -2.52783203125, -1.925537109375, -1.3232421875, -0.720947265625, -0.11865234375, 0.483642578125, 1.0859375, 1.688232421875, 2.29052734375, 2.892822265625, 3.4951171875, 4.097412109375, 4.69970703125, 5.302001953125, 5.904296875, 6.506591796875, 7.10888671875, 7.711181640625, 8.3134765625, 8.915771484375, 9.51806640625, 10.120361328125, 10.72265625, 11.324951171875, 11.92724609375, 12.529541015625, 13.1318359375, 13.734130859375, 14.33642578125, 14.938720703125, 15.541015625, 16.143310546875, 16.74560546875, 17.347900390625, 17.9501953125, 18.552490234375, 19.15478515625, 19.757080078125, 20.359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 12.0, 7.0, 5.0, 8.0, 11.0, 16.0, 21.0, 27.0, 30.0, 62.0, 101.0, 135.0, 298.0, 573.0, 1263.0, 3628.0, 13664.0, 76666.0, 673072.0, 234165.0, 33572.0, 7319.0, 2073.0, 847.0, 399.0, 188.0, 136.0, 78.0, 53.0, 36.0, 26.0, 16.0, 19.0, 8.0, 6.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.8717041015625, -5.680908203125, -5.4901123046875, -5.29931640625, -5.1085205078125, -4.917724609375, -4.7269287109375, -4.5361328125, -4.3453369140625, -4.154541015625, -3.9637451171875, -3.77294921875, -3.5821533203125, -3.391357421875, -3.2005615234375, -3.009765625, -2.8189697265625, -2.628173828125, -2.4373779296875, -2.24658203125, -2.0557861328125, -1.864990234375, -1.6741943359375, -1.4833984375, -1.2926025390625, -1.101806640625, -0.9110107421875, -0.72021484375, -0.5294189453125, -0.338623046875, -0.1478271484375, 0.04296875, 0.2337646484375, 0.424560546875, 0.6153564453125, 0.80615234375, 0.9969482421875, 1.187744140625, 1.3785400390625, 1.5693359375, 1.7601318359375, 1.950927734375, 2.1417236328125, 2.33251953125, 2.5233154296875, 2.714111328125, 2.9049072265625, 3.095703125, 3.2864990234375, 3.477294921875, 3.6680908203125, 3.85888671875, 4.0496826171875, 4.240478515625, 4.4312744140625, 4.6220703125, 4.8128662109375, 5.003662109375, 5.1944580078125, 5.38525390625, 5.5760498046875, 5.766845703125, 5.9576416015625, 6.1484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 12.0, 15.0, 16.0, 28.0, 27.0, 37.0, 39.0, 65.0, 84.0, 125.0, 154.0, 98.0, 47.0, 55.0, 38.0, 32.0, 24.0, 19.0, 19.0, 10.0, 4.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012731552124023438, -0.0012280046939849854, -0.001182854175567627, -0.0011377036571502686, -0.0010925531387329102, -0.0010474026203155518, -0.0010022521018981934, -0.000957101583480835, -0.0009119510650634766, -0.0008668005466461182, -0.0008216500282287598, -0.0007764995098114014, -0.000731348991394043, -0.0006861984729766846, -0.0006410479545593262, -0.0005958974361419678, -0.0005507469177246094, -0.000505596399307251, -0.0004604458808898926, -0.0004152953624725342, -0.0003701448440551758, -0.0003249943256378174, -0.000279843807220459, -0.00023469328880310059, -0.0001895427703857422, -0.0001443922519683838, -9.924173355102539e-05, -5.409121513366699e-05, -8.940696716308594e-06, 3.6209821701049805e-05, 8.13603401184082e-05, 0.0001265108585357666, 0.000171661376953125, 0.0002168118953704834, 0.0002619624137878418, 0.0003071129322052002, 0.0003522634506225586, 0.000397413969039917, 0.0004425644874572754, 0.0004877150058746338, 0.0005328655242919922, 0.0005780160427093506, 0.000623166561126709, 0.0006683170795440674, 0.0007134675979614258, 0.0007586181163787842, 0.0008037686347961426, 0.000848919153213501, 0.0008940696716308594, 0.0009392201900482178, 0.0009843707084655762, 0.0010295212268829346, 0.001074671745300293, 0.0011198222637176514, 0.0011649727821350098, 0.0012101233005523682, 0.0012552738189697266, 0.001300424337387085, 0.0013455748558044434, 0.0013907253742218018, 0.0014358758926391602, 0.0014810264110565186, 0.001526176929473877, 0.0015713274478912354, 0.0016164779663085938]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 11.0, 14.0, 22.0, 18.0, 26.0, 45.0, 86.0, 105.0, 186.0, 328.0, 530.0, 949.0, 2197.0, 5619.0, 21237.0, 155382.0, 734398.0, 102818.0, 16091.0, 4462.0, 1758.0, 900.0, 517.0, 299.0, 179.0, 127.0, 67.0, 64.0, 35.0, 30.0, 18.0, 12.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.30780029296875, -5.1273193359375, -4.94683837890625, -4.766357421875, -4.58587646484375, -4.4053955078125, -4.22491455078125, -4.04443359375, -3.86395263671875, -3.6834716796875, -3.50299072265625, -3.322509765625, -3.14202880859375, -2.9615478515625, -2.78106689453125, -2.6005859375, -2.42010498046875, -2.2396240234375, -2.05914306640625, -1.878662109375, -1.69818115234375, -1.5177001953125, -1.33721923828125, -1.15673828125, -0.97625732421875, -0.7957763671875, -0.61529541015625, -0.434814453125, -0.25433349609375, -0.0738525390625, 0.10662841796875, 0.287109375, 0.46759033203125, 0.6480712890625, 0.82855224609375, 1.009033203125, 1.18951416015625, 1.3699951171875, 1.55047607421875, 1.73095703125, 1.91143798828125, 2.0919189453125, 2.27239990234375, 2.452880859375, 2.63336181640625, 2.8138427734375, 2.99432373046875, 3.1748046875, 3.35528564453125, 3.5357666015625, 3.71624755859375, 3.896728515625, 4.07720947265625, 4.2576904296875, 4.43817138671875, 4.61865234375, 4.79913330078125, 4.9796142578125, 5.16009521484375, 5.340576171875, 5.52105712890625, 5.7015380859375, 5.88201904296875, 6.0625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 1.0, 5.0, 3.0, 9.0, 8.0, 6.0, 2.0, 13.0, 14.0, 20.0, 21.0, 28.0, 34.0, 38.0, 41.0, 44.0, 63.0, 49.0, 62.0, 53.0, 52.0, 63.0, 52.0, 47.0, 42.0, 34.0, 24.0, 27.0, 32.0, 19.0, 24.0, 14.0, 5.0, 6.0, 5.0, 7.0, 3.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.634765625, -3.519287109375, -3.40380859375, -3.288330078125, -3.1728515625, -3.057373046875, -2.94189453125, -2.826416015625, -2.7109375, -2.595458984375, -2.47998046875, -2.364501953125, -2.2490234375, -2.133544921875, -2.01806640625, -1.902587890625, -1.787109375, -1.671630859375, -1.55615234375, -1.440673828125, -1.3251953125, -1.209716796875, -1.09423828125, -0.978759765625, -0.86328125, -0.747802734375, -0.63232421875, -0.516845703125, -0.4013671875, -0.285888671875, -0.17041015625, -0.054931640625, 0.060546875, 0.176025390625, 0.29150390625, 0.406982421875, 0.5224609375, 0.637939453125, 0.75341796875, 0.868896484375, 0.984375, 1.099853515625, 1.21533203125, 1.330810546875, 1.4462890625, 1.561767578125, 1.67724609375, 1.792724609375, 1.908203125, 2.023681640625, 2.13916015625, 2.254638671875, 2.3701171875, 2.485595703125, 2.60107421875, 2.716552734375, 2.83203125, 2.947509765625, 3.06298828125, 3.178466796875, 3.2939453125, 3.409423828125, 3.52490234375, 3.640380859375, 3.755859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 25.0, 51.0, 134.0, 243.0, 330.0, 123.0, 42.0, 21.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.59625244140625, -271.1712341308594, -264.7462158203125, -258.3211975097656, -251.89617919921875, -245.47116088867188, -239.046142578125, -232.62112426757812, -226.19610595703125, -219.77108764648438, -213.3460693359375, -206.92105102539062, -200.49603271484375, -194.07101440429688, -187.64599609375, -181.22097778320312, -174.79595947265625, -168.37094116210938, -161.9459228515625, -155.52090454101562, -149.09588623046875, -142.67086791992188, -136.245849609375, -129.82083129882812, -123.39579772949219, -116.97077941894531, -110.54576110839844, -104.12074279785156, -97.69572448730469, -91.27070617675781, -84.84568786621094, -78.42066955566406, -71.99565124511719, -65.57063293457031, -59.14561462402344, -52.72059631347656, -46.29557800292969, -39.87055587768555, -33.44553756713867, -27.020519256591797, -20.595500946044922, -14.170482635498047, -7.7454633712768555, -1.320444107055664, 5.104574203491211, 11.529594421386719, 17.954612731933594, 24.37963104248047, 30.804649353027344, 37.22966766357422, 43.654685974121094, 50.07970428466797, 56.504722595214844, 62.929744720458984, 69.35476684570312, 75.77978515625, 82.20480346679688, 88.62982177734375, 95.05484008789062, 101.4798583984375, 107.90487670898438, 114.32989501953125, 120.75491333007812, 127.179931640625, 133.60494995117188]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 8.0, 10.0, 12.0, 13.0, 18.0, 23.0, 18.0, 26.0, 28.0, 27.0, 41.0, 41.0, 46.0, 54.0, 69.0, 88.0, 87.0, 53.0, 49.0, 40.0, 32.0, 34.0, 40.0, 32.0, 22.0, 22.0, 17.0, 9.0, 6.0, 11.0, 6.0, 11.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.84745025634766, -80.99778747558594, -78.14812469482422, -75.2984619140625, -72.44879913330078, -69.59913635253906, -66.74946594238281, -63.89980697631836, -61.05014419555664, -58.20048141479492, -55.3508186340332, -52.50115203857422, -49.6514892578125, -46.80182647705078, -43.95216369628906, -41.102500915527344, -38.252838134765625, -35.403175354003906, -32.55351257324219, -29.703847885131836, -26.854185104370117, -24.0045223236084, -21.154857635498047, -18.305194854736328, -15.45553207397461, -12.60586929321289, -9.756205558776855, -6.90654182434082, -4.056879043579102, -1.2072162628173828, 1.6424484252929688, 4.4921112060546875, 7.341773986816406, 10.191436767578125, 13.04110050201416, 15.890764236450195, 18.740427017211914, 21.590089797973633, 24.439754486083984, 27.289417266845703, 30.139080047607422, 32.98874282836914, 35.83840560913086, 38.688072204589844, 41.53773498535156, 44.38739776611328, 47.237060546875, 50.08672332763672, 52.93638610839844, 55.786048889160156, 58.635711669921875, 61.485374450683594, 64.33503723144531, 67.18470001220703, 70.03436279296875, 72.884033203125, 75.73368835449219, 78.5833511352539, 81.43301391601562, 84.28267669677734, 87.13233947753906, 89.98200225830078, 92.8316650390625, 95.68133544921875, 98.53099822998047]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 12.0, 26.0, 40.0, 83.0, 149.0, 323.0, 742.0, 1787.0, 4393.0, 12485.0, 40840.0, 222417.0, 2410718.0, 1336251.0, 123819.0, 26695.0, 8242.0, 3046.0, 1151.0, 520.0, 205.0, 129.0, 68.0, 41.0, 21.0, 18.0, 16.0, 16.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.43096923828125, -5.1705322265625, -4.91009521484375, -4.649658203125, -4.38922119140625, -4.1287841796875, -3.86834716796875, -3.60791015625, -3.34747314453125, -3.0870361328125, -2.82659912109375, -2.566162109375, -2.30572509765625, -2.0452880859375, -1.78485107421875, -1.5244140625, -1.26397705078125, -1.0035400390625, -0.74310302734375, -0.482666015625, -0.22222900390625, 0.0382080078125, 0.29864501953125, 0.55908203125, 0.81951904296875, 1.0799560546875, 1.34039306640625, 1.600830078125, 1.86126708984375, 2.1217041015625, 2.38214111328125, 2.642578125, 2.90301513671875, 3.1634521484375, 3.42388916015625, 3.684326171875, 3.94476318359375, 4.2052001953125, 4.46563720703125, 4.72607421875, 4.98651123046875, 5.2469482421875, 5.50738525390625, 5.767822265625, 6.02825927734375, 6.2886962890625, 6.54913330078125, 6.8095703125, 7.07000732421875, 7.3304443359375, 7.59088134765625, 7.851318359375, 8.11175537109375, 8.3721923828125, 8.63262939453125, 8.89306640625, 9.15350341796875, 9.4139404296875, 9.67437744140625, 9.934814453125, 10.19525146484375, 10.4556884765625, 10.71612548828125, 10.9765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 20.0, 26.0, 38.0, 39.0, 89.0, 81.0, 86.0, 113.0, 85.0, 107.0, 67.0, 92.0, 44.0, 36.0, 23.0, 16.0, 15.0, 3.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.00933837890625, -3.7257080078125, -3.44207763671875, -3.158447265625, -2.87481689453125, -2.5911865234375, -2.30755615234375, -2.02392578125, -1.74029541015625, -1.4566650390625, -1.17303466796875, -0.889404296875, -0.60577392578125, -0.3221435546875, -0.03851318359375, 0.2451171875, 0.52874755859375, 0.8123779296875, 1.09600830078125, 1.379638671875, 1.66326904296875, 1.9468994140625, 2.23052978515625, 2.51416015625, 2.79779052734375, 3.0814208984375, 3.36505126953125, 3.648681640625, 3.93231201171875, 4.2159423828125, 4.49957275390625, 4.783203125, 5.06683349609375, 5.3504638671875, 5.63409423828125, 5.917724609375, 6.20135498046875, 6.4849853515625, 6.76861572265625, 7.05224609375, 7.33587646484375, 7.6195068359375, 7.90313720703125, 8.186767578125, 8.47039794921875, 8.7540283203125, 9.03765869140625, 9.3212890625, 9.60491943359375, 9.8885498046875, 10.17218017578125, 10.455810546875, 10.73944091796875, 11.0230712890625, 11.30670166015625, 11.59033203125, 11.87396240234375, 12.1575927734375, 12.44122314453125, 12.724853515625, 13.00848388671875, 13.2921142578125, 13.57574462890625, 13.859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 2.0, 8.0, 8.0, 17.0, 12.0, 22.0, 37.0, 43.0, 66.0, 99.0, 152.0, 263.0, 380.0, 676.0, 1296.0, 2921.0, 7210.0, 22074.0, 88521.0, 820008.0, 2937293.0, 247634.0, 44517.0, 12480.0, 4422.0, 1795.0, 899.0, 482.0, 303.0, 187.0, 124.0, 79.0, 53.0, 54.0, 38.0, 18.0, 23.0, 12.0, 11.0, 7.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.6640625, -10.343505859375, -10.02294921875, -9.702392578125, -9.3818359375, -9.061279296875, -8.74072265625, -8.420166015625, -8.099609375, -7.779052734375, -7.45849609375, -7.137939453125, -6.8173828125, -6.496826171875, -6.17626953125, -5.855712890625, -5.53515625, -5.214599609375, -4.89404296875, -4.573486328125, -4.2529296875, -3.932373046875, -3.61181640625, -3.291259765625, -2.970703125, -2.650146484375, -2.32958984375, -2.009033203125, -1.6884765625, -1.367919921875, -1.04736328125, -0.726806640625, -0.40625, -0.085693359375, 0.23486328125, 0.555419921875, 0.8759765625, 1.196533203125, 1.51708984375, 1.837646484375, 2.158203125, 2.478759765625, 2.79931640625, 3.119873046875, 3.4404296875, 3.760986328125, 4.08154296875, 4.402099609375, 4.72265625, 5.043212890625, 5.36376953125, 5.684326171875, 6.0048828125, 6.325439453125, 6.64599609375, 6.966552734375, 7.287109375, 7.607666015625, 7.92822265625, 8.248779296875, 8.5693359375, 8.889892578125, 9.21044921875, 9.531005859375, 9.8515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 4.0, 9.0, 11.0, 10.0, 22.0, 36.0, 39.0, 59.0, 81.0, 134.0, 203.0, 327.0, 561.0, 784.0, 631.0, 415.0, 230.0, 157.0, 105.0, 67.0, 50.0, 32.0, 29.0, 12.0, 15.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.9473876953125, -10.590087890625, -10.2327880859375, -9.87548828125, -9.5181884765625, -9.160888671875, -8.8035888671875, -8.4462890625, -8.0889892578125, -7.731689453125, -7.3743896484375, -7.01708984375, -6.6597900390625, -6.302490234375, -5.9451904296875, -5.587890625, -5.2305908203125, -4.873291015625, -4.5159912109375, -4.15869140625, -3.8013916015625, -3.444091796875, -3.0867919921875, -2.7294921875, -2.3721923828125, -2.014892578125, -1.6575927734375, -1.30029296875, -0.9429931640625, -0.585693359375, -0.2283935546875, 0.12890625, 0.4862060546875, 0.843505859375, 1.2008056640625, 1.55810546875, 1.9154052734375, 2.272705078125, 2.6300048828125, 2.9873046875, 3.3446044921875, 3.701904296875, 4.0592041015625, 4.41650390625, 4.7738037109375, 5.131103515625, 5.4884033203125, 5.845703125, 6.2030029296875, 6.560302734375, 6.9176025390625, 7.27490234375, 7.6322021484375, 7.989501953125, 8.3468017578125, 8.7041015625, 9.0614013671875, 9.418701171875, 9.7760009765625, 10.13330078125, 10.4906005859375, 10.847900390625, 11.2052001953125, 11.5625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 7.0, 33.0, 95.0, 242.0, 296.0, 195.0, 83.0, 24.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.0605163574219, -269.6875305175781, -263.3145751953125, -256.94158935546875, -250.56863403320312, -244.19564819335938, -237.8226776123047, -231.44970703125, -225.0767364501953, -218.70376586914062, -212.33079528808594, -205.95782470703125, -199.5848388671875, -193.2118682861328, -186.83889770507812, -180.46592712402344, -174.09295654296875, -167.71998596191406, -161.34701538085938, -154.9740447998047, -148.60107421875, -142.22808837890625, -135.85511779785156, -129.48214721679688, -123.10917663574219, -116.7362060546875, -110.36323547363281, -103.9902572631836, -97.6172866821289, -91.24431610107422, -84.871337890625, -78.49836730957031, -72.12541198730469, -65.75244140625, -59.37946701049805, -53.006492614746094, -46.633522033691406, -40.26055145263672, -33.887577056884766, -27.514602661132812, -21.141632080078125, -14.768659591674805, -8.395687103271484, -2.022714614868164, 4.350257873535156, 10.723230361938477, 17.096202850341797, 23.46917724609375, 29.842147827148438, 36.215118408203125, 42.58809280395508, 48.96106719970703, 55.33403778076172, 61.707008361816406, 68.07998657226562, 74.45295715332031, 80.825927734375, 87.19889831542969, 93.57186889648438, 99.9448471069336, 106.31781768798828, 112.69078826904297, 119.06376647949219, 125.43673706054688, 131.80970764160156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 1.0, 8.0, 7.0, 17.0, 25.0, 26.0, 37.0, 49.0, 50.0, 70.0, 74.0, 74.0, 83.0, 85.0, 72.0, 68.0, 58.0, 41.0, 49.0, 27.0, 25.0, 13.0, 8.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.61972045898438, -89.03205871582031, -86.44438934326172, -83.85671997070312, -81.26905822753906, -78.681396484375, -76.0937271118164, -73.50605773925781, -70.91839599609375, -68.33073425292969, -65.7430648803711, -63.155399322509766, -60.56773376464844, -57.98006820678711, -55.39240264892578, -52.80473709106445, -50.217071533203125, -47.6294059753418, -45.04174041748047, -42.45407485961914, -39.86640930175781, -37.278743743896484, -34.691078186035156, -32.10341262817383, -29.5157470703125, -26.928081512451172, -24.340415954589844, -21.752750396728516, -19.165084838867188, -16.57741928100586, -13.989753723144531, -11.402088165283203, -8.814422607421875, -6.226757049560547, -3.6390914916992188, -1.0514259338378906, 1.5362396240234375, 4.123905181884766, 6.711570739746094, 9.299236297607422, 11.88690185546875, 14.474567413330078, 17.062232971191406, 19.649898529052734, 22.237564086914062, 24.82522964477539, 27.41289520263672, 30.000560760498047, 32.588226318359375, 35.1758918762207, 37.76355743408203, 40.35122299194336, 42.93888854980469, 45.526554107666016, 48.114219665527344, 50.70188522338867, 53.28955078125, 55.87721633911133, 58.464881896972656, 61.052547454833984, 63.64021301269531, 66.22787475585938, 68.81554412841797, 71.40321350097656, 73.99087524414062]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 13.0, 20.0, 23.0, 69.0, 74.0, 125.0, 180.0, 300.0, 501.0, 844.0, 1512.0, 2784.0, 5326.0, 10355.0, 22368.0, 50700.0, 125306.0, 320853.0, 301747.0, 116251.0, 47261.0, 20911.0, 9945.0, 5023.0, 2588.0, 1472.0, 799.0, 465.0, 267.0, 159.0, 99.0, 77.0, 47.0, 26.0, 18.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.8983154296875, -6.632568359375, -6.3668212890625, -6.10107421875, -5.8353271484375, -5.569580078125, -5.3038330078125, -5.0380859375, -4.7723388671875, -4.506591796875, -4.2408447265625, -3.97509765625, -3.7093505859375, -3.443603515625, -3.1778564453125, -2.912109375, -2.6463623046875, -2.380615234375, -2.1148681640625, -1.84912109375, -1.5833740234375, -1.317626953125, -1.0518798828125, -0.7861328125, -0.5203857421875, -0.254638671875, 0.0111083984375, 0.27685546875, 0.5426025390625, 0.808349609375, 1.0740966796875, 1.33984375, 1.6055908203125, 1.871337890625, 2.1370849609375, 2.40283203125, 2.6685791015625, 2.934326171875, 3.2000732421875, 3.4658203125, 3.7315673828125, 3.997314453125, 4.2630615234375, 4.52880859375, 4.7945556640625, 5.060302734375, 5.3260498046875, 5.591796875, 5.8575439453125, 6.123291015625, 6.3890380859375, 6.65478515625, 6.9205322265625, 7.186279296875, 7.4520263671875, 7.7177734375, 7.9835205078125, 8.249267578125, 8.5150146484375, 8.78076171875, 9.0465087890625, 9.312255859375, 9.5780029296875, 9.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 6.0, 9.0, 10.0, 16.0, 18.0, 22.0, 26.0, 25.0, 47.0, 53.0, 48.0, 48.0, 64.0, 74.0, 57.0, 61.0, 49.0, 53.0, 63.0, 49.0, 44.0, 36.0, 30.0, 15.0, 14.0, 17.0, 12.0, 10.0, 6.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.3885498046875, -4.202880859375, -4.0172119140625, -3.83154296875, -3.6458740234375, -3.460205078125, -3.2745361328125, -3.0888671875, -2.9031982421875, -2.717529296875, -2.5318603515625, -2.34619140625, -2.1605224609375, -1.974853515625, -1.7891845703125, -1.603515625, -1.4178466796875, -1.232177734375, -1.0465087890625, -0.86083984375, -0.6751708984375, -0.489501953125, -0.3038330078125, -0.1181640625, 0.0675048828125, 0.253173828125, 0.4388427734375, 0.62451171875, 0.8101806640625, 0.995849609375, 1.1815185546875, 1.3671875, 1.5528564453125, 1.738525390625, 1.9241943359375, 2.10986328125, 2.2955322265625, 2.481201171875, 2.6668701171875, 2.8525390625, 3.0382080078125, 3.223876953125, 3.4095458984375, 3.59521484375, 3.7808837890625, 3.966552734375, 4.1522216796875, 4.337890625, 4.5235595703125, 4.709228515625, 4.8948974609375, 5.08056640625, 5.2662353515625, 5.451904296875, 5.6375732421875, 5.8232421875, 6.0089111328125, 6.194580078125, 6.3802490234375, 6.56591796875, 6.7515869140625, 6.937255859375, 7.1229248046875, 7.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 7.0, 2.0, 4.0, 5.0, 9.0, 16.0, 18.0, 22.0, 33.0, 48.0, 74.0, 91.0, 127.0, 170.0, 278.0, 402.0, 675.0, 1159.0, 2251.0, 5855.0, 23728.0, 181519.0, 730467.0, 79795.0, 13390.0, 3951.0, 1757.0, 946.0, 576.0, 354.0, 255.0, 168.0, 123.0, 79.0, 66.0, 37.0, 22.0, 24.0, 20.0, 12.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.328125, -19.718017578125, -19.10791015625, -18.497802734375, -17.8876953125, -17.277587890625, -16.66748046875, -16.057373046875, -15.447265625, -14.837158203125, -14.22705078125, -13.616943359375, -13.0068359375, -12.396728515625, -11.78662109375, -11.176513671875, -10.56640625, -9.956298828125, -9.34619140625, -8.736083984375, -8.1259765625, -7.515869140625, -6.90576171875, -6.295654296875, -5.685546875, -5.075439453125, -4.46533203125, -3.855224609375, -3.2451171875, -2.635009765625, -2.02490234375, -1.414794921875, -0.8046875, -0.194580078125, 0.41552734375, 1.025634765625, 1.6357421875, 2.245849609375, 2.85595703125, 3.466064453125, 4.076171875, 4.686279296875, 5.29638671875, 5.906494140625, 6.5166015625, 7.126708984375, 7.73681640625, 8.346923828125, 8.95703125, 9.567138671875, 10.17724609375, 10.787353515625, 11.3974609375, 12.007568359375, 12.61767578125, 13.227783203125, 13.837890625, 14.447998046875, 15.05810546875, 15.668212890625, 16.2783203125, 16.888427734375, 17.49853515625, 18.108642578125, 18.71875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 6.0, 10.0, 13.0, 9.0, 14.0, 23.0, 18.0, 17.0, 28.0, 34.0, 37.0, 45.0, 38.0, 49.0, 42.0, 52.0, 50.0, 77.0, 53.0, 54.0, 40.0, 51.0, 33.0, 37.0, 30.0, 25.0, 20.0, 21.0, 13.0, 14.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.782470703125, -16.17431640625, -15.566162109375, -14.9580078125, -14.349853515625, -13.74169921875, -13.133544921875, -12.525390625, -11.917236328125, -11.30908203125, -10.700927734375, -10.0927734375, -9.484619140625, -8.87646484375, -8.268310546875, -7.66015625, -7.052001953125, -6.44384765625, -5.835693359375, -5.2275390625, -4.619384765625, -4.01123046875, -3.403076171875, -2.794921875, -2.186767578125, -1.57861328125, -0.970458984375, -0.3623046875, 0.245849609375, 0.85400390625, 1.462158203125, 2.0703125, 2.678466796875, 3.28662109375, 3.894775390625, 4.5029296875, 5.111083984375, 5.71923828125, 6.327392578125, 6.935546875, 7.543701171875, 8.15185546875, 8.760009765625, 9.3681640625, 9.976318359375, 10.58447265625, 11.192626953125, 11.80078125, 12.408935546875, 13.01708984375, 13.625244140625, 14.2333984375, 14.841552734375, 15.44970703125, 16.057861328125, 16.666015625, 17.274169921875, 17.88232421875, 18.490478515625, 19.0986328125, 19.706787109375, 20.31494140625, 20.923095703125, 21.53125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 11.0, 4.0, 10.0, 14.0, 25.0, 29.0, 49.0, 68.0, 106.0, 181.0, 264.0, 415.0, 742.0, 1317.0, 2693.0, 6693.0, 29652.0, 335434.0, 618651.0, 37633.0, 8033.0, 3023.0, 1451.0, 775.0, 475.0, 296.0, 163.0, 122.0, 70.0, 40.0, 32.0, 19.0, 17.0, 15.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.49432373046875, -5.2659912109375, -5.03765869140625, -4.809326171875, -4.58099365234375, -4.3526611328125, -4.12432861328125, -3.89599609375, -3.66766357421875, -3.4393310546875, -3.21099853515625, -2.982666015625, -2.75433349609375, -2.5260009765625, -2.29766845703125, -2.0693359375, -1.84100341796875, -1.6126708984375, -1.38433837890625, -1.156005859375, -0.92767333984375, -0.6993408203125, -0.47100830078125, -0.24267578125, -0.01434326171875, 0.2139892578125, 0.44232177734375, 0.670654296875, 0.89898681640625, 1.1273193359375, 1.35565185546875, 1.583984375, 1.81231689453125, 2.0406494140625, 2.26898193359375, 2.497314453125, 2.72564697265625, 2.9539794921875, 3.18231201171875, 3.41064453125, 3.63897705078125, 3.8673095703125, 4.09564208984375, 4.323974609375, 4.55230712890625, 4.7806396484375, 5.00897216796875, 5.2373046875, 5.46563720703125, 5.6939697265625, 5.92230224609375, 6.150634765625, 6.37896728515625, 6.6072998046875, 6.83563232421875, 7.06396484375, 7.29229736328125, 7.5206298828125, 7.74896240234375, 7.977294921875, 8.20562744140625, 8.4339599609375, 8.66229248046875, 8.890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 14.0, 35.0, 63.0, 198.0, 456.0, 125.0, 44.0, 26.0, 16.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005268096923828125, -0.005105435848236084, -0.004942774772644043, -0.004780113697052002, -0.004617452621459961, -0.00445479154586792, -0.004292130470275879, -0.004129469394683838, -0.003966808319091797, -0.003804147243499756, -0.003641486167907715, -0.003478825092315674, -0.003316164016723633, -0.003153502941131592, -0.0029908418655395508, -0.0028281807899475098, -0.0026655197143554688, -0.0025028586387634277, -0.0023401975631713867, -0.0021775364875793457, -0.0020148754119873047, -0.0018522143363952637, -0.0016895532608032227, -0.0015268921852111816, -0.0013642311096191406, -0.0012015700340270996, -0.0010389089584350586, -0.0008762478828430176, -0.0007135868072509766, -0.0005509257316589355, -0.00038826465606689453, -0.00022560358047485352, -6.29425048828125e-05, 9.971857070922852e-05, 0.00026237964630126953, 0.00042504072189331055, 0.0005877017974853516, 0.0007503628730773926, 0.0009130239486694336, 0.0010756850242614746, 0.0012383460998535156, 0.0014010071754455566, 0.0015636682510375977, 0.0017263293266296387, 0.0018889904022216797, 0.0020516514778137207, 0.0022143125534057617, 0.0023769736289978027, 0.0025396347045898438, 0.0027022957801818848, 0.0028649568557739258, 0.003027617931365967, 0.003190279006958008, 0.003352940082550049, 0.00351560115814209, 0.003678262233734131, 0.003840923309326172, 0.004003584384918213, 0.004166245460510254, 0.004328906536102295, 0.004491567611694336, 0.004654228687286377, 0.004816889762878418, 0.004979550838470459, 0.0051422119140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 11.0, 29.0, 47.0, 76.0, 137.0, 306.0, 787.0, 2554.0, 16868.0, 936504.0, 83914.0, 5144.0, 1257.0, 467.0, 179.0, 93.0, 53.0, 36.0, 23.0, 19.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.4375, -17.94873046875, -17.4599609375, -16.97119140625, -16.482421875, -15.99365234375, -15.5048828125, -15.01611328125, -14.52734375, -14.03857421875, -13.5498046875, -13.06103515625, -12.572265625, -12.08349609375, -11.5947265625, -11.10595703125, -10.6171875, -10.12841796875, -9.6396484375, -9.15087890625, -8.662109375, -8.17333984375, -7.6845703125, -7.19580078125, -6.70703125, -6.21826171875, -5.7294921875, -5.24072265625, -4.751953125, -4.26318359375, -3.7744140625, -3.28564453125, -2.796875, -2.30810546875, -1.8193359375, -1.33056640625, -0.841796875, -0.35302734375, 0.1357421875, 0.62451171875, 1.11328125, 1.60205078125, 2.0908203125, 2.57958984375, 3.068359375, 3.55712890625, 4.0458984375, 4.53466796875, 5.0234375, 5.51220703125, 6.0009765625, 6.48974609375, 6.978515625, 7.46728515625, 7.9560546875, 8.44482421875, 8.93359375, 9.42236328125, 9.9111328125, 10.39990234375, 10.888671875, 11.37744140625, 11.8662109375, 12.35498046875, 12.84375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 6.0, 14.0, 20.0, 31.0, 78.0, 138.0, 194.0, 210.0, 139.0, 64.0, 37.0, 23.0, 9.0, 12.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -11.0296630859375, -10.723388671875, -10.4171142578125, -10.11083984375, -9.8045654296875, -9.498291015625, -9.1920166015625, -8.8857421875, -8.5794677734375, -8.273193359375, -7.9669189453125, -7.66064453125, -7.3543701171875, -7.048095703125, -6.7418212890625, -6.435546875, -6.1292724609375, -5.822998046875, -5.5167236328125, -5.21044921875, -4.9041748046875, -4.597900390625, -4.2916259765625, -3.9853515625, -3.6790771484375, -3.372802734375, -3.0665283203125, -2.76025390625, -2.4539794921875, -2.147705078125, -1.8414306640625, -1.53515625, -1.2288818359375, -0.922607421875, -0.6163330078125, -0.31005859375, -0.0037841796875, 0.302490234375, 0.6087646484375, 0.9150390625, 1.2213134765625, 1.527587890625, 1.8338623046875, 2.14013671875, 2.4464111328125, 2.752685546875, 3.0589599609375, 3.365234375, 3.6715087890625, 3.977783203125, 4.2840576171875, 4.59033203125, 4.8966064453125, 5.202880859375, 5.5091552734375, 5.8154296875, 6.1217041015625, 6.427978515625, 6.7342529296875, 7.04052734375, 7.3468017578125, 7.653076171875, 7.9593505859375, 8.265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 15.0, 37.0, 72.0, 157.0, 264.0, 204.0, 117.0, 56.0, 31.0, 17.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.45606994628906, -123.65691375732422, -118.8577651977539, -114.05860900878906, -109.25946044921875, -104.4603042602539, -99.66114807128906, -94.86199951171875, -90.0628433227539, -85.26368713378906, -80.46453857421875, -75.6653823852539, -70.86622619628906, -66.06707763671875, -61.267921447753906, -56.46876907348633, -51.66961669921875, -46.87046432495117, -42.071311950683594, -37.27215576171875, -32.47300338745117, -27.673851013183594, -22.874696731567383, -18.075542449951172, -13.276390075683594, -8.4772367477417, -3.6780834197998047, 1.1210699081420898, 5.920223236083984, 10.719375610351562, 15.518529891967773, 20.317684173583984, 25.1168212890625, 29.915973663330078, 34.715126037597656, 39.5142822265625, 44.31343460083008, 49.112586975097656, 53.9117431640625, 58.71089553833008, 63.510047912597656, 68.3092041015625, 73.10835266113281, 77.90750885009766, 82.7066650390625, 87.50581359863281, 92.30496978759766, 97.1041259765625, 101.90327453613281, 106.70243072509766, 111.50157928466797, 116.30073547363281, 121.09988403320312, 125.89904022216797, 130.6981964111328, 135.49734497070312, 140.2965087890625, 145.0956573486328, 149.8948211669922, 154.6939697265625, 159.4931182861328, 164.29226684570312, 169.0914306640625, 173.8905792236328, 178.68972778320312]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 13.0, 5.0, 11.0, 9.0, 11.0, 12.0, 11.0, 19.0, 21.0, 14.0, 25.0, 19.0, 20.0, 24.0, 32.0, 42.0, 55.0, 59.0, 65.0, 66.0, 58.0, 51.0, 41.0, 26.0, 28.0, 37.0, 21.0, 19.0, 24.0, 21.0, 14.0, 15.0, 21.0, 15.0, 13.0, 6.0, 5.0, 7.0, 13.0, 10.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-62.65190887451172, -60.691123962402344, -58.730342864990234, -56.76955795288086, -54.80877685546875, -52.847991943359375, -50.88720703125, -48.926422119140625, -46.965641021728516, -45.00485610961914, -43.04407501220703, -41.083290100097656, -39.12250518798828, -37.16172409057617, -35.2009391784668, -33.24015808105469, -31.279373168945312, -29.31859016418457, -27.357807159423828, -25.397022247314453, -23.43623924255371, -21.47545623779297, -19.514671325683594, -17.55388832092285, -15.59310531616211, -13.632322311401367, -11.671538352966309, -9.71075439453125, -7.749971389770508, -5.789188385009766, -3.828404426574707, -1.8676204681396484, 0.09316253662109375, 2.053946018218994, 4.0147294998168945, 5.975512981414795, 7.936296463012695, 9.897079467773438, 11.857863426208496, 13.818647384643555, 15.779430389404297, 17.74021339416504, 19.70099639892578, 21.661781311035156, 23.6225643157959, 25.58334732055664, 27.544132232666016, 29.504915237426758, 31.4656982421875, 33.426483154296875, 35.387264251708984, 37.34804916381836, 39.30883026123047, 41.269615173339844, 43.23040008544922, 45.191184997558594, 47.1519660949707, 49.11275100708008, 51.07353210449219, 53.03431701660156, 54.99510192871094, 56.95588302612305, 58.91666793823242, 60.87744903564453, 62.838233947753906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 12.0, 33.0, 38.0, 59.0, 98.0, 154.0, 242.0, 396.0, 598.0, 1149.0, 2162.0, 4373.0, 10423.0, 31826.0, 173013.0, 1872332.0, 1873943.0, 173458.0, 30872.0, 10036.0, 4199.0, 2023.0, 1079.0, 671.0, 416.0, 234.0, 141.0, 85.0, 61.0, 37.0, 26.0, 21.0, 16.0, 15.0, 8.0, 3.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.65338134765625, -6.4239501953125, -6.19451904296875, -5.965087890625, -5.73565673828125, -5.5062255859375, -5.27679443359375, -5.04736328125, -4.81793212890625, -4.5885009765625, -4.35906982421875, -4.129638671875, -3.90020751953125, -3.6707763671875, -3.44134521484375, -3.2119140625, -2.98248291015625, -2.7530517578125, -2.52362060546875, -2.294189453125, -2.06475830078125, -1.8353271484375, -1.60589599609375, -1.37646484375, -1.14703369140625, -0.9176025390625, -0.68817138671875, -0.458740234375, -0.22930908203125, 0.0001220703125, 0.22955322265625, 0.458984375, 0.68841552734375, 0.9178466796875, 1.14727783203125, 1.376708984375, 1.60614013671875, 1.8355712890625, 2.06500244140625, 2.29443359375, 2.52386474609375, 2.7532958984375, 2.98272705078125, 3.212158203125, 3.44158935546875, 3.6710205078125, 3.90045166015625, 4.1298828125, 4.35931396484375, 4.5887451171875, 4.81817626953125, 5.047607421875, 5.27703857421875, 5.5064697265625, 5.73590087890625, 5.96533203125, 6.19476318359375, 6.4241943359375, 6.65362548828125, 6.883056640625, 7.11248779296875, 7.3419189453125, 7.57135009765625, 7.80078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 9.0, 12.0, 15.0, 14.0, 20.0, 28.0, 33.0, 30.0, 39.0, 37.0, 50.0, 69.0, 72.0, 62.0, 59.0, 52.0, 57.0, 55.0, 61.0, 34.0, 41.0, 42.0, 23.0, 20.0, 13.0, 10.0, 14.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.456695556640625, -3.28643798828125, -3.116180419921875, -2.9459228515625, -2.775665283203125, -2.60540771484375, -2.435150146484375, -2.264892578125, -2.094635009765625, -1.92437744140625, -1.754119873046875, -1.5838623046875, -1.413604736328125, -1.24334716796875, -1.073089599609375, -0.90283203125, -0.732574462890625, -0.56231689453125, -0.392059326171875, -0.2218017578125, -0.051544189453125, 0.11871337890625, 0.288970947265625, 0.459228515625, 0.629486083984375, 0.79974365234375, 0.970001220703125, 1.1402587890625, 1.310516357421875, 1.48077392578125, 1.651031494140625, 1.8212890625, 1.991546630859375, 2.16180419921875, 2.332061767578125, 2.5023193359375, 2.672576904296875, 2.84283447265625, 3.013092041015625, 3.183349609375, 3.353607177734375, 3.52386474609375, 3.694122314453125, 3.8643798828125, 4.034637451171875, 4.20489501953125, 4.375152587890625, 4.54541015625, 4.715667724609375, 4.88592529296875, 5.056182861328125, 5.2264404296875, 5.396697998046875, 5.56695556640625, 5.737213134765625, 5.907470703125, 6.077728271484375, 6.24798583984375, 6.418243408203125, 6.5885009765625, 6.758758544921875, 6.92901611328125, 7.099273681640625, 7.26953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 9.0, 17.0, 20.0, 27.0, 49.0, 57.0, 91.0, 97.0, 152.0, 265.0, 419.0, 744.0, 1509.0, 3921.0, 14466.0, 97647.0, 3298375.0, 720601.0, 42021.0, 8362.0, 2613.0, 1165.0, 579.0, 339.0, 216.0, 159.0, 92.0, 75.0, 48.0, 38.0, 27.0, 23.0, 12.0, 7.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-13.9296875, -13.477294921875, -13.02490234375, -12.572509765625, -12.1201171875, -11.667724609375, -11.21533203125, -10.762939453125, -10.310546875, -9.858154296875, -9.40576171875, -8.953369140625, -8.5009765625, -8.048583984375, -7.59619140625, -7.143798828125, -6.69140625, -6.239013671875, -5.78662109375, -5.334228515625, -4.8818359375, -4.429443359375, -3.97705078125, -3.524658203125, -3.072265625, -2.619873046875, -2.16748046875, -1.715087890625, -1.2626953125, -0.810302734375, -0.35791015625, 0.094482421875, 0.546875, 0.999267578125, 1.45166015625, 1.904052734375, 2.3564453125, 2.808837890625, 3.26123046875, 3.713623046875, 4.166015625, 4.618408203125, 5.07080078125, 5.523193359375, 5.9755859375, 6.427978515625, 6.88037109375, 7.332763671875, 7.78515625, 8.237548828125, 8.68994140625, 9.142333984375, 9.5947265625, 10.047119140625, 10.49951171875, 10.951904296875, 11.404296875, 11.856689453125, 12.30908203125, 12.761474609375, 13.2138671875, 13.666259765625, 14.11865234375, 14.571044921875, 15.0234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 12.0, 22.0, 26.0, 56.0, 93.0, 216.0, 454.0, 1086.0, 1052.0, 503.0, 213.0, 108.0, 71.0, 47.0, 32.0, 22.0, 16.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.469970703125, -15.97119140625, -15.472412109375, -14.9736328125, -14.474853515625, -13.97607421875, -13.477294921875, -12.978515625, -12.479736328125, -11.98095703125, -11.482177734375, -10.9833984375, -10.484619140625, -9.98583984375, -9.487060546875, -8.98828125, -8.489501953125, -7.99072265625, -7.491943359375, -6.9931640625, -6.494384765625, -5.99560546875, -5.496826171875, -4.998046875, -4.499267578125, -4.00048828125, -3.501708984375, -3.0029296875, -2.504150390625, -2.00537109375, -1.506591796875, -1.0078125, -0.509033203125, -0.01025390625, 0.488525390625, 0.9873046875, 1.486083984375, 1.98486328125, 2.483642578125, 2.982421875, 3.481201171875, 3.97998046875, 4.478759765625, 4.9775390625, 5.476318359375, 5.97509765625, 6.473876953125, 6.97265625, 7.471435546875, 7.97021484375, 8.468994140625, 8.9677734375, 9.466552734375, 9.96533203125, 10.464111328125, 10.962890625, 11.461669921875, 11.96044921875, 12.459228515625, 12.9580078125, 13.456787109375, 13.95556640625, 14.454345703125, 14.953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 14.0, 53.0, 133.0, 290.0, 295.0, 129.0, 35.0, 28.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.38079833984375, -253.84283447265625, -247.30487060546875, -240.76690673828125, -234.2289581298828, -227.6909942626953, -221.1530303955078, -214.6150665283203, -208.07711791992188, -201.53915405273438, -195.00119018554688, -188.46322631835938, -181.92527770996094, -175.38731384277344, -168.84934997558594, -162.31138610839844, -155.77342224121094, -149.23545837402344, -142.69749450683594, -136.1595458984375, -129.62158203125, -123.0836181640625, -116.545654296875, -110.0076904296875, -103.46973419189453, -96.93177032470703, -90.39381408691406, -83.85585021972656, -77.31788635253906, -70.7799301147461, -64.2419662475586, -57.70400619506836, -51.166046142578125, -44.62808609008789, -38.090126037597656, -31.552162170410156, -25.014202117919922, -18.476242065429688, -11.938278198242188, -5.400318145751953, 1.1376419067382812, 7.675602912902832, 14.213563919067383, 20.75152587890625, 27.289485931396484, 33.82744598388672, 40.36540985107422, 46.90336990356445, 53.44132995605469, 59.97929000854492, 66.51725006103516, 73.05521392822266, 79.59317016601562, 86.13113403320312, 92.66909790039062, 99.20706176757812, 105.7450180053711, 112.2829818725586, 118.82093811035156, 125.35890197753906, 131.89686584472656, 138.434814453125, 144.9727783203125, 151.5107421875, 158.0487060546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 8.0, 13.0, 16.0, 28.0, 21.0, 43.0, 39.0, 37.0, 53.0, 56.0, 43.0, 58.0, 65.0, 74.0, 55.0, 59.0, 47.0, 54.0, 41.0, 37.0, 25.0, 25.0, 17.0, 11.0, 24.0, 8.0, 7.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.72247314453125, -62.74386978149414, -60.7652702331543, -58.78666687011719, -56.808067321777344, -54.829463958740234, -52.85086441040039, -50.87226104736328, -48.89366149902344, -46.91505813598633, -44.936458587646484, -42.957855224609375, -40.97925567626953, -39.00065231323242, -37.02205276489258, -35.04344940185547, -33.064849853515625, -31.08624839782715, -29.107646942138672, -27.129045486450195, -25.15044403076172, -23.17184066772461, -21.193241119384766, -19.214637756347656, -17.236034393310547, -15.25743293762207, -13.278831481933594, -11.300230026245117, -9.32162857055664, -7.343026161193848, -5.364424705505371, -3.3858232498168945, -1.4072227478027344, 0.5713788270950317, 2.549980401992798, 4.5285820960998535, 6.50718355178833, 8.485785484313965, 10.464386940002441, 12.442988395690918, 14.421589851379395, 16.400192260742188, 18.378793716430664, 20.35739517211914, 22.335996627807617, 24.314598083496094, 26.29319953918457, 28.271800994873047, 30.250402450561523, 32.22900390625, 34.20760726928711, 36.18620681762695, 38.16481018066406, 40.143409729003906, 42.122013092041016, 44.10061264038086, 46.07921600341797, 48.05781936645508, 50.03641891479492, 52.01502227783203, 53.993621826171875, 55.972225189208984, 57.95082473754883, 59.92942810058594, 61.90802764892578]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 12.0, 14.0, 17.0, 25.0, 40.0, 84.0, 105.0, 153.0, 275.0, 475.0, 816.0, 1438.0, 2690.0, 5161.0, 11184.0, 25426.0, 63562.0, 159644.0, 308289.0, 265548.0, 118995.0, 46819.0, 19615.0, 8846.0, 4266.0, 2147.0, 1209.0, 679.0, 377.0, 259.0, 142.0, 89.0, 67.0, 31.0, 20.0, 9.0, 10.0, 5.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.49554443359375, -6.3035888671875, -6.11163330078125, -5.919677734375, -5.72772216796875, -5.5357666015625, -5.34381103515625, -5.15185546875, -4.95989990234375, -4.7679443359375, -4.57598876953125, -4.384033203125, -4.19207763671875, -4.0001220703125, -3.80816650390625, -3.6162109375, -3.42425537109375, -3.2322998046875, -3.04034423828125, -2.848388671875, -2.65643310546875, -2.4644775390625, -2.27252197265625, -2.08056640625, -1.88861083984375, -1.6966552734375, -1.50469970703125, -1.312744140625, -1.12078857421875, -0.9288330078125, -0.73687744140625, -0.544921875, -0.35296630859375, -0.1610107421875, 0.03094482421875, 0.222900390625, 0.41485595703125, 0.6068115234375, 0.79876708984375, 0.99072265625, 1.18267822265625, 1.3746337890625, 1.56658935546875, 1.758544921875, 1.95050048828125, 2.1424560546875, 2.33441162109375, 2.5263671875, 2.71832275390625, 2.9102783203125, 3.10223388671875, 3.294189453125, 3.48614501953125, 3.6781005859375, 3.87005615234375, 4.06201171875, 4.25396728515625, 4.4459228515625, 4.63787841796875, 4.829833984375, 5.02178955078125, 5.2137451171875, 5.40570068359375, 5.59765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 12.0, 11.0, 10.0, 20.0, 25.0, 22.0, 37.0, 43.0, 49.0, 41.0, 55.0, 68.0, 61.0, 53.0, 61.0, 50.0, 64.0, 46.0, 44.0, 46.0, 26.0, 31.0, 30.0, 25.0, 17.0, 14.0, 8.0, 7.0, 3.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.87664794921875, -3.6986083984375, -3.52056884765625, -3.342529296875, -3.16448974609375, -2.9864501953125, -2.80841064453125, -2.63037109375, -2.45233154296875, -2.2742919921875, -2.09625244140625, -1.918212890625, -1.74017333984375, -1.5621337890625, -1.38409423828125, -1.2060546875, -1.02801513671875, -0.8499755859375, -0.67193603515625, -0.493896484375, -0.31585693359375, -0.1378173828125, 0.04022216796875, 0.21826171875, 0.39630126953125, 0.5743408203125, 0.75238037109375, 0.930419921875, 1.10845947265625, 1.2864990234375, 1.46453857421875, 1.642578125, 1.82061767578125, 1.9986572265625, 2.17669677734375, 2.354736328125, 2.53277587890625, 2.7108154296875, 2.88885498046875, 3.06689453125, 3.24493408203125, 3.4229736328125, 3.60101318359375, 3.779052734375, 3.95709228515625, 4.1351318359375, 4.31317138671875, 4.4912109375, 4.66925048828125, 4.8472900390625, 5.02532958984375, 5.203369140625, 5.38140869140625, 5.5594482421875, 5.73748779296875, 5.91552734375, 6.09356689453125, 6.2716064453125, 6.44964599609375, 6.627685546875, 6.80572509765625, 6.9837646484375, 7.16180419921875, 7.33984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 4.0, 4.0, 6.0, 11.0, 16.0, 16.0, 36.0, 38.0, 56.0, 81.0, 133.0, 183.0, 282.0, 511.0, 950.0, 2030.0, 4527.0, 13564.0, 58104.0, 343150.0, 531231.0, 68851.0, 15140.0, 5099.0, 2013.0, 1046.0, 581.0, 324.0, 167.0, 126.0, 69.0, 63.0, 43.0, 25.0, 19.0, 9.0, 10.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.59375, -11.2203369140625, -10.846923828125, -10.4735107421875, -10.10009765625, -9.7266845703125, -9.353271484375, -8.9798583984375, -8.6064453125, -8.2330322265625, -7.859619140625, -7.4862060546875, -7.11279296875, -6.7393798828125, -6.365966796875, -5.9925537109375, -5.619140625, -5.2457275390625, -4.872314453125, -4.4989013671875, -4.12548828125, -3.7520751953125, -3.378662109375, -3.0052490234375, -2.6318359375, -2.2584228515625, -1.885009765625, -1.5115966796875, -1.13818359375, -0.7647705078125, -0.391357421875, -0.0179443359375, 0.35546875, 0.7288818359375, 1.102294921875, 1.4757080078125, 1.84912109375, 2.2225341796875, 2.595947265625, 2.9693603515625, 3.3427734375, 3.7161865234375, 4.089599609375, 4.4630126953125, 4.83642578125, 5.2098388671875, 5.583251953125, 5.9566650390625, 6.330078125, 6.7034912109375, 7.076904296875, 7.4503173828125, 7.82373046875, 8.1971435546875, 8.570556640625, 8.9439697265625, 9.3173828125, 9.6907958984375, 10.064208984375, 10.4376220703125, 10.81103515625, 11.1844482421875, 11.557861328125, 11.9312744140625, 12.3046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 6.0, 14.0, 9.0, 18.0, 25.0, 32.0, 17.0, 37.0, 51.0, 48.0, 46.0, 47.0, 55.0, 44.0, 65.0, 39.0, 54.0, 56.0, 45.0, 41.0, 37.0, 33.0, 27.0, 23.0, 27.0, 20.0, 18.0, 8.0, 15.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.810791015625, -14.26220703125, -13.713623046875, -13.1650390625, -12.616455078125, -12.06787109375, -11.519287109375, -10.970703125, -10.422119140625, -9.87353515625, -9.324951171875, -8.7763671875, -8.227783203125, -7.67919921875, -7.130615234375, -6.58203125, -6.033447265625, -5.48486328125, -4.936279296875, -4.3876953125, -3.839111328125, -3.29052734375, -2.741943359375, -2.193359375, -1.644775390625, -1.09619140625, -0.547607421875, 0.0009765625, 0.549560546875, 1.09814453125, 1.646728515625, 2.1953125, 2.743896484375, 3.29248046875, 3.841064453125, 4.3896484375, 4.938232421875, 5.48681640625, 6.035400390625, 6.583984375, 7.132568359375, 7.68115234375, 8.229736328125, 8.7783203125, 9.326904296875, 9.87548828125, 10.424072265625, 10.97265625, 11.521240234375, 12.06982421875, 12.618408203125, 13.1669921875, 13.715576171875, 14.26416015625, 14.812744140625, 15.361328125, 15.909912109375, 16.45849609375, 17.007080078125, 17.5556640625, 18.104248046875, 18.65283203125, 19.201416015625, 19.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 9.0, 16.0, 27.0, 33.0, 26.0, 49.0, 74.0, 123.0, 215.0, 372.0, 600.0, 940.0, 1687.0, 3246.0, 6638.0, 15152.0, 40602.0, 146984.0, 600957.0, 157592.0, 43136.0, 15715.0, 6759.0, 3314.0, 1720.0, 997.0, 550.0, 369.0, 212.0, 162.0, 83.0, 62.0, 41.0, 28.0, 13.0, 10.0, 3.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.841796875, -2.75164794921875, -2.6614990234375, -2.57135009765625, -2.481201171875, -2.39105224609375, -2.3009033203125, -2.21075439453125, -2.12060546875, -2.03045654296875, -1.9403076171875, -1.85015869140625, -1.760009765625, -1.66986083984375, -1.5797119140625, -1.48956298828125, -1.3994140625, -1.30926513671875, -1.2191162109375, -1.12896728515625, -1.038818359375, -0.94866943359375, -0.8585205078125, -0.76837158203125, -0.67822265625, -0.58807373046875, -0.4979248046875, -0.40777587890625, -0.317626953125, -0.22747802734375, -0.1373291015625, -0.04718017578125, 0.04296875, 0.13311767578125, 0.2232666015625, 0.31341552734375, 0.403564453125, 0.49371337890625, 0.5838623046875, 0.67401123046875, 0.76416015625, 0.85430908203125, 0.9444580078125, 1.03460693359375, 1.124755859375, 1.21490478515625, 1.3050537109375, 1.39520263671875, 1.4853515625, 1.57550048828125, 1.6656494140625, 1.75579833984375, 1.845947265625, 1.93609619140625, 2.0262451171875, 2.11639404296875, 2.20654296875, 2.29669189453125, 2.3868408203125, 2.47698974609375, 2.567138671875, 2.65728759765625, 2.7474365234375, 2.83758544921875, 2.927734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 10.0, 11.0, 22.0, 36.0, 66.0, 209.0, 252.0, 175.0, 78.0, 40.0, 25.0, 10.0, 16.0, 9.0, 4.0, 4.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001651763916015625, -0.00159551203250885, -0.0015392601490020752, -0.0014830082654953003, -0.0014267563819885254, -0.0013705044984817505, -0.0013142526149749756, -0.0012580007314682007, -0.0012017488479614258, -0.0011454969644546509, -0.001089245080947876, -0.001032993197441101, -0.0009767413139343262, -0.0009204894304275513, -0.0008642375469207764, -0.0008079856634140015, -0.0007517337799072266, -0.0006954818964004517, -0.0006392300128936768, -0.0005829781293869019, -0.000526726245880127, -0.00047047436237335205, -0.00041422247886657715, -0.00035797059535980225, -0.00030171871185302734, -0.00024546682834625244, -0.00018921494483947754, -0.00013296306133270264, -7.671117782592773e-05, -2.0459294319152832e-05, 3.579258918762207e-05, 9.204447269439697e-05, 0.00014829635620117188, 0.00020454823970794678, 0.0002608001232147217, 0.0003170520067214966, 0.0003733038902282715, 0.0004295557737350464, 0.0004858076572418213, 0.0005420595407485962, 0.0005983114242553711, 0.000654563307762146, 0.0007108151912689209, 0.0007670670747756958, 0.0008233189582824707, 0.0008795708417892456, 0.0009358227252960205, 0.0009920746088027954, 0.0010483264923095703, 0.0011045783758163452, 0.0011608302593231201, 0.001217082142829895, 0.00127333402633667, 0.0013295859098434448, 0.0013858377933502197, 0.0014420896768569946, 0.0014983415603637695, 0.0015545934438705444, 0.0016108453273773193, 0.0016670972108840942, 0.0017233490943908691, 0.001779600977897644, 0.001835852861404419, 0.0018921047449111938, 0.0019483566284179688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 10.0, 12.0, 15.0, 25.0, 28.0, 40.0, 87.0, 158.0, 275.0, 555.0, 1343.0, 3403.0, 10394.0, 38977.0, 228327.0, 653311.0, 83414.0, 18674.0, 5652.0, 2098.0, 831.0, 437.0, 204.0, 90.0, 64.0, 47.0, 26.0, 12.0, 11.0, 12.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.96484375, -4.831512451171875, -4.69818115234375, -4.564849853515625, -4.4315185546875, -4.298187255859375, -4.16485595703125, -4.031524658203125, -3.898193359375, -3.764862060546875, -3.63153076171875, -3.498199462890625, -3.3648681640625, -3.231536865234375, -3.09820556640625, -2.964874267578125, -2.83154296875, -2.698211669921875, -2.56488037109375, -2.431549072265625, -2.2982177734375, -2.164886474609375, -2.03155517578125, -1.898223876953125, -1.764892578125, -1.631561279296875, -1.49822998046875, -1.364898681640625, -1.2315673828125, -1.098236083984375, -0.96490478515625, -0.831573486328125, -0.6982421875, -0.564910888671875, -0.43157958984375, -0.298248291015625, -0.1649169921875, -0.031585693359375, 0.10174560546875, 0.235076904296875, 0.368408203125, 0.501739501953125, 0.63507080078125, 0.768402099609375, 0.9017333984375, 1.035064697265625, 1.16839599609375, 1.301727294921875, 1.43505859375, 1.568389892578125, 1.70172119140625, 1.835052490234375, 1.9683837890625, 2.101715087890625, 2.23504638671875, 2.368377685546875, 2.501708984375, 2.635040283203125, 2.76837158203125, 2.901702880859375, 3.0350341796875, 3.168365478515625, 3.30169677734375, 3.435028076171875, 3.568359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 12.0, 14.0, 19.0, 17.0, 23.0, 31.0, 46.0, 51.0, 72.0, 79.0, 83.0, 86.0, 95.0, 63.0, 76.0, 43.0, 37.0, 33.0, 26.0, 12.0, 20.0, 6.0, 5.0, 4.0, 2.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.619140625, -3.516143798828125, -3.41314697265625, -3.310150146484375, -3.2071533203125, -3.104156494140625, -3.00115966796875, -2.898162841796875, -2.795166015625, -2.692169189453125, -2.58917236328125, -2.486175537109375, -2.3831787109375, -2.280181884765625, -2.17718505859375, -2.074188232421875, -1.97119140625, -1.868194580078125, -1.76519775390625, -1.662200927734375, -1.5592041015625, -1.456207275390625, -1.35321044921875, -1.250213623046875, -1.147216796875, -1.044219970703125, -0.94122314453125, -0.838226318359375, -0.7352294921875, -0.632232666015625, -0.52923583984375, -0.426239013671875, -0.3232421875, -0.220245361328125, -0.11724853515625, -0.014251708984375, 0.0887451171875, 0.191741943359375, 0.29473876953125, 0.397735595703125, 0.500732421875, 0.603729248046875, 0.70672607421875, 0.809722900390625, 0.9127197265625, 1.015716552734375, 1.11871337890625, 1.221710205078125, 1.32470703125, 1.427703857421875, 1.53070068359375, 1.633697509765625, 1.7366943359375, 1.839691162109375, 1.94268798828125, 2.045684814453125, 2.148681640625, 2.251678466796875, 2.35467529296875, 2.457672119140625, 2.5606689453125, 2.663665771484375, 2.76666259765625, 2.869659423828125, 2.97265625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 20.0, 41.0, 71.0, 142.0, 258.0, 238.0, 112.0, 58.0, 24.0, 11.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.380126953125, -96.49137115478516, -92.60261535644531, -88.71385192871094, -84.8250961303711, -80.93634033203125, -77.0475845336914, -73.15882873535156, -69.27006530761719, -65.38130950927734, -61.492549896240234, -57.60379409790039, -53.71503448486328, -49.82627868652344, -45.937522888183594, -42.048763275146484, -38.16000747680664, -34.2712516784668, -30.382492065429688, -26.493736267089844, -22.604976654052734, -18.71622085571289, -14.827463150024414, -10.938705444335938, -7.049947738647461, -3.1611902713775635, 0.727567195892334, 4.616324424743652, 8.505082130432129, 12.393838882446289, 16.282596588134766, 20.171354293823242, 24.06011199951172, 27.948869705200195, 31.837627410888672, 35.726383209228516, 39.615142822265625, 43.50389862060547, 47.39265441894531, 51.28141403198242, 55.17017364501953, 59.058929443359375, 62.947689056396484, 66.8364486694336, 70.72520446777344, 74.61396026611328, 78.50271606445312, 82.3914794921875, 86.28022766113281, 90.16898345947266, 94.0577392578125, 97.94650268554688, 101.83525848388672, 105.72401428222656, 109.6127700805664, 113.50152587890625, 117.39028930664062, 121.27904510498047, 125.16780090332031, 129.0565643310547, 132.9453125, 136.83407592773438, 140.72283935546875, 144.61158752441406, 148.50035095214844]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 2.0, 6.0, 6.0, 5.0, 10.0, 10.0, 10.0, 9.0, 18.0, 19.0, 21.0, 26.0, 25.0, 21.0, 37.0, 27.0, 38.0, 33.0, 53.0, 60.0, 76.0, 64.0, 50.0, 39.0, 42.0, 33.0, 26.0, 37.0, 34.0, 23.0, 14.0, 15.0, 19.0, 19.0, 15.0, 9.0, 13.0, 5.0, 5.0, 5.0, 1.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.46983337402344, -52.68632888793945, -50.90282440185547, -49.11932373046875, -47.335819244384766, -45.55231475830078, -43.7688102722168, -41.98530578613281, -40.20180130004883, -38.418296813964844, -36.63479232788086, -34.851287841796875, -33.067787170410156, -31.284282684326172, -29.500778198242188, -27.717273712158203, -25.93377113342285, -24.150266647338867, -22.366764068603516, -20.58325958251953, -18.799755096435547, -17.016250610351562, -15.232748031616211, -13.449243545532227, -11.665740013122559, -9.88223648071289, -8.098731994628906, -6.315228462219238, -4.531724452972412, -2.748220443725586, -0.964716911315918, 0.8187875747680664, 2.6022911071777344, 4.3857951164245605, 6.169299125671387, 7.952802658081055, 9.736307144165039, 11.519810676574707, 13.303314208984375, 15.08681869506836, 16.870323181152344, 18.653827667236328, 20.43733024597168, 22.220834732055664, 24.00433921813965, 25.787841796875, 27.571346282958984, 29.35485076904297, 31.13835334777832, 32.92185592651367, 34.705360412597656, 36.48886489868164, 38.272369384765625, 40.05587387084961, 41.839378356933594, 43.62287902832031, 45.4063835144043, 47.18988800048828, 48.973392486572266, 50.75689697265625, 52.54039764404297, 54.32390213012695, 56.10740661621094, 57.89091110229492, 59.674415588378906]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 13.0, 8.0, 21.0, 14.0, 41.0, 63.0, 112.0, 145.0, 258.0, 432.0, 832.0, 1538.0, 2990.0, 6275.0, 15362.0, 51537.0, 295141.0, 1901606.0, 1616351.0, 234322.0, 42923.0, 12991.0, 5324.0, 2586.0, 1357.0, 795.0, 465.0, 285.0, 183.0, 97.0, 65.0, 47.0, 30.0, 21.0, 20.0, 6.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.703125, -5.518798828125, -5.33447265625, -5.150146484375, -4.9658203125, -4.781494140625, -4.59716796875, -4.412841796875, -4.228515625, -4.044189453125, -3.85986328125, -3.675537109375, -3.4912109375, -3.306884765625, -3.12255859375, -2.938232421875, -2.75390625, -2.569580078125, -2.38525390625, -2.200927734375, -2.0166015625, -1.832275390625, -1.64794921875, -1.463623046875, -1.279296875, -1.094970703125, -0.91064453125, -0.726318359375, -0.5419921875, -0.357666015625, -0.17333984375, 0.010986328125, 0.1953125, 0.379638671875, 0.56396484375, 0.748291015625, 0.9326171875, 1.116943359375, 1.30126953125, 1.485595703125, 1.669921875, 1.854248046875, 2.03857421875, 2.222900390625, 2.4072265625, 2.591552734375, 2.77587890625, 2.960205078125, 3.14453125, 3.328857421875, 3.51318359375, 3.697509765625, 3.8818359375, 4.066162109375, 4.25048828125, 4.434814453125, 4.619140625, 4.803466796875, 4.98779296875, 5.172119140625, 5.3564453125, 5.540771484375, 5.72509765625, 5.909423828125, 6.09375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 9.0, 9.0, 8.0, 12.0, 22.0, 23.0, 29.0, 43.0, 42.0, 37.0, 39.0, 66.0, 70.0, 75.0, 59.0, 64.0, 49.0, 55.0, 52.0, 45.0, 50.0, 34.0, 30.0, 17.0, 19.0, 8.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.98046875, -3.803466796875, -3.62646484375, -3.449462890625, -3.2724609375, -3.095458984375, -2.91845703125, -2.741455078125, -2.564453125, -2.387451171875, -2.21044921875, -2.033447265625, -1.8564453125, -1.679443359375, -1.50244140625, -1.325439453125, -1.1484375, -0.971435546875, -0.79443359375, -0.617431640625, -0.4404296875, -0.263427734375, -0.08642578125, 0.090576171875, 0.267578125, 0.444580078125, 0.62158203125, 0.798583984375, 0.9755859375, 1.152587890625, 1.32958984375, 1.506591796875, 1.68359375, 1.860595703125, 2.03759765625, 2.214599609375, 2.3916015625, 2.568603515625, 2.74560546875, 2.922607421875, 3.099609375, 3.276611328125, 3.45361328125, 3.630615234375, 3.8076171875, 3.984619140625, 4.16162109375, 4.338623046875, 4.515625, 4.692626953125, 4.86962890625, 5.046630859375, 5.2236328125, 5.400634765625, 5.57763671875, 5.754638671875, 5.931640625, 6.108642578125, 6.28564453125, 6.462646484375, 6.6396484375, 6.816650390625, 6.99365234375, 7.170654296875, 7.34765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 6.0, 17.0, 42.0, 52.0, 101.0, 160.0, 253.0, 596.0, 3684.0, 1480916.0, 2703056.0, 4164.0, 621.0, 265.0, 133.0, 85.0, 55.0, 30.0, 21.0, 10.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.58935546875, -34.2724609375, -32.95556640625, -31.638671875, -30.32177734375, -29.0048828125, -27.68798828125, -26.37109375, -25.05419921875, -23.7373046875, -22.42041015625, -21.103515625, -19.78662109375, -18.4697265625, -17.15283203125, -15.8359375, -14.51904296875, -13.2021484375, -11.88525390625, -10.568359375, -9.25146484375, -7.9345703125, -6.61767578125, -5.30078125, -3.98388671875, -2.6669921875, -1.35009765625, -0.033203125, 1.28369140625, 2.6005859375, 3.91748046875, 5.234375, 6.55126953125, 7.8681640625, 9.18505859375, 10.501953125, 11.81884765625, 13.1357421875, 14.45263671875, 15.76953125, 17.08642578125, 18.4033203125, 19.72021484375, 21.037109375, 22.35400390625, 23.6708984375, 24.98779296875, 26.3046875, 27.62158203125, 28.9384765625, 30.25537109375, 31.572265625, 32.88916015625, 34.2060546875, 35.52294921875, 36.83984375, 38.15673828125, 39.4736328125, 40.79052734375, 42.107421875, 43.42431640625, 44.7412109375, 46.05810546875, 47.375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 15.0, 34.0, 80.0, 196.0, 685.0, 1820.0, 860.0, 223.0, 85.0, 43.0, 14.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -20.119140625, -19.30078125, -18.482421875, -17.6640625, -16.845703125, -16.02734375, -15.208984375, -14.390625, -13.572265625, -12.75390625, -11.935546875, -11.1171875, -10.298828125, -9.48046875, -8.662109375, -7.84375, -7.025390625, -6.20703125, -5.388671875, -4.5703125, -3.751953125, -2.93359375, -2.115234375, -1.296875, -0.478515625, 0.33984375, 1.158203125, 1.9765625, 2.794921875, 3.61328125, 4.431640625, 5.25, 6.068359375, 6.88671875, 7.705078125, 8.5234375, 9.341796875, 10.16015625, 10.978515625, 11.796875, 12.615234375, 13.43359375, 14.251953125, 15.0703125, 15.888671875, 16.70703125, 17.525390625, 18.34375, 19.162109375, 19.98046875, 20.798828125, 21.6171875, 22.435546875, 23.25390625, 24.072265625, 24.890625, 25.708984375, 26.52734375, 27.345703125, 28.1640625, 28.982421875, 29.80078125, 30.619140625, 31.4375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 21.0, 34.0, 115.0, 236.0, 320.0, 157.0, 61.0, 29.0, 11.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.21636962890625, -270.2434387207031, -264.2705078125, -258.2975769042969, -252.32464599609375, -246.3517303466797, -240.37879943847656, -234.40586853027344, -228.4329376220703, -222.4600067138672, -216.48707580566406, -210.51414489746094, -204.54122924804688, -198.56829833984375, -192.59536743164062, -186.6224365234375, -180.64950561523438, -174.67657470703125, -168.70364379882812, -162.730712890625, -156.75778198242188, -150.7848663330078, -144.8119354248047, -138.83900451660156, -132.86607360839844, -126.89314270019531, -120.92021179199219, -114.9472885131836, -108.97435760498047, -103.00142669677734, -97.02850341796875, -91.05557250976562, -85.08262634277344, -79.10969543457031, -73.13676452636719, -67.1638412475586, -61.19091033935547, -55.217979431152344, -49.245052337646484, -43.272125244140625, -37.2991943359375, -31.326265335083008, -25.353336334228516, -19.380407333374023, -13.407478332519531, -7.434549331665039, -1.4616203308105469, 4.5113067626953125, 10.484237670898438, 16.45716667175293, 22.430095672607422, 28.403024673461914, 34.375953674316406, 40.34888458251953, 46.32181167602539, 52.29473876953125, 58.267669677734375, 64.2406005859375, 70.21353149414062, 76.18645477294922, 82.15938568115234, 88.13231658935547, 94.10523986816406, 100.07817077636719, 106.05110168457031]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 15.0, 17.0, 23.0, 23.0, 25.0, 29.0, 40.0, 35.0, 40.0, 38.0, 39.0, 39.0, 35.0, 48.0, 54.0, 44.0, 39.0, 43.0, 38.0, 39.0, 44.0, 38.0, 14.0, 22.0, 20.0, 30.0, 12.0, 12.0, 21.0, 8.0, 7.0, 3.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-43.81529998779297, -42.46793746948242, -41.120574951171875, -39.773216247558594, -38.42585372924805, -37.0784912109375, -35.73113250732422, -34.38376998901367, -33.036407470703125, -31.689044952392578, -30.341684341430664, -28.99432373046875, -27.646961212158203, -26.299598693847656, -24.952238082885742, -23.604877471923828, -22.25751495361328, -20.910152435302734, -19.56279182434082, -18.215431213378906, -16.86806869506836, -15.520707130432129, -14.173345565795898, -12.825984001159668, -11.478622436523438, -10.131260871887207, -8.783899307250977, -7.436537742614746, -6.089176177978516, -4.741814613342285, -3.3944530487060547, -2.047091484069824, -0.6997337341308594, 0.6476278305053711, 1.9949893951416016, 3.342350959777832, 4.6897125244140625, 6.037074089050293, 7.384435653686523, 8.731797218322754, 10.079158782958984, 11.426520347595215, 12.773881912231445, 14.121243476867676, 15.468605041503906, 16.815967559814453, 18.163328170776367, 19.51068878173828, 20.858051300048828, 22.205413818359375, 23.55277442932129, 24.900135040283203, 26.24749755859375, 27.594860076904297, 28.94222068786621, 30.289581298828125, 31.636943817138672, 32.98430633544922, 34.3316650390625, 35.67902755737305, 37.026390075683594, 38.37375259399414, 39.72111511230469, 41.06847381591797, 42.415836334228516]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 18.0, 17.0, 35.0, 45.0, 67.0, 121.0, 208.0, 386.0, 786.0, 1522.0, 3080.0, 6667.0, 15850.0, 41400.0, 119087.0, 320268.0, 334486.0, 129602.0, 44218.0, 16983.0, 7057.0, 3272.0, 1545.0, 842.0, 409.0, 235.0, 140.0, 77.0, 38.0, 38.0, 14.0, 11.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.07440185546875, -7.8675537109375, -7.66070556640625, -7.453857421875, -7.24700927734375, -7.0401611328125, -6.83331298828125, -6.62646484375, -6.41961669921875, -6.2127685546875, -6.00592041015625, -5.799072265625, -5.59222412109375, -5.3853759765625, -5.17852783203125, -4.9716796875, -4.76483154296875, -4.5579833984375, -4.35113525390625, -4.144287109375, -3.93743896484375, -3.7305908203125, -3.52374267578125, -3.31689453125, -3.11004638671875, -2.9031982421875, -2.69635009765625, -2.489501953125, -2.28265380859375, -2.0758056640625, -1.86895751953125, -1.662109375, -1.45526123046875, -1.2484130859375, -1.04156494140625, -0.834716796875, -0.62786865234375, -0.4210205078125, -0.21417236328125, -0.00732421875, 0.19952392578125, 0.4063720703125, 0.61322021484375, 0.820068359375, 1.02691650390625, 1.2337646484375, 1.44061279296875, 1.6474609375, 1.85430908203125, 2.0611572265625, 2.26800537109375, 2.474853515625, 2.68170166015625, 2.8885498046875, 3.09539794921875, 3.30224609375, 3.50909423828125, 3.7159423828125, 3.92279052734375, 4.129638671875, 4.33648681640625, 4.5433349609375, 4.75018310546875, 4.95703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 1.0, 5.0, 12.0, 13.0, 16.0, 20.0, 22.0, 36.0, 33.0, 34.0, 48.0, 52.0, 50.0, 53.0, 66.0, 54.0, 56.0, 61.0, 55.0, 49.0, 51.0, 44.0, 35.0, 26.0, 21.0, 24.0, 18.0, 10.0, 7.0, 6.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.13818359375, -3.9560546875, -3.77392578125, -3.591796875, -3.40966796875, -3.2275390625, -3.04541015625, -2.86328125, -2.68115234375, -2.4990234375, -2.31689453125, -2.134765625, -1.95263671875, -1.7705078125, -1.58837890625, -1.40625, -1.22412109375, -1.0419921875, -0.85986328125, -0.677734375, -0.49560546875, -0.3134765625, -0.13134765625, 0.05078125, 0.23291015625, 0.4150390625, 0.59716796875, 0.779296875, 0.96142578125, 1.1435546875, 1.32568359375, 1.5078125, 1.68994140625, 1.8720703125, 2.05419921875, 2.236328125, 2.41845703125, 2.6005859375, 2.78271484375, 2.96484375, 3.14697265625, 3.3291015625, 3.51123046875, 3.693359375, 3.87548828125, 4.0576171875, 4.23974609375, 4.421875, 4.60400390625, 4.7861328125, 4.96826171875, 5.150390625, 5.33251953125, 5.5146484375, 5.69677734375, 5.87890625, 6.06103515625, 6.2431640625, 6.42529296875, 6.607421875, 6.78955078125, 6.9716796875, 7.15380859375, 7.3359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 4.0, 9.0, 14.0, 17.0, 33.0, 33.0, 37.0, 58.0, 56.0, 83.0, 123.0, 180.0, 254.0, 301.0, 537.0, 878.0, 1737.0, 3837.0, 11355.0, 42307.0, 222247.0, 636035.0, 94963.0, 21430.0, 6411.0, 2436.0, 1160.0, 617.0, 404.0, 257.0, 179.0, 126.0, 103.0, 68.0, 65.0, 43.0, 37.0, 26.0, 19.0, 14.0, 15.0, 10.0, 11.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.994140625, -8.67578125, -8.357421875, -8.0390625, -7.720703125, -7.40234375, -7.083984375, -6.765625, -6.447265625, -6.12890625, -5.810546875, -5.4921875, -5.173828125, -4.85546875, -4.537109375, -4.21875, -3.900390625, -3.58203125, -3.263671875, -2.9453125, -2.626953125, -2.30859375, -1.990234375, -1.671875, -1.353515625, -1.03515625, -0.716796875, -0.3984375, -0.080078125, 0.23828125, 0.556640625, 0.875, 1.193359375, 1.51171875, 1.830078125, 2.1484375, 2.466796875, 2.78515625, 3.103515625, 3.421875, 3.740234375, 4.05859375, 4.376953125, 4.6953125, 5.013671875, 5.33203125, 5.650390625, 5.96875, 6.287109375, 6.60546875, 6.923828125, 7.2421875, 7.560546875, 7.87890625, 8.197265625, 8.515625, 8.833984375, 9.15234375, 9.470703125, 9.7890625, 10.107421875, 10.42578125, 10.744140625, 11.0625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 10.0, 6.0, 6.0, 12.0, 10.0, 12.0, 11.0, 23.0, 14.0, 8.0, 32.0, 33.0, 29.0, 37.0, 37.0, 44.0, 44.0, 42.0, 49.0, 49.0, 51.0, 52.0, 50.0, 46.0, 39.0, 37.0, 32.0, 18.0, 20.0, 29.0, 18.0, 10.0, 22.0, 8.0, 11.0, 8.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.8515625, -14.3704833984375, -13.889404296875, -13.4083251953125, -12.92724609375, -12.4461669921875, -11.965087890625, -11.4840087890625, -11.0029296875, -10.5218505859375, -10.040771484375, -9.5596923828125, -9.07861328125, -8.5975341796875, -8.116455078125, -7.6353759765625, -7.154296875, -6.6732177734375, -6.192138671875, -5.7110595703125, -5.22998046875, -4.7489013671875, -4.267822265625, -3.7867431640625, -3.3056640625, -2.8245849609375, -2.343505859375, -1.8624267578125, -1.38134765625, -0.9002685546875, -0.419189453125, 0.0618896484375, 0.54296875, 1.0240478515625, 1.505126953125, 1.9862060546875, 2.46728515625, 2.9483642578125, 3.429443359375, 3.9105224609375, 4.3916015625, 4.8726806640625, 5.353759765625, 5.8348388671875, 6.31591796875, 6.7969970703125, 7.278076171875, 7.7591552734375, 8.240234375, 8.7213134765625, 9.202392578125, 9.6834716796875, 10.16455078125, 10.6456298828125, 11.126708984375, 11.6077880859375, 12.0888671875, 12.5699462890625, 13.051025390625, 13.5321044921875, 14.01318359375, 14.4942626953125, 14.975341796875, 15.4564208984375, 15.9375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 9.0, 16.0, 15.0, 32.0, 35.0, 46.0, 85.0, 134.0, 192.0, 387.0, 612.0, 1039.0, 2112.0, 4225.0, 9238.0, 22809.0, 65131.0, 279464.0, 540697.0, 76211.0, 25850.0, 10519.0, 4665.0, 2164.0, 1135.0, 680.0, 357.0, 228.0, 144.0, 84.0, 69.0, 47.0, 23.0, 14.0, 16.0, 10.0, 16.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8603515625, -1.7963409423828125, -1.732330322265625, -1.6683197021484375, -1.60430908203125, -1.5402984619140625, -1.476287841796875, -1.4122772216796875, -1.3482666015625, -1.2842559814453125, -1.220245361328125, -1.1562347412109375, -1.09222412109375, -1.0282135009765625, -0.964202880859375, -0.9001922607421875, -0.836181640625, -0.7721710205078125, -0.708160400390625, -0.6441497802734375, -0.58013916015625, -0.5161285400390625, -0.452117919921875, -0.3881072998046875, -0.3240966796875, -0.2600860595703125, -0.196075439453125, -0.1320648193359375, -0.06805419921875, -0.0040435791015625, 0.059967041015625, 0.1239776611328125, 0.18798828125, 0.2519989013671875, 0.316009521484375, 0.3800201416015625, 0.44403076171875, 0.5080413818359375, 0.572052001953125, 0.6360626220703125, 0.7000732421875, 0.7640838623046875, 0.828094482421875, 0.8921051025390625, 0.95611572265625, 1.0201263427734375, 1.084136962890625, 1.1481475830078125, 1.212158203125, 1.2761688232421875, 1.340179443359375, 1.4041900634765625, 1.46820068359375, 1.5322113037109375, 1.596221923828125, 1.6602325439453125, 1.7242431640625, 1.7882537841796875, 1.852264404296875, 1.9162750244140625, 1.98028564453125, 2.0442962646484375, 2.108306884765625, 2.1723175048828125, 2.236328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 13.0, 6.0, 17.0, 35.0, 36.0, 56.0, 105.0, 184.0, 195.0, 111.0, 71.0, 35.0, 30.0, 16.0, 7.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0012502670288085938, -0.001214638352394104, -0.0011790096759796143, -0.0011433809995651245, -0.0011077523231506348, -0.001072123646736145, -0.0010364949703216553, -0.0010008662939071655, -0.0009652376174926758, -0.000929608941078186, -0.0008939802646636963, -0.0008583515882492065, -0.0008227229118347168, -0.000787094235420227, -0.0007514655590057373, -0.0007158368825912476, -0.0006802082061767578, -0.0006445795297622681, -0.0006089508533477783, -0.0005733221769332886, -0.0005376935005187988, -0.0005020648241043091, -0.00046643614768981934, -0.0004308074712753296, -0.00039517879486083984, -0.0003595501184463501, -0.00032392144203186035, -0.0002882927656173706, -0.00025266408920288086, -0.0002170354127883911, -0.00018140673637390137, -0.00014577805995941162, -0.00011014938354492188, -7.452070713043213e-05, -3.889203071594238e-05, -3.2633543014526367e-06, 3.236532211303711e-05, 6.799399852752686e-05, 0.0001036226749420166, 0.00013925135135650635, 0.0001748800277709961, 0.00021050870418548584, 0.0002461373805999756, 0.00028176605701446533, 0.0003173947334289551, 0.0003530234098434448, 0.00038865208625793457, 0.0004242807626724243, 0.00045990943908691406, 0.0004955381155014038, 0.0005311667919158936, 0.0005667954683303833, 0.000602424144744873, 0.0006380528211593628, 0.0006736814975738525, 0.0007093101739883423, 0.000744938850402832, 0.0007805675268173218, 0.0008161962032318115, 0.0008518248796463013, 0.000887453556060791, 0.0009230822324752808, 0.0009587109088897705, 0.0009943395853042603, 0.00102996826171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 10.0, 10.0, 7.0, 15.0, 16.0, 23.0, 20.0, 37.0, 54.0, 110.0, 171.0, 244.0, 349.0, 581.0, 967.0, 1657.0, 3076.0, 6850.0, 16421.0, 48015.0, 173606.0, 626858.0, 111462.0, 34195.0, 12355.0, 5183.0, 2646.0, 1332.0, 811.0, 493.0, 322.0, 200.0, 139.0, 104.0, 61.0, 46.0, 30.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 16.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.507080078125, -2.43408203125, -2.361083984375, -2.2880859375, -2.215087890625, -2.14208984375, -2.069091796875, -1.99609375, -1.923095703125, -1.85009765625, -1.777099609375, -1.7041015625, -1.631103515625, -1.55810546875, -1.485107421875, -1.412109375, -1.339111328125, -1.26611328125, -1.193115234375, -1.1201171875, -1.047119140625, -0.97412109375, -0.901123046875, -0.828125, -0.755126953125, -0.68212890625, -0.609130859375, -0.5361328125, -0.463134765625, -0.39013671875, -0.317138671875, -0.244140625, -0.171142578125, -0.09814453125, -0.025146484375, 0.0478515625, 0.120849609375, 0.19384765625, 0.266845703125, 0.33984375, 0.412841796875, 0.48583984375, 0.558837890625, 0.6318359375, 0.704833984375, 0.77783203125, 0.850830078125, 0.923828125, 0.996826171875, 1.06982421875, 1.142822265625, 1.2158203125, 1.288818359375, 1.36181640625, 1.434814453125, 1.5078125, 1.580810546875, 1.65380859375, 1.726806640625, 1.7998046875, 1.872802734375, 1.94580078125, 2.018798828125, 2.091796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 5.0, 3.0, 9.0, 11.0, 13.0, 11.0, 12.0, 14.0, 22.0, 22.0, 20.0, 32.0, 28.0, 37.0, 57.0, 61.0, 60.0, 87.0, 88.0, 76.0, 61.0, 47.0, 39.0, 34.0, 26.0, 20.0, 15.0, 16.0, 10.0, 6.0, 9.0, 6.0, 9.0, 10.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.30780029296875, -2.2347412109375, -2.16168212890625, -2.088623046875, -2.01556396484375, -1.9425048828125, -1.86944580078125, -1.79638671875, -1.72332763671875, -1.6502685546875, -1.57720947265625, -1.504150390625, -1.43109130859375, -1.3580322265625, -1.28497314453125, -1.2119140625, -1.13885498046875, -1.0657958984375, -0.99273681640625, -0.919677734375, -0.84661865234375, -0.7735595703125, -0.70050048828125, -0.62744140625, -0.55438232421875, -0.4813232421875, -0.40826416015625, -0.335205078125, -0.26214599609375, -0.1890869140625, -0.11602783203125, -0.04296875, 0.03009033203125, 0.1031494140625, 0.17620849609375, 0.249267578125, 0.32232666015625, 0.3953857421875, 0.46844482421875, 0.54150390625, 0.61456298828125, 0.6876220703125, 0.76068115234375, 0.833740234375, 0.90679931640625, 0.9798583984375, 1.05291748046875, 1.1259765625, 1.19903564453125, 1.2720947265625, 1.34515380859375, 1.418212890625, 1.49127197265625, 1.5643310546875, 1.63739013671875, 1.71044921875, 1.78350830078125, 1.8565673828125, 1.92962646484375, 2.002685546875, 2.07574462890625, 2.1488037109375, 2.22186279296875, 2.294921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 8.0, 16.0, 38.0, 51.0, 93.0, 130.0, 234.0, 163.0, 93.0, 45.0, 39.0, 27.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.77720260620117, -56.64575958251953, -54.514320373535156, -52.382877349853516, -50.25143814086914, -48.1199951171875, -45.988555908203125, -43.857112884521484, -41.725669860839844, -39.5942268371582, -37.46278762817383, -35.33134460449219, -33.19990539550781, -31.068462371826172, -28.937021255493164, -26.805580139160156, -24.67414093017578, -22.542699813842773, -20.411258697509766, -18.279815673828125, -16.14837646484375, -14.016934394836426, -11.885492324829102, -9.754051208496094, -7.622610092163086, -5.491168975830078, -3.359727382659912, -1.228285789489746, 0.9031553268432617, 3.0345964431762695, 5.166038513183594, 7.297479629516602, 9.428916931152344, 11.560358047485352, 13.69179916381836, 15.823241233825684, 17.954681396484375, 20.086124420166016, 22.217565536499023, 24.34900665283203, 26.48044776916504, 28.611888885498047, 30.743330001831055, 32.87477111816406, 35.0062141418457, 37.13765335083008, 39.26909637451172, 41.400535583496094, 43.531978607177734, 45.663421630859375, 47.79486083984375, 49.92630386352539, 52.057743072509766, 54.189186096191406, 56.32062530517578, 58.45206832885742, 60.58351135253906, 62.7149543762207, 64.84639739990234, 66.97783660888672, 69.1092758178711, 71.24071502685547, 73.37216186523438, 75.50360107421875, 77.63504028320312]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 9.0, 7.0, 11.0, 10.0, 17.0, 26.0, 30.0, 24.0, 34.0, 38.0, 45.0, 63.0, 99.0, 130.0, 100.0, 70.0, 59.0, 40.0, 41.0, 32.0, 23.0, 23.0, 9.0, 13.0, 9.0, 12.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-107.55998229980469, -104.90193939208984, -102.243896484375, -99.58584594726562, -96.92780303955078, -94.26976013183594, -91.61170959472656, -88.95366668701172, -86.29562377929688, -83.63758087158203, -80.97953796386719, -78.32148742675781, -75.66344451904297, -73.00540161132812, -70.34735107421875, -67.6893081665039, -65.03126525878906, -62.37322235107422, -59.71517562866211, -57.05712890625, -54.399085998535156, -51.74104309082031, -49.0829963684082, -46.424949645996094, -43.76690673828125, -41.108863830566406, -38.4508171081543, -35.79277038574219, -33.134727478027344, -30.476682662963867, -27.81863784790039, -25.160593032836914, -22.502540588378906, -19.84449577331543, -17.186450958251953, -14.528406143188477, -11.870361328125, -9.212316513061523, -6.554271697998047, -3.8962268829345703, -1.2381820678710938, 1.4198627471923828, 4.077907562255859, 6.735952377319336, 9.393997192382812, 12.052042007446289, 14.710086822509766, 17.368131637573242, 20.02617645263672, 22.684221267700195, 25.342266082763672, 28.00031089782715, 30.658355712890625, 33.31639862060547, 35.97444534301758, 38.63249206542969, 41.29053497314453, 43.948577880859375, 46.606624603271484, 49.264671325683594, 51.92271423339844, 54.58075714111328, 57.23880386352539, 59.8968505859375, 62.554893493652344]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 5.0, 3.0, 11.0, 13.0, 16.0, 30.0, 32.0, 53.0, 72.0, 104.0, 172.0, 238.0, 456.0, 779.0, 1331.0, 2688.0, 5988.0, 16412.0, 63984.0, 385464.0, 2173948.0, 1301532.0, 186890.0, 34750.0, 10406.0, 4158.0, 2027.0, 1087.0, 556.0, 380.0, 230.0, 154.0, 86.0, 63.0, 38.0, 30.0, 29.0, 22.0, 17.0, 7.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.47076416015625, -6.2735595703125, -6.07635498046875, -5.879150390625, -5.68194580078125, -5.4847412109375, -5.28753662109375, -5.09033203125, -4.89312744140625, -4.6959228515625, -4.49871826171875, -4.301513671875, -4.10430908203125, -3.9071044921875, -3.70989990234375, -3.5126953125, -3.31549072265625, -3.1182861328125, -2.92108154296875, -2.723876953125, -2.52667236328125, -2.3294677734375, -2.13226318359375, -1.93505859375, -1.73785400390625, -1.5406494140625, -1.34344482421875, -1.146240234375, -0.94903564453125, -0.7518310546875, -0.55462646484375, -0.357421875, -0.16021728515625, 0.0369873046875, 0.23419189453125, 0.431396484375, 0.62860107421875, 0.8258056640625, 1.02301025390625, 1.22021484375, 1.41741943359375, 1.6146240234375, 1.81182861328125, 2.009033203125, 2.20623779296875, 2.4034423828125, 2.60064697265625, 2.7978515625, 2.99505615234375, 3.1922607421875, 3.38946533203125, 3.586669921875, 3.78387451171875, 3.9810791015625, 4.17828369140625, 4.37548828125, 4.57269287109375, 4.7698974609375, 4.96710205078125, 5.164306640625, 5.36151123046875, 5.5587158203125, 5.75592041015625, 5.953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 8.0, 8.0, 22.0, 20.0, 20.0, 31.0, 30.0, 40.0, 46.0, 60.0, 51.0, 67.0, 62.0, 63.0, 58.0, 65.0, 62.0, 56.0, 31.0, 37.0, 22.0, 32.0, 24.0, 23.0, 17.0, 11.0, 10.0, 6.0, 4.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.0697021484375, -3.889404296875, -3.7091064453125, -3.52880859375, -3.3485107421875, -3.168212890625, -2.9879150390625, -2.8076171875, -2.6273193359375, -2.447021484375, -2.2667236328125, -2.08642578125, -1.9061279296875, -1.725830078125, -1.5455322265625, -1.365234375, -1.1849365234375, -1.004638671875, -0.8243408203125, -0.64404296875, -0.4637451171875, -0.283447265625, -0.1031494140625, 0.0771484375, 0.2574462890625, 0.437744140625, 0.6180419921875, 0.79833984375, 0.9786376953125, 1.158935546875, 1.3392333984375, 1.51953125, 1.6998291015625, 1.880126953125, 2.0604248046875, 2.24072265625, 2.4210205078125, 2.601318359375, 2.7816162109375, 2.9619140625, 3.1422119140625, 3.322509765625, 3.5028076171875, 3.68310546875, 3.8634033203125, 4.043701171875, 4.2239990234375, 4.404296875, 4.5845947265625, 4.764892578125, 4.9451904296875, 5.12548828125, 5.3057861328125, 5.486083984375, 5.6663818359375, 5.8466796875, 6.0269775390625, 6.207275390625, 6.3875732421875, 6.56787109375, 6.7481689453125, 6.928466796875, 7.1087646484375, 7.2890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 21.0, 34.0, 50.0, 99.0, 179.0, 317.0, 832.0, 2916.0, 40003.0, 4038903.0, 104402.0, 4534.0, 1016.0, 445.0, 235.0, 123.0, 62.0, 31.0, 20.0, 18.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.640625, -28.7587890625, -27.876953125, -26.9951171875, -26.11328125, -25.2314453125, -24.349609375, -23.4677734375, -22.5859375, -21.7041015625, -20.822265625, -19.9404296875, -19.05859375, -18.1767578125, -17.294921875, -16.4130859375, -15.53125, -14.6494140625, -13.767578125, -12.8857421875, -12.00390625, -11.1220703125, -10.240234375, -9.3583984375, -8.4765625, -7.5947265625, -6.712890625, -5.8310546875, -4.94921875, -4.0673828125, -3.185546875, -2.3037109375, -1.421875, -0.5400390625, 0.341796875, 1.2236328125, 2.10546875, 2.9873046875, 3.869140625, 4.7509765625, 5.6328125, 6.5146484375, 7.396484375, 8.2783203125, 9.16015625, 10.0419921875, 10.923828125, 11.8056640625, 12.6875, 13.5693359375, 14.451171875, 15.3330078125, 16.21484375, 17.0966796875, 17.978515625, 18.8603515625, 19.7421875, 20.6240234375, 21.505859375, 22.3876953125, 23.26953125, 24.1513671875, 25.033203125, 25.9150390625, 26.796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 16.0, 31.0, 41.0, 71.0, 153.0, 431.0, 939.0, 1214.0, 637.0, 272.0, 126.0, 53.0, 26.0, 16.0, 11.0, 9.0, 10.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.9375, -19.338623046875, -18.73974609375, -18.140869140625, -17.5419921875, -16.943115234375, -16.34423828125, -15.745361328125, -15.146484375, -14.547607421875, -13.94873046875, -13.349853515625, -12.7509765625, -12.152099609375, -11.55322265625, -10.954345703125, -10.35546875, -9.756591796875, -9.15771484375, -8.558837890625, -7.9599609375, -7.361083984375, -6.76220703125, -6.163330078125, -5.564453125, -4.965576171875, -4.36669921875, -3.767822265625, -3.1689453125, -2.570068359375, -1.97119140625, -1.372314453125, -0.7734375, -0.174560546875, 0.42431640625, 1.023193359375, 1.6220703125, 2.220947265625, 2.81982421875, 3.418701171875, 4.017578125, 4.616455078125, 5.21533203125, 5.814208984375, 6.4130859375, 7.011962890625, 7.61083984375, 8.209716796875, 8.80859375, 9.407470703125, 10.00634765625, 10.605224609375, 11.2041015625, 11.802978515625, 12.40185546875, 13.000732421875, 13.599609375, 14.198486328125, 14.79736328125, 15.396240234375, 15.9951171875, 16.593994140625, 17.19287109375, 17.791748046875, 18.390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 10.0, 10.0, 37.0, 78.0, 169.0, 262.0, 234.0, 109.0, 53.0, 16.0, 10.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.4344940185547, -149.5614776611328, -144.68846130371094, -139.81544494628906, -134.9424285888672, -130.0694122314453, -125.19640350341797, -120.3233871459961, -115.45037078857422, -110.57735443115234, -105.70433807373047, -100.8313217163086, -95.95831298828125, -91.08529663085938, -86.2122802734375, -81.33926391601562, -76.46624755859375, -71.59323120117188, -66.72021484375, -61.84720230102539, -56.974185943603516, -52.10116958618164, -47.22815704345703, -42.355140686035156, -37.48212432861328, -32.609107971191406, -27.736093521118164, -22.863079071044922, -17.990062713623047, -13.117046356201172, -8.24403190612793, -3.3710174560546875, 1.50201416015625, 6.375029563903809, 11.248044967651367, 16.12105941772461, 20.994075775146484, 25.86709213256836, 30.7401065826416, 35.613121032714844, 40.48613739013672, 45.359153747558594, 50.23217010498047, 55.10518264770508, 59.97819900512695, 64.85121154785156, 69.72422790527344, 74.59724426269531, 79.47026062011719, 84.34327697753906, 89.21629333496094, 94.08930969238281, 98.96232604980469, 103.83534240722656, 108.7083511352539, 113.58136749267578, 118.45438385009766, 123.32740020751953, 128.20040893554688, 133.07342529296875, 137.94644165039062, 142.8194580078125, 147.69247436523438, 152.56549072265625, 157.43850708007812]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 8.0, 9.0, 12.0, 8.0, 14.0, 23.0, 15.0, 17.0, 12.0, 23.0, 24.0, 24.0, 28.0, 44.0, 42.0, 51.0, 47.0, 47.0, 48.0, 40.0, 35.0, 42.0, 51.0, 42.0, 27.0, 33.0, 27.0, 30.0, 24.0, 24.0, 13.0, 19.0, 8.0, 12.0, 13.0, 12.0, 7.0, 4.0, 8.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.855377197265625, -44.46354675292969, -43.071712493896484, -41.67987823486328, -40.288047790527344, -38.896217346191406, -37.5043830871582, -36.112548828125, -34.72071838378906, -33.328887939453125, -31.937053680419922, -30.54522132873535, -29.15338897705078, -27.76155662536621, -26.36972427368164, -24.97789192199707, -23.5860595703125, -22.19422721862793, -20.80239486694336, -19.41056251525879, -18.01873016357422, -16.62689781188965, -15.235065460205078, -13.843233108520508, -12.451400756835938, -11.059568405151367, -9.667736053466797, -8.275903701782227, -6.884071350097656, -5.492238998413086, -4.100406646728516, -2.7085742950439453, -1.3167381286621094, 0.07509422302246094, 1.4669265747070312, 2.8587589263916016, 4.250591278076172, 5.642423629760742, 7.0342559814453125, 8.426088333129883, 9.817920684814453, 11.209753036499023, 12.601585388183594, 13.993417739868164, 15.385250091552734, 16.777082443237305, 18.168914794921875, 19.560747146606445, 20.952579498291016, 22.344411849975586, 23.736244201660156, 25.128076553344727, 26.519908905029297, 27.911741256713867, 29.303573608398438, 30.695405960083008, 32.08723831176758, 33.47907257080078, 34.87090301513672, 36.262733459472656, 37.65456771850586, 39.04640197753906, 40.438232421875, 41.83006286621094, 43.22189712524414]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 10.0, 21.0, 19.0, 28.0, 47.0, 47.0, 84.0, 117.0, 207.0, 342.0, 601.0, 1119.0, 2016.0, 3958.0, 8105.0, 18228.0, 44034.0, 116403.0, 302669.0, 330459.0, 131433.0, 49698.0, 20584.0, 9044.0, 4273.0, 2216.0, 1142.0, 635.0, 395.0, 228.0, 139.0, 103.0, 50.0, 24.0, 20.0, 17.0, 12.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.49615478515625, -5.2852783203125, -5.07440185546875, -4.863525390625, -4.65264892578125, -4.4417724609375, -4.23089599609375, -4.02001953125, -3.80914306640625, -3.5982666015625, -3.38739013671875, -3.176513671875, -2.96563720703125, -2.7547607421875, -2.54388427734375, -2.3330078125, -2.12213134765625, -1.9112548828125, -1.70037841796875, -1.489501953125, -1.27862548828125, -1.0677490234375, -0.85687255859375, -0.64599609375, -0.43511962890625, -0.2242431640625, -0.01336669921875, 0.197509765625, 0.40838623046875, 0.6192626953125, 0.83013916015625, 1.041015625, 1.25189208984375, 1.4627685546875, 1.67364501953125, 1.884521484375, 2.09539794921875, 2.3062744140625, 2.51715087890625, 2.72802734375, 2.93890380859375, 3.1497802734375, 3.36065673828125, 3.571533203125, 3.78240966796875, 3.9932861328125, 4.20416259765625, 4.4150390625, 4.62591552734375, 4.8367919921875, 5.04766845703125, 5.258544921875, 5.46942138671875, 5.6802978515625, 5.89117431640625, 6.10205078125, 6.31292724609375, 6.5238037109375, 6.73468017578125, 6.945556640625, 7.15643310546875, 7.3673095703125, 7.57818603515625, 7.7890625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 5.0, 2.0, 7.0, 6.0, 13.0, 9.0, 17.0, 18.0, 23.0, 27.0, 33.0, 27.0, 30.0, 53.0, 54.0, 36.0, 67.0, 36.0, 62.0, 66.0, 53.0, 50.0, 29.0, 48.0, 40.0, 34.0, 34.0, 20.0, 25.0, 16.0, 15.0, 19.0, 11.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.564178466796875, -3.39202880859375, -3.219879150390625, -3.0477294921875, -2.875579833984375, -2.70343017578125, -2.531280517578125, -2.359130859375, -2.186981201171875, -2.01483154296875, -1.842681884765625, -1.6705322265625, -1.498382568359375, -1.32623291015625, -1.154083251953125, -0.98193359375, -0.809783935546875, -0.63763427734375, -0.465484619140625, -0.2933349609375, -0.121185302734375, 0.05096435546875, 0.223114013671875, 0.395263671875, 0.567413330078125, 0.73956298828125, 0.911712646484375, 1.0838623046875, 1.256011962890625, 1.42816162109375, 1.600311279296875, 1.7724609375, 1.944610595703125, 2.11676025390625, 2.288909912109375, 2.4610595703125, 2.633209228515625, 2.80535888671875, 2.977508544921875, 3.149658203125, 3.321807861328125, 3.49395751953125, 3.666107177734375, 3.8382568359375, 4.010406494140625, 4.18255615234375, 4.354705810546875, 4.52685546875, 4.699005126953125, 4.87115478515625, 5.043304443359375, 5.2154541015625, 5.387603759765625, 5.55975341796875, 5.731903076171875, 5.904052734375, 6.076202392578125, 6.24835205078125, 6.420501708984375, 6.5926513671875, 6.764801025390625, 6.93695068359375, 7.109100341796875, 7.28125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 13.0, 15.0, 22.0, 40.0, 43.0, 49.0, 76.0, 104.0, 167.0, 225.0, 333.0, 506.0, 813.0, 1433.0, 3047.0, 8825.0, 39702.0, 567602.0, 372852.0, 37637.0, 8285.0, 3057.0, 1386.0, 814.0, 477.0, 317.0, 198.0, 150.0, 106.0, 55.0, 53.0, 35.0, 25.0, 17.0, 19.0, 12.0, 8.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -11.963134765625, -11.53564453125, -11.108154296875, -10.6806640625, -10.253173828125, -9.82568359375, -9.398193359375, -8.970703125, -8.543212890625, -8.11572265625, -7.688232421875, -7.2607421875, -6.833251953125, -6.40576171875, -5.978271484375, -5.55078125, -5.123291015625, -4.69580078125, -4.268310546875, -3.8408203125, -3.413330078125, -2.98583984375, -2.558349609375, -2.130859375, -1.703369140625, -1.27587890625, -0.848388671875, -0.4208984375, 0.006591796875, 0.43408203125, 0.861572265625, 1.2890625, 1.716552734375, 2.14404296875, 2.571533203125, 2.9990234375, 3.426513671875, 3.85400390625, 4.281494140625, 4.708984375, 5.136474609375, 5.56396484375, 5.991455078125, 6.4189453125, 6.846435546875, 7.27392578125, 7.701416015625, 8.12890625, 8.556396484375, 8.98388671875, 9.411376953125, 9.8388671875, 10.266357421875, 10.69384765625, 11.121337890625, 11.548828125, 11.976318359375, 12.40380859375, 12.831298828125, 13.2587890625, 13.686279296875, 14.11376953125, 14.541259765625, 14.96875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 11.0, 5.0, 12.0, 12.0, 27.0, 26.0, 31.0, 45.0, 45.0, 48.0, 52.0, 57.0, 76.0, 66.0, 57.0, 57.0, 62.0, 47.0, 42.0, 40.0, 29.0, 33.0, 21.0, 17.0, 9.0, 8.0, 12.0, 13.0, 10.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.301025390625, -17.61767578125, -16.934326171875, -16.2509765625, -15.567626953125, -14.88427734375, -14.200927734375, -13.517578125, -12.834228515625, -12.15087890625, -11.467529296875, -10.7841796875, -10.100830078125, -9.41748046875, -8.734130859375, -8.05078125, -7.367431640625, -6.68408203125, -6.000732421875, -5.3173828125, -4.634033203125, -3.95068359375, -3.267333984375, -2.583984375, -1.900634765625, -1.21728515625, -0.533935546875, 0.1494140625, 0.832763671875, 1.51611328125, 2.199462890625, 2.8828125, 3.566162109375, 4.24951171875, 4.932861328125, 5.6162109375, 6.299560546875, 6.98291015625, 7.666259765625, 8.349609375, 9.032958984375, 9.71630859375, 10.399658203125, 11.0830078125, 11.766357421875, 12.44970703125, 13.133056640625, 13.81640625, 14.499755859375, 15.18310546875, 15.866455078125, 16.5498046875, 17.233154296875, 17.91650390625, 18.599853515625, 19.283203125, 19.966552734375, 20.64990234375, 21.333251953125, 22.0166015625, 22.699951171875, 23.38330078125, 24.066650390625, 24.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 19.0, 31.0, 52.0, 70.0, 131.0, 283.0, 606.0, 2123.0, 11576.0, 183989.0, 821315.0, 23349.0, 3341.0, 871.0, 341.0, 167.0, 88.0, 56.0, 43.0, 24.0, 21.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.06463623046875, -5.8870849609375, -5.70953369140625, -5.531982421875, -5.35443115234375, -5.1768798828125, -4.99932861328125, -4.82177734375, -4.64422607421875, -4.4666748046875, -4.28912353515625, -4.111572265625, -3.93402099609375, -3.7564697265625, -3.57891845703125, -3.4013671875, -3.22381591796875, -3.0462646484375, -2.86871337890625, -2.691162109375, -2.51361083984375, -2.3360595703125, -2.15850830078125, -1.98095703125, -1.80340576171875, -1.6258544921875, -1.44830322265625, -1.270751953125, -1.09320068359375, -0.9156494140625, -0.73809814453125, -0.560546875, -0.38299560546875, -0.2054443359375, -0.02789306640625, 0.149658203125, 0.32720947265625, 0.5047607421875, 0.68231201171875, 0.85986328125, 1.03741455078125, 1.2149658203125, 1.39251708984375, 1.570068359375, 1.74761962890625, 1.9251708984375, 2.10272216796875, 2.2802734375, 2.45782470703125, 2.6353759765625, 2.81292724609375, 2.990478515625, 3.16802978515625, 3.3455810546875, 3.52313232421875, 3.70068359375, 3.87823486328125, 4.0557861328125, 4.23333740234375, 4.410888671875, 4.58843994140625, 4.7659912109375, 4.94354248046875, 5.12109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 22.0, 45.0, 92.0, 355.0, 253.0, 82.0, 48.0, 24.0, 15.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002925872802734375, -0.0028340518474578857, -0.0027422308921813965, -0.0026504099369049072, -0.002558588981628418, -0.0024667680263519287, -0.0023749470710754395, -0.00228312611579895, -0.002191305160522461, -0.0020994842052459717, -0.0020076632499694824, -0.0019158422946929932, -0.001824021339416504, -0.0017322003841400146, -0.0016403794288635254, -0.0015485584735870361, -0.0014567375183105469, -0.0013649165630340576, -0.0012730956077575684, -0.001181274652481079, -0.0010894536972045898, -0.0009976327419281006, -0.0009058117866516113, -0.0008139908313751221, -0.0007221698760986328, -0.0006303489208221436, -0.0005385279655456543, -0.00044670701026916504, -0.0003548860549926758, -0.0002630650997161865, -0.00017124414443969727, -7.942318916320801e-05, 1.239776611328125e-05, 0.00010421872138977051, 0.00019603967666625977, 0.000287860631942749, 0.0003796815872192383, 0.00047150254249572754, 0.0005633234977722168, 0.0006551444530487061, 0.0007469654083251953, 0.0008387863636016846, 0.0009306073188781738, 0.001022428274154663, 0.0011142492294311523, 0.0012060701847076416, 0.0012978911399841309, 0.0013897120952606201, 0.0014815330505371094, 0.0015733540058135986, 0.0016651749610900879, 0.0017569959163665771, 0.0018488168716430664, 0.0019406378269195557, 0.002032458782196045, 0.002124279737472534, 0.0022161006927490234, 0.0023079216480255127, 0.002399742603302002, 0.002491563558578491, 0.0025833845138549805, 0.0026752054691314697, 0.002767026424407959, 0.0028588473796844482, 0.0029506683349609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 12.0, 34.0, 45.0, 48.0, 82.0, 108.0, 210.0, 312.0, 537.0, 1038.0, 2166.0, 5757.0, 18507.0, 86569.0, 742341.0, 149409.0, 27861.0, 7715.0, 2833.0, 1264.0, 669.0, 386.0, 250.0, 131.0, 91.0, 53.0, 43.0, 25.0, 12.0, 10.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.417938232421875, -3.31634521484375, -3.214752197265625, -3.1131591796875, -3.011566162109375, -2.90997314453125, -2.808380126953125, -2.706787109375, -2.605194091796875, -2.50360107421875, -2.402008056640625, -2.3004150390625, -2.198822021484375, -2.09722900390625, -1.995635986328125, -1.89404296875, -1.792449951171875, -1.69085693359375, -1.589263916015625, -1.4876708984375, -1.386077880859375, -1.28448486328125, -1.182891845703125, -1.081298828125, -0.979705810546875, -0.87811279296875, -0.776519775390625, -0.6749267578125, -0.573333740234375, -0.47174072265625, -0.370147705078125, -0.2685546875, -0.166961669921875, -0.06536865234375, 0.036224365234375, 0.1378173828125, 0.239410400390625, 0.34100341796875, 0.442596435546875, 0.544189453125, 0.645782470703125, 0.74737548828125, 0.848968505859375, 0.9505615234375, 1.052154541015625, 1.15374755859375, 1.255340576171875, 1.35693359375, 1.458526611328125, 1.56011962890625, 1.661712646484375, 1.7633056640625, 1.864898681640625, 1.96649169921875, 2.068084716796875, 2.169677734375, 2.271270751953125, 2.37286376953125, 2.474456787109375, 2.5760498046875, 2.677642822265625, 2.77923583984375, 2.880828857421875, 2.982421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 5.0, 11.0, 14.0, 20.0, 25.0, 46.0, 56.0, 68.0, 89.0, 132.0, 139.0, 113.0, 69.0, 50.0, 23.0, 32.0, 26.0, 15.0, 21.0, 11.0, 12.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.875335693359375, -4.75067138671875, -4.626007080078125, -4.5013427734375, -4.376678466796875, -4.25201416015625, -4.127349853515625, -4.002685546875, -3.878021240234375, -3.75335693359375, -3.628692626953125, -3.5040283203125, -3.379364013671875, -3.25469970703125, -3.130035400390625, -3.00537109375, -2.880706787109375, -2.75604248046875, -2.631378173828125, -2.5067138671875, -2.382049560546875, -2.25738525390625, -2.132720947265625, -2.008056640625, -1.883392333984375, -1.75872802734375, -1.634063720703125, -1.5093994140625, -1.384735107421875, -1.26007080078125, -1.135406494140625, -1.0107421875, -0.886077880859375, -0.76141357421875, -0.636749267578125, -0.5120849609375, -0.387420654296875, -0.26275634765625, -0.138092041015625, -0.013427734375, 0.111236572265625, 0.23590087890625, 0.360565185546875, 0.4852294921875, 0.609893798828125, 0.73455810546875, 0.859222412109375, 0.98388671875, 1.108551025390625, 1.23321533203125, 1.357879638671875, 1.4825439453125, 1.607208251953125, 1.73187255859375, 1.856536865234375, 1.981201171875, 2.105865478515625, 2.23052978515625, 2.355194091796875, 2.4798583984375, 2.604522705078125, 2.72918701171875, 2.853851318359375, 2.978515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 13.0, 36.0, 88.0, 422.0, 321.0, 79.0, 24.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.60452270507812, -99.35810852050781, -93.1116943359375, -86.86528015136719, -80.6188735961914, -74.3724594116211, -68.12604522705078, -61.879634857177734, -55.63322067260742, -49.38680648803711, -43.14039611816406, -36.89398193359375, -30.64756965637207, -24.40115737915039, -18.154743194580078, -11.908332824707031, -5.661918640136719, 0.5844941139221191, 6.830906867980957, 13.077320098876953, 19.323732376098633, 25.570144653320312, 31.816558837890625, 38.06296920776367, 44.309383392333984, 50.5557975769043, 56.802207946777344, 63.048622131347656, 69.29503631591797, 75.54144287109375, 81.78785705566406, 88.03427124023438, 94.28068542480469, 100.527099609375, 106.77351379394531, 113.01992797851562, 119.2663345336914, 125.51274871826172, 131.7591552734375, 138.0055694580078, 144.25198364257812, 150.49839782714844, 156.74481201171875, 162.99122619628906, 169.23764038085938, 175.48403930664062, 181.73046875, 187.97686767578125, 194.22329711914062, 200.46971130371094, 206.71612548828125, 212.96253967285156, 219.20895385742188, 225.45535278320312, 231.7017822265625, 237.94818115234375, 244.19459533691406, 250.44100952148438, 256.6874084472656, 262.933837890625, 269.18023681640625, 275.4266662597656, 281.6730651855469, 287.91949462890625, 294.1658935546875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 6.0, 13.0, 13.0, 12.0, 16.0, 17.0, 31.0, 24.0, 34.0, 34.0, 37.0, 41.0, 41.0, 112.0, 139.0, 80.0, 40.0, 35.0, 29.0, 20.0, 30.0, 20.0, 19.0, 28.0, 18.0, 14.0, 17.0, 10.0, 9.0, 10.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-90.8123550415039, -88.3792495727539, -85.94615173339844, -83.51304626464844, -81.07994842529297, -78.64684295654297, -76.2137451171875, -73.7806396484375, -71.3475341796875, -68.9144287109375, -66.48133087158203, -64.04822540283203, -61.61512756347656, -59.18202209472656, -56.74892044067383, -54.315818786621094, -51.882720947265625, -49.44961929321289, -47.016517639160156, -44.58341598510742, -42.15031433105469, -39.71720886230469, -37.28410720825195, -34.85100555419922, -32.417903900146484, -29.98480224609375, -27.551700592041016, -25.11859703063965, -22.685495376586914, -20.25239372253418, -17.819290161132812, -15.386188507080078, -12.953079223632812, -10.519977569580078, -8.086874961853027, -5.653772830963135, -3.220670700073242, -0.7875690460205078, 1.645533561706543, 4.078636169433594, 6.511737823486328, 8.944839477539062, 11.377942085266113, 13.811044692993164, 16.2441463470459, 18.677248001098633, 21.1103515625, 23.543453216552734, 25.97655487060547, 28.409656524658203, 30.842758178710938, 33.27585983276367, 35.708961486816406, 38.142066955566406, 40.57516860961914, 43.008270263671875, 45.44137191772461, 47.874473571777344, 50.30757522583008, 52.74067687988281, 55.17378234863281, 57.60688018798828, 60.03998565673828, 62.473087310791016, 64.90618896484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 9.0, 30.0, 30.0, 38.0, 66.0, 116.0, 196.0, 310.0, 463.0, 780.0, 1394.0, 2379.0, 5171.0, 10946.0, 29807.0, 123403.0, 683168.0, 2138630.0, 964113.0, 173154.0, 36361.0, 12033.0, 5245.0, 2577.0, 1480.0, 858.0, 555.0, 341.0, 225.0, 128.0, 87.0, 48.0, 45.0, 23.0, 20.0, 11.0, 8.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1796875, -5.955810546875, -5.73193359375, -5.508056640625, -5.2841796875, -5.060302734375, -4.83642578125, -4.612548828125, -4.388671875, -4.164794921875, -3.94091796875, -3.717041015625, -3.4931640625, -3.269287109375, -3.04541015625, -2.821533203125, -2.59765625, -2.373779296875, -2.14990234375, -1.926025390625, -1.7021484375, -1.478271484375, -1.25439453125, -1.030517578125, -0.806640625, -0.582763671875, -0.35888671875, -0.135009765625, 0.0888671875, 0.312744140625, 0.53662109375, 0.760498046875, 0.984375, 1.208251953125, 1.43212890625, 1.656005859375, 1.8798828125, 2.103759765625, 2.32763671875, 2.551513671875, 2.775390625, 2.999267578125, 3.22314453125, 3.447021484375, 3.6708984375, 3.894775390625, 4.11865234375, 4.342529296875, 4.56640625, 4.790283203125, 5.01416015625, 5.238037109375, 5.4619140625, 5.685791015625, 5.90966796875, 6.133544921875, 6.357421875, 6.581298828125, 6.80517578125, 7.029052734375, 7.2529296875, 7.476806640625, 7.70068359375, 7.924560546875, 8.1484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 9.0, 15.0, 20.0, 23.0, 29.0, 26.0, 29.0, 31.0, 54.0, 37.0, 56.0, 67.0, 65.0, 59.0, 63.0, 55.0, 50.0, 52.0, 47.0, 45.0, 28.0, 25.0, 14.0, 19.0, 14.0, 22.0, 8.0, 12.0, 3.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.548431396484375, -3.37615966796875, -3.203887939453125, -3.0316162109375, -2.859344482421875, -2.68707275390625, -2.514801025390625, -2.342529296875, -2.170257568359375, -1.99798583984375, -1.825714111328125, -1.6534423828125, -1.481170654296875, -1.30889892578125, -1.136627197265625, -0.96435546875, -0.792083740234375, -0.61981201171875, -0.447540283203125, -0.2752685546875, -0.102996826171875, 0.06927490234375, 0.241546630859375, 0.413818359375, 0.586090087890625, 0.75836181640625, 0.930633544921875, 1.1029052734375, 1.275177001953125, 1.44744873046875, 1.619720458984375, 1.7919921875, 1.964263916015625, 2.13653564453125, 2.308807373046875, 2.4810791015625, 2.653350830078125, 2.82562255859375, 2.997894287109375, 3.170166015625, 3.342437744140625, 3.51470947265625, 3.686981201171875, 3.8592529296875, 4.031524658203125, 4.20379638671875, 4.376068115234375, 4.54833984375, 4.720611572265625, 4.89288330078125, 5.065155029296875, 5.2374267578125, 5.409698486328125, 5.58197021484375, 5.754241943359375, 5.926513671875, 6.098785400390625, 6.27105712890625, 6.443328857421875, 6.6156005859375, 6.787872314453125, 6.96014404296875, 7.132415771484375, 7.3046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 18.0, 39.0, 58.0, 147.0, 308.0, 783.0, 6136.0, 4172055.0, 13003.0, 1059.0, 375.0, 157.0, 66.0, 31.0, 23.0, 11.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-96.75, -93.869140625, -90.98828125, -88.107421875, -85.2265625, -82.345703125, -79.46484375, -76.583984375, -73.703125, -70.822265625, -67.94140625, -65.060546875, -62.1796875, -59.298828125, -56.41796875, -53.537109375, -50.65625, -47.775390625, -44.89453125, -42.013671875, -39.1328125, -36.251953125, -33.37109375, -30.490234375, -27.609375, -24.728515625, -21.84765625, -18.966796875, -16.0859375, -13.205078125, -10.32421875, -7.443359375, -4.5625, -1.681640625, 1.19921875, 4.080078125, 6.9609375, 9.841796875, 12.72265625, 15.603515625, 18.484375, 21.365234375, 24.24609375, 27.126953125, 30.0078125, 32.888671875, 35.76953125, 38.650390625, 41.53125, 44.412109375, 47.29296875, 50.173828125, 53.0546875, 55.935546875, 58.81640625, 61.697265625, 64.578125, 67.458984375, 70.33984375, 73.220703125, 76.1015625, 78.982421875, 81.86328125, 84.744140625, 87.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 15.0, 22.0, 65.0, 154.0, 337.0, 1228.0, 1524.0, 441.0, 143.0, 72.0, 37.0, 23.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.578125, -15.314208984375, -14.05029296875, -12.786376953125, -11.5224609375, -10.258544921875, -8.99462890625, -7.730712890625, -6.466796875, -5.202880859375, -3.93896484375, -2.675048828125, -1.4111328125, -0.147216796875, 1.11669921875, 2.380615234375, 3.64453125, 4.908447265625, 6.17236328125, 7.436279296875, 8.7001953125, 9.964111328125, 11.22802734375, 12.491943359375, 13.755859375, 15.019775390625, 16.28369140625, 17.547607421875, 18.8115234375, 20.075439453125, 21.33935546875, 22.603271484375, 23.8671875, 25.131103515625, 26.39501953125, 27.658935546875, 28.9228515625, 30.186767578125, 31.45068359375, 32.714599609375, 33.978515625, 35.242431640625, 36.50634765625, 37.770263671875, 39.0341796875, 40.298095703125, 41.56201171875, 42.825927734375, 44.08984375, 45.353759765625, 46.61767578125, 47.881591796875, 49.1455078125, 50.409423828125, 51.67333984375, 52.937255859375, 54.201171875, 55.465087890625, 56.72900390625, 57.992919921875, 59.2568359375, 60.520751953125, 61.78466796875, 63.048583984375, 64.3125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 11.0, 12.0, 25.0, 56.0, 104.0, 253.0, 262.0, 142.0, 54.0, 31.0, 17.0, 7.0, 4.0, 5.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.2028503417969, -248.6716766357422, -239.1405029296875, -229.6093292236328, -220.07815551757812, -210.54698181152344, -201.01580810546875, -191.48463439941406, -181.95346069335938, -172.4222869873047, -162.89111328125, -153.3599395751953, -143.82876586914062, -134.29759216308594, -124.76641845703125, -115.23524475097656, -105.70407104492188, -96.17289733886719, -86.6417236328125, -77.11054992675781, -67.57937622070312, -58.04820251464844, -48.51702880859375, -38.98585510253906, -29.454681396484375, -19.923507690429688, -10.392333984375, -0.8611602783203125, 8.670013427734375, 18.201187133789062, 27.73236083984375, 37.26353454589844, 46.794677734375, 56.32585144042969, 65.85702514648438, 75.38819885253906, 84.91937255859375, 94.45054626464844, 103.98171997070312, 113.51289367675781, 123.0440673828125, 132.5752410888672, 142.10641479492188, 151.63758850097656, 161.16876220703125, 170.69993591308594, 180.23110961914062, 189.7622833251953, 199.29345703125, 208.8246307373047, 218.35580444335938, 227.88697814941406, 237.41815185546875, 246.94932556152344, 256.4804992675781, 266.01165771484375, 275.5428466796875, 285.07403564453125, 294.6051940917969, 304.1363525390625, 313.66754150390625, 323.19873046875, 332.7298889160156, 342.26104736328125, 351.792236328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 10.0, 15.0, 16.0, 26.0, 22.0, 35.0, 33.0, 36.0, 51.0, 49.0, 59.0, 57.0, 63.0, 70.0, 52.0, 55.0, 38.0, 41.0, 44.0, 27.0, 32.0, 31.0, 18.0, 8.0, 11.0, 16.0, 9.0, 6.0, 6.0, 7.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-110.79570007324219, -107.67374420166016, -104.5517807006836, -101.42982482910156, -98.30786895751953, -95.18590545654297, -92.06394958496094, -88.94198608398438, -85.82003021240234, -82.69807434082031, -79.57611083984375, -76.45415496826172, -73.33219909667969, -70.21023559570312, -67.0882797241211, -63.9663200378418, -60.844364166259766, -57.72240447998047, -54.60044860839844, -51.47848892211914, -48.356529235839844, -45.23457336425781, -42.112613677978516, -38.99065399169922, -35.86869812011719, -32.74673843383789, -29.624780654907227, -26.502822875976562, -23.380863189697266, -20.2589054107666, -17.136947631835938, -14.01498794555664, -10.893028259277344, -7.771069526672363, -4.649111270904541, -1.5271530151367188, 1.5948057174682617, 4.716764450073242, 7.838722229003906, 10.960681915283203, 14.082639694213867, 17.20459747314453, 20.326557159423828, 23.448514938354492, 26.570472717285156, 29.692432403564453, 32.81439208984375, 35.93634796142578, 39.05830764770508, 42.180267333984375, 45.302223205566406, 48.4241828918457, 51.546142578125, 54.66809844970703, 57.79005813598633, 60.912017822265625, 64.03397369384766, 67.15592956542969, 70.27789306640625, 73.39984893798828, 76.52180480957031, 79.64376831054688, 82.7657241821289, 85.88768005371094, 89.0096435546875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 20.0, 15.0, 36.0, 64.0, 115.0, 185.0, 314.0, 572.0, 1275.0, 2944.0, 7417.0, 23731.0, 97618.0, 518671.0, 309803.0, 60109.0, 16073.0, 5306.0, 2155.0, 1025.0, 470.0, 262.0, 151.0, 81.0, 56.0, 22.0, 26.0, 11.0, 8.0, 3.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.7010498046875, -9.386474609375, -9.0718994140625, -8.75732421875, -8.4427490234375, -8.128173828125, -7.8135986328125, -7.4990234375, -7.1844482421875, -6.869873046875, -6.5552978515625, -6.24072265625, -5.9261474609375, -5.611572265625, -5.2969970703125, -4.982421875, -4.6678466796875, -4.353271484375, -4.0386962890625, -3.72412109375, -3.4095458984375, -3.094970703125, -2.7803955078125, -2.4658203125, -2.1512451171875, -1.836669921875, -1.5220947265625, -1.20751953125, -0.8929443359375, -0.578369140625, -0.2637939453125, 0.05078125, 0.3653564453125, 0.679931640625, 0.9945068359375, 1.30908203125, 1.6236572265625, 1.938232421875, 2.2528076171875, 2.5673828125, 2.8819580078125, 3.196533203125, 3.5111083984375, 3.82568359375, 4.1402587890625, 4.454833984375, 4.7694091796875, 5.083984375, 5.3985595703125, 5.713134765625, 6.0277099609375, 6.34228515625, 6.6568603515625, 6.971435546875, 7.2860107421875, 7.6005859375, 7.9151611328125, 8.229736328125, 8.5443115234375, 8.85888671875, 9.1734619140625, 9.488037109375, 9.8026123046875, 10.1171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 8.0, 19.0, 16.0, 20.0, 32.0, 22.0, 28.0, 47.0, 42.0, 48.0, 56.0, 48.0, 54.0, 52.0, 44.0, 54.0, 48.0, 50.0, 40.0, 38.0, 38.0, 36.0, 20.0, 32.0, 23.0, 20.0, 8.0, 11.0, 4.0, 5.0, 5.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.5528564453125, -4.363525390625, -4.1741943359375, -3.98486328125, -3.7955322265625, -3.606201171875, -3.4168701171875, -3.2275390625, -3.0382080078125, -2.848876953125, -2.6595458984375, -2.47021484375, -2.2808837890625, -2.091552734375, -1.9022216796875, -1.712890625, -1.5235595703125, -1.334228515625, -1.1448974609375, -0.95556640625, -0.7662353515625, -0.576904296875, -0.3875732421875, -0.1982421875, -0.0089111328125, 0.180419921875, 0.3697509765625, 0.55908203125, 0.7484130859375, 0.937744140625, 1.1270751953125, 1.31640625, 1.5057373046875, 1.695068359375, 1.8843994140625, 2.07373046875, 2.2630615234375, 2.452392578125, 2.6417236328125, 2.8310546875, 3.0203857421875, 3.209716796875, 3.3990478515625, 3.58837890625, 3.7777099609375, 3.967041015625, 4.1563720703125, 4.345703125, 4.5350341796875, 4.724365234375, 4.9136962890625, 5.10302734375, 5.2923583984375, 5.481689453125, 5.6710205078125, 5.8603515625, 6.0496826171875, 6.239013671875, 6.4283447265625, 6.61767578125, 6.8070068359375, 6.996337890625, 7.1856689453125, 7.375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 15.0, 17.0, 27.0, 51.0, 92.0, 153.0, 301.0, 697.0, 2612.0, 31794.0, 976215.0, 32624.0, 2625.0, 702.0, 258.0, 142.0, 93.0, 51.0, 20.0, 19.0, 9.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.64599609375, -13.9951171875, -13.34423828125, -12.693359375, -12.04248046875, -11.3916015625, -10.74072265625, -10.08984375, -9.43896484375, -8.7880859375, -8.13720703125, -7.486328125, -6.83544921875, -6.1845703125, -5.53369140625, -4.8828125, -4.23193359375, -3.5810546875, -2.93017578125, -2.279296875, -1.62841796875, -0.9775390625, -0.32666015625, 0.32421875, 0.97509765625, 1.6259765625, 2.27685546875, 2.927734375, 3.57861328125, 4.2294921875, 4.88037109375, 5.53125, 6.18212890625, 6.8330078125, 7.48388671875, 8.134765625, 8.78564453125, 9.4365234375, 10.08740234375, 10.73828125, 11.38916015625, 12.0400390625, 12.69091796875, 13.341796875, 13.99267578125, 14.6435546875, 15.29443359375, 15.9453125, 16.59619140625, 17.2470703125, 17.89794921875, 18.548828125, 19.19970703125, 19.8505859375, 20.50146484375, 21.15234375, 21.80322265625, 22.4541015625, 23.10498046875, 23.755859375, 24.40673828125, 25.0576171875, 25.70849609375, 26.359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 16.0, 18.0, 13.0, 27.0, 34.0, 25.0, 45.0, 56.0, 48.0, 78.0, 81.0, 84.0, 75.0, 64.0, 59.0, 53.0, 39.0, 32.0, 26.0, 15.0, 22.0, 8.0, 8.0, 12.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.6005859375, -22.826171875, -22.0517578125, -21.27734375, -20.5029296875, -19.728515625, -18.9541015625, -18.1796875, -17.4052734375, -16.630859375, -15.8564453125, -15.08203125, -14.3076171875, -13.533203125, -12.7587890625, -11.984375, -11.2099609375, -10.435546875, -9.6611328125, -8.88671875, -8.1123046875, -7.337890625, -6.5634765625, -5.7890625, -5.0146484375, -4.240234375, -3.4658203125, -2.69140625, -1.9169921875, -1.142578125, -0.3681640625, 0.40625, 1.1806640625, 1.955078125, 2.7294921875, 3.50390625, 4.2783203125, 5.052734375, 5.8271484375, 6.6015625, 7.3759765625, 8.150390625, 8.9248046875, 9.69921875, 10.4736328125, 11.248046875, 12.0224609375, 12.796875, 13.5712890625, 14.345703125, 15.1201171875, 15.89453125, 16.6689453125, 17.443359375, 18.2177734375, 18.9921875, 19.7666015625, 20.541015625, 21.3154296875, 22.08984375, 22.8642578125, 23.638671875, 24.4130859375, 25.1875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 8.0, 9.0, 31.0, 32.0, 39.0, 93.0, 164.0, 365.0, 1178.0, 4209.0, 43470.0, 975733.0, 18897.0, 2793.0, 807.0, 328.0, 163.0, 69.0, 44.0, 26.0, 18.0, 11.0, 8.0, 6.0, 12.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.798828125, -3.677703857421875, -3.55657958984375, -3.435455322265625, -3.3143310546875, -3.193206787109375, -3.07208251953125, -2.950958251953125, -2.829833984375, -2.708709716796875, -2.58758544921875, -2.466461181640625, -2.3453369140625, -2.224212646484375, -2.10308837890625, -1.981964111328125, -1.86083984375, -1.739715576171875, -1.61859130859375, -1.497467041015625, -1.3763427734375, -1.255218505859375, -1.13409423828125, -1.012969970703125, -0.891845703125, -0.770721435546875, -0.64959716796875, -0.528472900390625, -0.4073486328125, -0.286224365234375, -0.16510009765625, -0.043975830078125, 0.0771484375, 0.198272705078125, 0.31939697265625, 0.440521240234375, 0.5616455078125, 0.682769775390625, 0.80389404296875, 0.925018310546875, 1.046142578125, 1.167266845703125, 1.28839111328125, 1.409515380859375, 1.5306396484375, 1.651763916015625, 1.77288818359375, 1.894012451171875, 2.01513671875, 2.136260986328125, 2.25738525390625, 2.378509521484375, 2.4996337890625, 2.620758056640625, 2.74188232421875, 2.863006591796875, 2.984130859375, 3.105255126953125, 3.22637939453125, 3.347503662109375, 3.4686279296875, 3.589752197265625, 3.71087646484375, 3.832000732421875, 3.953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 9.0, 14.0, 20.0, 35.0, 55.0, 100.0, 214.0, 235.0, 126.0, 69.0, 35.0, 23.0, 19.0, 8.0, 2.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013141632080078125, -0.0012768208980560303, -0.001239478588104248, -0.0012021362781524658, -0.0011647939682006836, -0.0011274516582489014, -0.0010901093482971191, -0.001052767038345337, -0.0010154247283935547, -0.0009780824184417725, -0.0009407401084899902, -0.000903397798538208, -0.0008660554885864258, -0.0008287131786346436, -0.0007913708686828613, -0.0007540285587310791, -0.0007166862487792969, -0.0006793439388275146, -0.0006420016288757324, -0.0006046593189239502, -0.000567317008972168, -0.0005299746990203857, -0.0004926323890686035, -0.0004552900791168213, -0.00041794776916503906, -0.00038060545921325684, -0.0003432631492614746, -0.0003059208393096924, -0.00026857852935791016, -0.00023123621940612793, -0.0001938939094543457, -0.00015655159950256348, -0.00011920928955078125, -8.186697959899902e-05, -4.45246696472168e-05, -7.18235969543457e-06, 3.0159950256347656e-05, 6.750226020812988e-05, 0.00010484457015991211, 0.00014218688011169434, 0.00017952919006347656, 0.0002168715000152588, 0.000254213809967041, 0.00029155611991882324, 0.00032889842987060547, 0.0003662407398223877, 0.0004035830497741699, 0.00044092535972595215, 0.0004782676696777344, 0.0005156099796295166, 0.0005529522895812988, 0.0005902945995330811, 0.0006276369094848633, 0.0006649792194366455, 0.0007023215293884277, 0.00073966383934021, 0.0007770061492919922, 0.0008143484592437744, 0.0008516907691955566, 0.0008890330791473389, 0.0009263753890991211, 0.0009637176990509033, 0.0010010600090026855, 0.0010384023189544678, 0.00107574462890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 8.0, 7.0, 10.0, 10.0, 25.0, 37.0, 73.0, 117.0, 208.0, 348.0, 656.0, 1277.0, 2940.0, 8088.0, 35104.0, 828042.0, 145253.0, 17263.0, 5012.0, 1929.0, 974.0, 513.0, 259.0, 165.0, 86.0, 45.0, 35.0, 19.0, 13.0, 11.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.3984375, -2.32745361328125, -2.2564697265625, -2.18548583984375, -2.114501953125, -2.04351806640625, -1.9725341796875, -1.90155029296875, -1.83056640625, -1.75958251953125, -1.6885986328125, -1.61761474609375, -1.546630859375, -1.47564697265625, -1.4046630859375, -1.33367919921875, -1.2626953125, -1.19171142578125, -1.1207275390625, -1.04974365234375, -0.978759765625, -0.90777587890625, -0.8367919921875, -0.76580810546875, -0.69482421875, -0.62384033203125, -0.5528564453125, -0.48187255859375, -0.410888671875, -0.33990478515625, -0.2689208984375, -0.19793701171875, -0.126953125, -0.05596923828125, 0.0150146484375, 0.08599853515625, 0.156982421875, 0.22796630859375, 0.2989501953125, 0.36993408203125, 0.44091796875, 0.51190185546875, 0.5828857421875, 0.65386962890625, 0.724853515625, 0.79583740234375, 0.8668212890625, 0.93780517578125, 1.0087890625, 1.07977294921875, 1.1507568359375, 1.22174072265625, 1.292724609375, 1.36370849609375, 1.4346923828125, 1.50567626953125, 1.57666015625, 1.64764404296875, 1.7186279296875, 1.78961181640625, 1.860595703125, 1.93157958984375, 2.0025634765625, 2.07354736328125, 2.14453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 12.0, 15.0, 16.0, 15.0, 30.0, 43.0, 66.0, 80.0, 102.0, 121.0, 92.0, 100.0, 80.0, 59.0, 24.0, 19.0, 22.0, 15.0, 15.0, 2.0, 8.0, 5.0, 2.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.005859375, -1.9481201171875, -1.890380859375, -1.8326416015625, -1.77490234375, -1.7171630859375, -1.659423828125, -1.6016845703125, -1.5439453125, -1.4862060546875, -1.428466796875, -1.3707275390625, -1.31298828125, -1.2552490234375, -1.197509765625, -1.1397705078125, -1.08203125, -1.0242919921875, -0.966552734375, -0.9088134765625, -0.85107421875, -0.7933349609375, -0.735595703125, -0.6778564453125, -0.6201171875, -0.5623779296875, -0.504638671875, -0.4468994140625, -0.38916015625, -0.3314208984375, -0.273681640625, -0.2159423828125, -0.158203125, -0.1004638671875, -0.042724609375, 0.0150146484375, 0.07275390625, 0.1304931640625, 0.188232421875, 0.2459716796875, 0.3037109375, 0.3614501953125, 0.419189453125, 0.4769287109375, 0.53466796875, 0.5924072265625, 0.650146484375, 0.7078857421875, 0.765625, 0.8233642578125, 0.881103515625, 0.9388427734375, 0.99658203125, 1.0543212890625, 1.112060546875, 1.1697998046875, 1.2275390625, 1.2852783203125, 1.343017578125, 1.4007568359375, 1.45849609375, 1.5162353515625, 1.573974609375, 1.6317138671875, 1.689453125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 32.0, 127.0, 701.0, 105.0, 25.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.4772186279297, -197.0380401611328, -189.59886169433594, -182.15968322753906, -174.7205047607422, -167.2813262939453, -159.84214782714844, -152.40296936035156, -144.9637908935547, -137.5246124267578, -130.08543395996094, -122.64625549316406, -115.20707702636719, -107.76789855957031, -100.32872009277344, -92.88954162597656, -85.45036315917969, -78.01118469238281, -70.57200622558594, -63.13282775878906, -55.69364929199219, -48.25447082519531, -40.81529235839844, -33.37611389160156, -25.936935424804688, -18.497756958007812, -11.058578491210938, -3.6194000244140625, 3.8197784423828125, 11.258956909179688, 18.698135375976562, 26.137313842773438, 33.57647705078125, 41.015655517578125, 48.454833984375, 55.894012451171875, 63.33319091796875, 70.77236938476562, 78.2115478515625, 85.65072631835938, 93.08990478515625, 100.52908325195312, 107.96826171875, 115.40744018554688, 122.84661865234375, 130.28579711914062, 137.7249755859375, 145.16415405273438, 152.60333251953125, 160.04251098632812, 167.481689453125, 174.92086791992188, 182.36004638671875, 189.79922485351562, 197.2384033203125, 204.67758178710938, 212.11676025390625, 219.55593872070312, 226.9951171875, 234.43429565429688, 241.87347412109375, 249.31265258789062, 256.7518310546875, 264.1910095214844, 271.63018798828125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 10.0, 13.0, 10.0, 22.0, 28.0, 24.0, 30.0, 32.0, 59.0, 117.0, 299.0, 109.0, 36.0, 49.0, 23.0, 31.0, 12.0, 15.0, 19.0, 11.0, 10.0, 6.0, 2.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.204261779785156, -53.45351791381836, -50.7027702331543, -47.9520263671875, -45.2012825012207, -42.450538635253906, -39.699790954589844, -36.94904708862305, -34.19830322265625, -31.44755744934082, -28.696813583374023, -25.946067810058594, -23.195323944091797, -20.444578170776367, -17.693832397460938, -14.94308853149414, -12.192340850830078, -9.441596031188965, -6.690850734710693, -3.940105438232422, -1.1893606185913086, 1.5613842010498047, 4.312129974365234, 7.062873840332031, 9.813619613647461, 12.564364433288574, 15.315109252929688, 18.065855026245117, 20.816600799560547, 23.567344665527344, 26.318090438842773, 29.06883430480957, 31.819580078125, 34.5703239440918, 37.32107162475586, 40.071815490722656, 42.82255935668945, 45.57330322265625, 48.32405090332031, 51.07479476928711, 53.825538635253906, 56.5762825012207, 59.327030181884766, 62.07777404785156, 64.82852172851562, 67.57926177978516, 70.33000946044922, 73.08074951171875, 75.83149719238281, 78.58224487304688, 81.3329849243164, 84.08373260498047, 86.83448028564453, 89.58522033691406, 92.33596801757812, 95.08671569824219, 97.83746337890625, 100.58821105957031, 103.33895111083984, 106.0896987915039, 108.84044647216797, 111.5911865234375, 114.34193420410156, 117.09268188476562, 119.84342193603516]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 22.0, 38.0, 50.0, 56.0, 73.0, 390.0, 148.0, 77.0, 49.0, 26.0, 24.0, 14.0, 11.0, 9.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -5.841552734375, -5.38623046875, -4.930908203125, -4.4755859375, -4.020263671875, -3.56494140625, -3.109619140625, -2.654296875, -2.198974609375, -1.74365234375, -1.288330078125, -0.8330078125, -0.377685546875, 0.07763671875, 0.532958984375, 0.98828125, 1.443603515625, 1.89892578125, 2.354248046875, 2.8095703125, 3.264892578125, 3.72021484375, 4.175537109375, 4.630859375, 5.086181640625, 5.54150390625, 5.996826171875, 6.4521484375, 6.907470703125, 7.36279296875, 7.818115234375, 8.2734375, 8.728759765625, 9.18408203125, 9.639404296875, 10.0947265625, 10.550048828125, 11.00537109375, 11.460693359375, 11.916015625, 12.371337890625, 12.82666015625, 13.281982421875, 13.7373046875, 14.192626953125, 14.64794921875, 15.103271484375, 15.55859375, 16.013916015625, 16.46923828125, 16.924560546875, 17.3798828125, 17.835205078125, 18.29052734375, 18.745849609375, 19.201171875, 19.656494140625, 20.11181640625, 20.567138671875, 21.0224609375, 21.477783203125, 21.93310546875, 22.388427734375, 22.84375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 7.0, 7.0, 10.0, 19.0, 12.0, 12.0, 23.0, 31.0, 66.0, 85.0, 141.0, 260.0, 472.0, 1196.0, 3937.0, 26785.0, 8332886.0, 17267.0, 3247.0, 1051.0, 476.0, 221.0, 117.0, 68.0, 38.0, 36.0, 28.0, 23.0, 5.0, 10.0, 8.0, 4.0, 3.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.35891723632812, -72.37186431884766, -70.38480377197266, -68.39775085449219, -66.41069793701172, -64.42364501953125, -62.436588287353516, -60.44953155517578, -58.46247863769531, -56.47542190551758, -54.48836898803711, -52.501312255859375, -50.514259338378906, -48.52720260620117, -46.5401496887207, -44.55309295654297, -42.5660400390625, -40.578983306884766, -38.5919303894043, -36.60487365722656, -34.617820739746094, -32.63076400756836, -30.64371109008789, -28.656654357910156, -26.669597625732422, -24.68254280090332, -22.69548797607422, -20.708433151245117, -18.721378326416016, -16.73432159423828, -14.747267723083496, -12.760212898254395, -10.77315902709961, -8.786104202270508, -6.799049377441406, -4.8119940757751465, -2.824939250946045, -0.8378839492797852, 1.1491708755493164, 3.136225700378418, 5.1232805252075195, 7.110335350036621, 9.097390174865723, 11.08444595336914, 13.071500778198242, 15.058555603027344, 17.045610427856445, 19.032665252685547, 21.01972007751465, 23.00677490234375, 24.99382972717285, 26.980884552001953, 28.967939376831055, 30.954994201660156, 32.94205093383789, 34.92910385131836, 36.916160583496094, 38.90321731567383, 40.8902702331543, 42.87732696533203, 44.8643798828125, 46.851436614990234, 48.8384895324707, 50.82554626464844, 52.812599182128906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 7.0, 2.0, 12.0, 6.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.6932601928711, -101.4347915649414, -98.17632293701172, -94.9178466796875, -91.65937805175781, -88.40090942382812, -85.14244079589844, -81.88397216796875, -78.62550354003906, -75.36703491210938, -72.10856628417969, -68.85009765625, -65.59162139892578, -62.333152770996094, -59.074684143066406, -55.81621551513672, -52.5577392578125, -49.29927062988281, -46.04079818725586, -42.78232955932617, -39.52385711669922, -36.26538848876953, -33.006919860839844, -29.748449325561523, -26.489978790283203, -23.231508255004883, -19.973037719726562, -16.714569091796875, -13.456098556518555, -10.197628021240234, -6.939159393310547, -3.6806888580322266, -0.42221832275390625, 2.836251735687256, 6.094721794128418, 9.353191375732422, 12.611661911010742, 15.870132446289062, 19.12860107421875, 22.38707160949707, 25.64554214477539, 28.90401268005371, 32.16248321533203, 35.42095184326172, 38.679420471191406, 41.93789291381836, 45.19636154174805, 48.454833984375, 51.71330261230469, 54.971771240234375, 58.23024368286133, 61.488712310791016, 64.74718475341797, 68.00565338134766, 71.26412200927734, 74.52259063720703, 77.78106689453125, 81.03953552246094, 84.29800415039062, 87.55647277832031, 90.81494903564453, 94.07341766357422, 97.3318862915039, 100.5903549194336, 103.84882354736328]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 14.0, 14.0, 12.0, 25.0, 23.0, 30.0, 51.0, 61.0, 100.0, 157.0, 247.0, 389.0, 687.0, 1285.0, 2881.0, 6931.0, 20415.0, 70636.0, 216126.0, 142807.0, 40175.0, 12340.0, 4569.0, 2020.0, 951.0, 511.0, 298.0, 170.0, 108.0, 74.0, 47.0, 27.0, 23.0, 13.0, 8.0, 10.0, 5.0, 3.0, 2.0], "bins": [-84.125, -82.203125, -80.28125, -78.359375, -76.4375, -74.515625, -72.59375, -70.671875, -68.75, -66.828125, -64.90625, -62.984375, -61.0625, -59.140625, -57.21875, -55.296875, -53.375, -51.453125, -49.53125, -47.609375, -45.6875, -43.765625, -41.84375, -39.921875, -38.0, -36.078125, -34.15625, -32.234375, -30.3125, -28.390625, -26.46875, -24.546875, -22.625, -20.703125, -18.78125, -16.859375, -14.9375, -13.015625, -11.09375, -9.171875, -7.25, -5.328125, -3.40625, -1.484375, 0.4375, 2.359375, 4.28125, 6.203125, 8.125, 10.046875, 11.96875, 13.890625, 15.8125, 17.734375, 19.65625, 21.578125, 23.5, 25.421875, 27.34375, 29.265625, 31.1875, 33.109375, 35.03125, 36.953125, 38.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 13.0, 14.0, 22.0, 26.0, 45.0, 59.0, 72.0, 101.0, 112.0, 110.0, 110.0, 113.0, 72.0, 41.0, 47.0, 19.0, 15.0, 5.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -16.0570068359375, -15.676513671875, -15.2960205078125, -14.91552734375, -14.5350341796875, -14.154541015625, -13.7740478515625, -13.3935546875, -13.0130615234375, -12.632568359375, -12.2520751953125, -11.87158203125, -11.4910888671875, -11.110595703125, -10.7301025390625, -10.349609375, -9.9691162109375, -9.588623046875, -9.2081298828125, -8.82763671875, -8.4471435546875, -8.066650390625, -7.6861572265625, -7.3056640625, -6.9251708984375, -6.544677734375, -6.1641845703125, -5.78369140625, -5.4031982421875, -5.022705078125, -4.6422119140625, -4.26171875, -3.8812255859375, -3.500732421875, -3.1202392578125, -2.73974609375, -2.3592529296875, -1.978759765625, -1.5982666015625, -1.2177734375, -0.8372802734375, -0.456787109375, -0.0762939453125, 0.30419921875, 0.6846923828125, 1.065185546875, 1.4456787109375, 1.826171875, 2.2066650390625, 2.587158203125, 2.9676513671875, 3.34814453125, 3.7286376953125, 4.109130859375, 4.4896240234375, 4.8701171875, 5.2506103515625, 5.631103515625, 6.0115966796875, 6.39208984375, 6.7725830078125, 7.153076171875, 7.5335693359375, 7.9140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 14.0, 13.0, 20.0, 18.0, 38.0, 55.0, 78.0, 77.0, 54.0, 35.0, 14.0, 13.0, 16.0, 7.0, 4.0, 1.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.44195556640625, -64.41422271728516, -62.3864860534668, -60.3587532043457, -58.33102035522461, -56.30328369140625, -54.275550842285156, -52.24781799316406, -50.22008514404297, -48.192352294921875, -46.164615631103516, -44.13688278198242, -42.10914993286133, -40.08141326904297, -38.053680419921875, -36.02594757080078, -33.99821090698242, -31.970476150512695, -29.9427433013916, -27.915008544921875, -25.88727569580078, -23.859540939331055, -21.831806182861328, -19.804073333740234, -17.776338577270508, -15.748604774475098, -13.720870971679688, -11.693136215209961, -9.66540241241455, -7.637668609619141, -5.609933853149414, -3.582200050354004, -1.5544700622558594, 0.4732639789581299, 2.500998020172119, 4.5287322998046875, 6.556466102600098, 8.584199905395508, 10.611934661865234, 12.639668464660645, 14.667402267456055, 16.69513702392578, 18.722869873046875, 20.7506046295166, 22.778339385986328, 24.806072235107422, 26.83380699157715, 28.861541748046875, 30.88927459716797, 32.91700744628906, 34.94474411010742, 36.972476959228516, 39.00020980834961, 41.02794647216797, 43.05567932128906, 45.083412170410156, 47.11114501953125, 49.138877868652344, 51.1666145324707, 53.1943473815918, 55.22208023071289, 57.24981689453125, 59.277549743652344, 61.30528259277344, 63.3330192565918]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 14.0, 15.0, 25.0, 34.0, 39.0, 54.0, 60.0, 75.0, 54.0, 34.0, 17.0, 13.0, 5.0, 5.0, 1.0, 4.0, 0.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.305160522460938, -28.190046310424805, -27.074932098388672, -25.959819793701172, -24.84470558166504, -23.729591369628906, -22.614479064941406, -21.499364852905273, -20.38425064086914, -19.269136428833008, -18.154022216796875, -17.038909912109375, -15.923795700073242, -14.80868148803711, -13.693568229675293, -12.578454971313477, -11.463340759277344, -10.348226547241211, -9.233113288879395, -8.118000030517578, -7.002885818481445, -5.887772083282471, -4.772658348083496, -3.6575446128845215, -2.542430877685547, -1.4273171424865723, -0.31220340728759766, 0.802910327911377, 1.9180240631103516, 3.033137798309326, 4.148251533508301, 5.263365268707275, 6.378482818603516, 7.49359655380249, 8.608710289001465, 9.723823547363281, 10.838937759399414, 11.954051971435547, 13.069165229797363, 14.18427848815918, 15.299392700195312, 16.414506912231445, 17.529621124267578, 18.644733428955078, 19.75984764099121, 20.874961853027344, 21.990074157714844, 23.105188369750977, 24.22030258178711, 25.335416793823242, 26.450531005859375, 27.565643310546875, 28.680757522583008, 29.79587173461914, 30.91098403930664, 32.026100158691406, 33.141212463378906, 34.256324768066406, 35.37144088745117, 36.48655319213867, 37.60166931152344, 38.71678161621094, 39.83189392089844, 40.9470100402832, 42.0621223449707]}, "eval/loss": 0.832387387752533, "eval/wer": 0.1073079746810326, "eval/runtime": 1358.7502, "eval/samples_per_second": 1.944, "eval/steps_per_second": 0.244, "train/train_runtime": 122857.9097, "train/train_samples_per_second": 4.646, "train/train_steps_per_second": 0.145, "train/total_flos": 0.0, "train/train_loss": 2.2609593777487165} \ No newline at end of file