{"train/loss": 4.613, "train/learning_rate": 3.980000000000001e-06, "train/epoch": 0.78, "train/global_step": 200, "_runtime": 3637, "_timestamp": 1646097923, "_step": 199, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 73.0, 900.0, 41.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-161.31320190429688, -136.36038208007812, -111.40756225585938, -86.45474243164062, -61.501922607421875, -36.549102783203125, -11.596282958984375, 13.356536865234375, 38.309356689453125, 63.262176513671875, 88.21499633789062, 113.16781616210938, 138.12063598632812, 163.07345581054688, 188.02627563476562, 212.97909545898438, 237.93191528320312, 262.8847351074219, 287.8375549316406, 312.7903747558594, 337.7431945800781, 362.6960144042969, 387.6488342285156, 412.6016540527344, 437.5544738769531, 462.5072937011719, 487.4601135253906, 512.4129638671875, 537.36572265625, 562.318603515625, 587.2713623046875, 612.2242431640625, 637.177001953125, 662.1298217773438, 687.0826416015625, 712.0354614257812, 736.98828125, 761.9411010742188, 786.8939208984375, 811.8467407226562, 836.799560546875, 861.7523803710938, 886.7052001953125, 911.6580200195312, 936.61083984375, 961.5636596679688, 986.5164794921875, 1011.4692993164062, 1036.422119140625, 1061.375, 1086.3277587890625, 1111.280517578125, 1136.2333984375, 1161.186279296875, 1186.1390380859375, 1211.091796875, 1236.044677734375, 1260.99755859375, 1285.9503173828125, 1310.903076171875, 1335.85595703125, 1360.808837890625, 1385.7615966796875, 1410.71435546875, 1435.667236328125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 5.0, 5.0, 7.0, 12.0, 10.0, 22.0, 20.0, 13.0, 23.0, 24.0, 31.0, 44.0, 46.0, 48.0, 51.0, 42.0, 39.0, 58.0, 47.0, 47.0, 52.0, 56.0, 42.0, 49.0, 30.0, 29.0, 29.0, 23.0, 17.0, 15.0, 11.0, 12.0, 6.0, 4.0, 8.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.15585327148438, -106.0435791015625, -101.93130493164062, -97.81903076171875, -93.70675659179688, -89.594482421875, -85.48221588134766, -81.36994171142578, -77.2576675415039, -73.14539337158203, -69.03311920166016, -64.92084503173828, -60.80857467651367, -56.6963005065918, -52.58403015136719, -48.47175598144531, -44.35948181152344, -40.24720764160156, -36.13493347167969, -32.02266311645508, -27.910388946533203, -23.798114776611328, -19.685842514038086, -15.573570251464844, -11.461296081542969, -7.34902286529541, -3.2367496490478516, 0.875523567199707, 4.987796783447266, 9.10007095336914, 13.212343215942383, 17.324615478515625, 21.436874389648438, 25.549148559570312, 29.661420822143555, 33.7736930847168, 37.88596725463867, 41.99824142456055, 46.110511779785156, 50.22278594970703, 54.335060119628906, 58.44733428955078, 62.559608459472656, 66.67188262939453, 70.78414916992188, 74.89642333984375, 79.00869750976562, 83.1209716796875, 87.23324584960938, 91.34552001953125, 95.45779418945312, 99.570068359375, 103.68234252929688, 107.79461669921875, 111.9068832397461, 116.01915740966797, 120.13143157958984, 124.24370574951172, 128.35597229003906, 132.46824645996094, 136.5805206298828, 140.6927947998047, 144.80506896972656, 148.91734313964844, 153.0296173095703]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 3.0, 6.0, 10.0, 9.0, 10.0, 15.0, 15.0, 19.0, 15.0, 32.0, 38.0, 44.0, 39.0, 44.0, 42.0, 61.0, 44.0, 45.0, 43.0, 48.0, 48.0, 49.0, 37.0, 30.0, 47.0, 39.0, 24.0, 26.0, 25.0, 17.0, 14.0, 16.0, 14.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.4921875, -13.1370849609375, -12.781982421875, -12.4268798828125, -12.07177734375, -11.7166748046875, -11.361572265625, -11.0064697265625, -10.6513671875, -10.2962646484375, -9.941162109375, -9.5860595703125, -9.23095703125, -8.8758544921875, -8.520751953125, -8.1656494140625, -7.810546875, -7.4554443359375, -7.100341796875, -6.7452392578125, -6.39013671875, -6.0350341796875, -5.679931640625, -5.3248291015625, -4.9697265625, -4.6146240234375, -4.259521484375, -3.9044189453125, -3.54931640625, -3.1942138671875, -2.839111328125, -2.4840087890625, -2.12890625, -1.7738037109375, -1.418701171875, -1.0635986328125, -0.70849609375, -0.3533935546875, 0.001708984375, 0.3568115234375, 0.7119140625, 1.0670166015625, 1.422119140625, 1.7772216796875, 2.13232421875, 2.4874267578125, 2.842529296875, 3.1976318359375, 3.552734375, 3.9078369140625, 4.262939453125, 4.6180419921875, 4.97314453125, 5.3282470703125, 5.683349609375, 6.0384521484375, 6.3935546875, 6.7486572265625, 7.103759765625, 7.4588623046875, 7.81396484375, 8.1690673828125, 8.524169921875, 8.8792724609375, 9.234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 12.0, 10.0, 8.0, 11.0, 14.0, 13.0, 24.0, 32.0, 49.0, 52.0, 78.0, 109.0, 132.0, 193.0, 262.0, 368.0, 572.0, 960.0, 1723.0, 3279.0, 7870.0, 26251.0, 204815.0, 2190743.0, 1589554.0, 133036.0, 20686.0, 6541.0, 2793.0, 1444.0, 873.0, 523.0, 356.0, 258.0, 158.0, 132.0, 79.0, 67.0, 56.0, 41.0, 30.0, 15.0, 17.0, 14.0, 10.0, 12.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.135986328125, -27.16259765625, -26.189208984375, -25.2158203125, -24.242431640625, -23.26904296875, -22.295654296875, -21.322265625, -20.348876953125, -19.37548828125, -18.402099609375, -17.4287109375, -16.455322265625, -15.48193359375, -14.508544921875, -13.53515625, -12.561767578125, -11.58837890625, -10.614990234375, -9.6416015625, -8.668212890625, -7.69482421875, -6.721435546875, -5.748046875, -4.774658203125, -3.80126953125, -2.827880859375, -1.8544921875, -0.881103515625, 0.09228515625, 1.065673828125, 2.0390625, 3.012451171875, 3.98583984375, 4.959228515625, 5.9326171875, 6.906005859375, 7.87939453125, 8.852783203125, 9.826171875, 10.799560546875, 11.77294921875, 12.746337890625, 13.7197265625, 14.693115234375, 15.66650390625, 16.639892578125, 17.61328125, 18.586669921875, 19.56005859375, 20.533447265625, 21.5068359375, 22.480224609375, 23.45361328125, 24.427001953125, 25.400390625, 26.373779296875, 27.34716796875, 28.320556640625, 29.2939453125, 30.267333984375, 31.24072265625, 32.214111328125, 33.1875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 12.0, 13.0, 19.0, 39.0, 39.0, 65.0, 101.0, 157.0, 310.0, 452.0, 681.0, 747.0, 486.0, 326.0, 215.0, 117.0, 71.0, 59.0, 35.0, 25.0, 21.0, 18.0, 10.0, 4.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.84375, -36.38818359375, -34.9326171875, -33.47705078125, -32.021484375, -30.56591796875, -29.1103515625, -27.65478515625, -26.19921875, -24.74365234375, -23.2880859375, -21.83251953125, -20.376953125, -18.92138671875, -17.4658203125, -16.01025390625, -14.5546875, -13.09912109375, -11.6435546875, -10.18798828125, -8.732421875, -7.27685546875, -5.8212890625, -4.36572265625, -2.91015625, -1.45458984375, 0.0009765625, 1.45654296875, 2.912109375, 4.36767578125, 5.8232421875, 7.27880859375, 8.734375, 10.18994140625, 11.6455078125, 13.10107421875, 14.556640625, 16.01220703125, 17.4677734375, 18.92333984375, 20.37890625, 21.83447265625, 23.2900390625, 24.74560546875, 26.201171875, 27.65673828125, 29.1123046875, 30.56787109375, 32.0234375, 33.47900390625, 34.9345703125, 36.39013671875, 37.845703125, 39.30126953125, 40.7568359375, 42.21240234375, 43.66796875, 45.12353515625, 46.5791015625, 48.03466796875, 49.490234375, 50.94580078125, 52.4013671875, 53.85693359375, 55.3125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 7.0, 10.0, 15.0, 21.0, 30.0, 51.0, 57.0, 115.0, 180.0, 319.0, 644.0, 1601.0, 15659.0, 4145929.0, 26075.0, 1984.0, 683.0, 376.0, 191.0, 109.0, 58.0, 54.0, 30.0, 19.0, 24.0, 10.0, 7.0, 5.0, 6.0, 2.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.625, -230.486328125, -224.34765625, -218.208984375, -212.0703125, -205.931640625, -199.79296875, -193.654296875, -187.515625, -181.376953125, -175.23828125, -169.099609375, -162.9609375, -156.822265625, -150.68359375, -144.544921875, -138.40625, -132.267578125, -126.12890625, -119.990234375, -113.8515625, -107.712890625, -101.57421875, -95.435546875, -89.296875, -83.158203125, -77.01953125, -70.880859375, -64.7421875, -58.603515625, -52.46484375, -46.326171875, -40.1875, -34.048828125, -27.91015625, -21.771484375, -15.6328125, -9.494140625, -3.35546875, 2.783203125, 8.921875, 15.060546875, 21.19921875, 27.337890625, 33.4765625, 39.615234375, 45.75390625, 51.892578125, 58.03125, 64.169921875, 70.30859375, 76.447265625, 82.5859375, 88.724609375, 94.86328125, 101.001953125, 107.140625, 113.279296875, 119.41796875, 125.556640625, 131.6953125, 137.833984375, 143.97265625, 150.111328125, 156.25]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 75.0, 908.0, 28.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-952.5120239257812, -927.0051879882812, -901.498291015625, -875.991455078125, -850.4845581054688, -824.9777221679688, -799.4708251953125, -773.9639892578125, -748.4571533203125, -722.9503173828125, -697.4434204101562, -671.9365844726562, -646.4296875, -620.9228515625, -595.416015625, -569.9091186523438, -544.4022216796875, -518.8953857421875, -493.38848876953125, -467.88165283203125, -442.374755859375, -416.867919921875, -391.3610534667969, -365.85418701171875, -340.3473205566406, -314.8404541015625, -289.3335876464844, -263.82672119140625, -238.3198699951172, -212.81300354003906, -187.30615234375, -161.79928588867188, -136.29248046875, -110.78561401367188, -85.27875518798828, -59.77189636230469, -34.26502990722656, -8.758163452148438, 16.748687744140625, 42.25555419921875, 67.76242065429688, 93.269287109375, 118.7761459350586, 144.2830047607422, 169.7898712158203, 195.29673767089844, 220.8035888671875, 246.31045532226562, 271.81732177734375, 297.3241882324219, 322.8310546875, 348.337890625, 373.84478759765625, 399.35162353515625, 424.8584899902344, 450.3653564453125, 475.8722229003906, 501.37908935546875, 526.8859252929688, 552.392822265625, 577.899658203125, 603.4065551757812, 628.9133911132812, 654.4202880859375, 679.9271240234375]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 19.0, 16.0, 20.0, 15.0, 16.0, 25.0, 33.0, 22.0, 34.0, 30.0, 46.0, 28.0, 37.0, 56.0, 50.0, 41.0, 51.0, 46.0, 42.0, 37.0, 45.0, 42.0, 36.0, 35.0, 34.0, 23.0, 23.0, 21.0, 13.0, 15.0, 10.0, 8.0, 9.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-174.14617919921875, -169.54042053222656, -164.93466186523438, -160.32891845703125, -155.72315979003906, -151.11740112304688, -146.5116424560547, -141.9058837890625, -137.30014038085938, -132.6943817138672, -128.088623046875, -123.48287200927734, -118.87712097167969, -114.2713623046875, -109.66560363769531, -105.05984497070312, -100.45408630371094, -95.84832763671875, -91.2425765991211, -86.6368179321289, -82.03106689453125, -77.42530822753906, -72.81954956054688, -68.21379089355469, -63.60803985595703, -59.00228500366211, -54.39653015136719, -49.790771484375, -45.18501663208008, -40.579261779785156, -35.97350311279297, -31.367748260498047, -26.761978149414062, -22.15622329711914, -17.550466537475586, -12.944710731506348, -8.33895492553711, -3.7332000732421875, 0.8725566864013672, 5.478313446044922, 10.084068298339844, 14.689824104309082, 19.29557991027832, 23.901336669921875, 28.507091522216797, 33.11284637451172, 37.718605041503906, 42.32435989379883, 46.93011474609375, 51.53586959838867, 56.141624450683594, 60.74738311767578, 65.35313415527344, 69.95889282226562, 74.56465148925781, 79.17041015625, 83.77616119384766, 88.38191986083984, 92.9876708984375, 97.59342956542969, 102.19918823242188, 106.80493927001953, 111.41069793701172, 116.01644897460938, 120.62220764160156]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 14.0, 9.0, 10.0, 16.0, 10.0, 20.0, 20.0, 30.0, 29.0, 41.0, 35.0, 49.0, 35.0, 37.0, 59.0, 45.0, 46.0, 60.0, 41.0, 34.0, 43.0, 32.0, 27.0, 26.0, 31.0, 25.0, 22.0, 25.0, 22.0, 10.0, 14.0, 15.0, 15.0, 8.0, 9.0, 7.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.265625, -11.8897705078125, -11.513916015625, -11.1380615234375, -10.76220703125, -10.3863525390625, -10.010498046875, -9.6346435546875, -9.2587890625, -8.8829345703125, -8.507080078125, -8.1312255859375, -7.75537109375, -7.3795166015625, -7.003662109375, -6.6278076171875, -6.251953125, -5.8760986328125, -5.500244140625, -5.1243896484375, -4.74853515625, -4.3726806640625, -3.996826171875, -3.6209716796875, -3.2451171875, -2.8692626953125, -2.493408203125, -2.1175537109375, -1.74169921875, -1.3658447265625, -0.989990234375, -0.6141357421875, -0.23828125, 0.1375732421875, 0.513427734375, 0.8892822265625, 1.26513671875, 1.6409912109375, 2.016845703125, 2.3927001953125, 2.7685546875, 3.1444091796875, 3.520263671875, 3.8961181640625, 4.27197265625, 4.6478271484375, 5.023681640625, 5.3995361328125, 5.775390625, 6.1512451171875, 6.527099609375, 6.9029541015625, 7.27880859375, 7.6546630859375, 8.030517578125, 8.4063720703125, 8.7822265625, 9.1580810546875, 9.533935546875, 9.9097900390625, 10.28564453125, 10.6614990234375, 11.037353515625, 11.4132080078125, 11.7890625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 6.0, 6.0, 9.0, 19.0, 26.0, 37.0, 46.0, 63.0, 103.0, 123.0, 209.0, 280.0, 397.0, 638.0, 781.0, 1249.0, 1874.0, 2668.0, 3986.0, 6074.0, 9409.0, 14932.0, 24051.0, 40171.0, 69692.0, 132385.0, 356997.0, 173336.0, 83911.0, 47412.0, 28237.0, 17480.0, 10841.0, 7008.0, 4587.0, 3010.0, 2074.0, 1392.0, 892.0, 662.0, 410.0, 319.0, 204.0, 173.0, 106.0, 63.0, 67.0, 43.0, 35.0, 24.0, 11.0, 7.0, 11.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-3.009765625, -2.9176025390625, -2.825439453125, -2.7332763671875, -2.64111328125, -2.5489501953125, -2.456787109375, -2.3646240234375, -2.2724609375, -2.1802978515625, -2.088134765625, -1.9959716796875, -1.90380859375, -1.8116455078125, -1.719482421875, -1.6273193359375, -1.53515625, -1.4429931640625, -1.350830078125, -1.2586669921875, -1.16650390625, -1.0743408203125, -0.982177734375, -0.8900146484375, -0.7978515625, -0.7056884765625, -0.613525390625, -0.5213623046875, -0.42919921875, -0.3370361328125, -0.244873046875, -0.1527099609375, -0.060546875, 0.0316162109375, 0.123779296875, 0.2159423828125, 0.30810546875, 0.4002685546875, 0.492431640625, 0.5845947265625, 0.6767578125, 0.7689208984375, 0.861083984375, 0.9532470703125, 1.04541015625, 1.1375732421875, 1.229736328125, 1.3218994140625, 1.4140625, 1.5062255859375, 1.598388671875, 1.6905517578125, 1.78271484375, 1.8748779296875, 1.967041015625, 2.0592041015625, 2.1513671875, 2.2435302734375, 2.335693359375, 2.4278564453125, 2.52001953125, 2.6121826171875, 2.704345703125, 2.7965087890625, 2.888671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 8.0, 5.0, 9.0, 7.0, 10.0, 23.0, 16.0, 22.0, 17.0, 30.0, 32.0, 24.0, 27.0, 38.0, 35.0, 41.0, 40.0, 48.0, 53.0, 1072.0, 47.0, 29.0, 38.0, 38.0, 42.0, 36.0, 27.0, 32.0, 27.0, 33.0, 16.0, 13.0, 19.0, 14.0, 10.0, 7.0, 9.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.65234375, -7.41094970703125, -7.1695556640625, -6.92816162109375, -6.686767578125, -6.44537353515625, -6.2039794921875, -5.96258544921875, -5.72119140625, -5.47979736328125, -5.2384033203125, -4.99700927734375, -4.755615234375, -4.51422119140625, -4.2728271484375, -4.03143310546875, -3.7900390625, -3.54864501953125, -3.3072509765625, -3.06585693359375, -2.824462890625, -2.58306884765625, -2.3416748046875, -2.10028076171875, -1.85888671875, -1.61749267578125, -1.3760986328125, -1.13470458984375, -0.893310546875, -0.65191650390625, -0.4105224609375, -0.16912841796875, 0.072265625, 0.31365966796875, 0.5550537109375, 0.79644775390625, 1.037841796875, 1.27923583984375, 1.5206298828125, 1.76202392578125, 2.00341796875, 2.24481201171875, 2.4862060546875, 2.72760009765625, 2.968994140625, 3.21038818359375, 3.4517822265625, 3.69317626953125, 3.9345703125, 4.17596435546875, 4.4173583984375, 4.65875244140625, 4.900146484375, 5.14154052734375, 5.3829345703125, 5.62432861328125, 5.86572265625, 6.10711669921875, 6.3485107421875, 6.58990478515625, 6.831298828125, 7.07269287109375, 7.3140869140625, 7.55548095703125, 7.796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 13.0, 10.0, 14.0, 21.0, 32.0, 62.0, 65.0, 102.0, 122.0, 196.0, 262.0, 401.0, 613.0, 842.0, 1252.0, 1981.0, 3018.0, 4573.0, 7421.0, 11787.0, 19181.0, 30977.0, 51942.0, 90729.0, 184893.0, 1388135.0, 124607.0, 68052.0, 39949.0, 24483.0, 14776.0, 9494.0, 5798.0, 3794.0, 2473.0, 1576.0, 1043.0, 780.0, 548.0, 343.0, 202.0, 164.0, 118.0, 79.0, 66.0, 38.0, 35.0, 15.0, 14.0, 13.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.052734375, -2.95806884765625, -2.8634033203125, -2.76873779296875, -2.674072265625, -2.57940673828125, -2.4847412109375, -2.39007568359375, -2.29541015625, -2.20074462890625, -2.1060791015625, -2.01141357421875, -1.916748046875, -1.82208251953125, -1.7274169921875, -1.63275146484375, -1.5380859375, -1.44342041015625, -1.3487548828125, -1.25408935546875, -1.159423828125, -1.06475830078125, -0.9700927734375, -0.87542724609375, -0.78076171875, -0.68609619140625, -0.5914306640625, -0.49676513671875, -0.402099609375, -0.30743408203125, -0.2127685546875, -0.11810302734375, -0.0234375, 0.07122802734375, 0.1658935546875, 0.26055908203125, 0.355224609375, 0.44989013671875, 0.5445556640625, 0.63922119140625, 0.73388671875, 0.82855224609375, 0.9232177734375, 1.01788330078125, 1.112548828125, 1.20721435546875, 1.3018798828125, 1.39654541015625, 1.4912109375, 1.58587646484375, 1.6805419921875, 1.77520751953125, 1.869873046875, 1.96453857421875, 2.0592041015625, 2.15386962890625, 2.24853515625, 2.34320068359375, 2.4378662109375, 2.53253173828125, 2.627197265625, 2.72186279296875, 2.8165283203125, 2.91119384765625, 3.005859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 8.0, 8.0, 6.0, 9.0, 18.0, 20.0, 21.0, 27.0, 30.0, 40.0, 63.0, 84.0, 92.0, 88.0, 92.0, 98.0, 70.0, 47.0, 38.0, 27.0, 29.0, 20.0, 14.0, 17.0, 9.0, 8.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031032562255859375, -0.0030132830142974854, -0.002923309803009033, -0.002833336591720581, -0.002743363380432129, -0.0026533901691436768, -0.0025634169578552246, -0.0024734437465667725, -0.0023834705352783203, -0.002293497323989868, -0.002203524112701416, -0.002113550901412964, -0.0020235776901245117, -0.0019336044788360596, -0.0018436312675476074, -0.0017536580562591553, -0.0016636848449707031, -0.001573711633682251, -0.0014837384223937988, -0.0013937652111053467, -0.0013037919998168945, -0.0012138187885284424, -0.0011238455772399902, -0.001033872365951538, -0.0009438991546630859, -0.0008539259433746338, -0.0007639527320861816, -0.0006739795207977295, -0.0005840063095092773, -0.0004940330982208252, -0.00040405988693237305, -0.0003140866756439209, -0.00022411346435546875, -0.0001341402530670166, -4.416704177856445e-05, 4.5806169509887695e-05, 0.00013577938079833984, 0.000225752592086792, 0.00031572580337524414, 0.0004056990146636963, 0.0004956722259521484, 0.0005856454372406006, 0.0006756186485290527, 0.0007655918598175049, 0.000855565071105957, 0.0009455382823944092, 0.0010355114936828613, 0.0011254847049713135, 0.0012154579162597656, 0.0013054311275482178, 0.00139540433883667, 0.001485377550125122, 0.0015753507614135742, 0.0016653239727020264, 0.0017552971839904785, 0.0018452703952789307, 0.0019352436065673828, 0.002025216817855835, 0.002115190029144287, 0.0022051632404327393, 0.0022951364517211914, 0.0023851096630096436, 0.0024750828742980957, 0.002565056085586548, 0.002655029296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 7.0, 14.0, 18.0, 21.0, 38.0, 56.0, 67.0, 100.0, 134.0, 221.0, 341.0, 661.0, 1767.0, 1042402.0, 1202.0, 530.0, 335.0, 202.0, 119.0, 91.0, 67.0, 54.0, 28.0, 18.0, 10.0, 8.0, 10.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0543212890625, -0.05247306823730469, -0.050624847412109375, -0.04877662658691406, -0.04692840576171875, -0.04508018493652344, -0.043231964111328125, -0.04138374328613281, -0.0395355224609375, -0.03768730163574219, -0.035839080810546875, -0.03399085998535156, -0.03214263916015625, -0.030294418334960938, -0.028446197509765625, -0.026597976684570312, -0.024749755859375, -0.022901535034179688, -0.021053314208984375, -0.019205093383789062, -0.01735687255859375, -0.015508651733398438, -0.013660430908203125, -0.011812210083007812, -0.0099639892578125, -0.008115768432617188, -0.006267547607421875, -0.0044193267822265625, -0.00257110595703125, -0.0007228851318359375, 0.001125335693359375, 0.0029735565185546875, 0.00482177734375, 0.0066699981689453125, 0.008518218994140625, 0.010366439819335938, 0.01221466064453125, 0.014062881469726562, 0.015911102294921875, 0.017759323120117188, 0.0196075439453125, 0.021455764770507812, 0.023303985595703125, 0.025152206420898438, 0.02700042724609375, 0.028848648071289062, 0.030696868896484375, 0.03254508972167969, 0.034393310546875, 0.03624153137207031, 0.038089752197265625, 0.03993797302246094, 0.04178619384765625, 0.04363441467285156, 0.045482635498046875, 0.04733085632324219, 0.0491790771484375, 0.05102729797363281, 0.052875518798828125, 0.05472373962402344, 0.05657196044921875, 0.05842018127441406, 0.060268402099609375, 0.06211662292480469, 0.06396484375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 74.0, 590.0, 317.0, 25.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006508379592560232, -0.0005672624101862311, -0.0004836868611164391, -0.0004001112829428166, -0.0003165357338730246, -0.00023296018480323255, -0.00014938460662961006, -6.580905755981803e-05, 1.7766491509974003e-05, 0.00010134204785572365, 0.0001849176042014733, 0.00026849316782318056, 0.0003520687168929726, 0.0004356442659627646, 0.0005192198441363871, 0.0006027953932061791, 0.0006863709422759712, 0.0007699464913457632, 0.0008535220404155552, 0.0009370975894853473, 0.0010206731967628002, 0.0011042486876249313, 0.0011878242949023843, 0.0012713999021798372, 0.0013549753930419683, 0.0014385510003194213, 0.0015221264911815524, 0.0016057020984590054, 0.0016892775893211365, 0.0017728531965985894, 0.0018564288038760424, 0.0019400042947381735, 0.0020235797856003046, 0.0021071552764624357, 0.0021907310001552105, 0.0022743064910173416, 0.0023578819818794727, 0.002441457472741604, 0.0025250331964343786, 0.0026086086872965097, 0.002692184178158641, 0.002775759669020772, 0.0028593353927135468, 0.002942910883575678, 0.003026486374437809, 0.00311006186529994, 0.003193637588992715, 0.003277213079854846, 0.0033607888035476208, 0.003444364294409752, 0.0035279400181025267, 0.003611515508964658, 0.003695090999826789, 0.00377866649068892, 0.003862242214381695, 0.003945817705243826, 0.004029393196105957, 0.004112968686968088, 0.004196544177830219, 0.00428011966869235, 0.004363695625215769, 0.0044472711160779, 0.004530846606940031, 0.004614422097802162, 0.004697997588664293]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 6.0, 6.0, 9.0, 7.0, 13.0, 11.0, 13.0, 14.0, 21.0, 17.0, 20.0, 29.0, 27.0, 26.0, 22.0, 36.0, 31.0, 40.0, 51.0, 50.0, 31.0, 38.0, 32.0, 34.0, 36.0, 39.0, 29.0, 35.0, 29.0, 25.0, 29.0, 29.0, 20.0, 22.0, 21.0, 19.0, 13.0, 10.0, 13.0, 7.0, 8.0, 8.0, 8.0, 6.0, 1.0, 2.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010222792625427246, -0.0009899279102683067, -0.0009575765579938889, -0.000925225205719471, -0.0008928738534450531, -0.0008605225011706352, -0.0008281711488962173, -0.0007958197966217995, -0.0007634684443473816, -0.0007311170920729637, -0.0006987657397985458, -0.000666414387524128, -0.0006340630352497101, -0.0006017116829752922, -0.0005693603307008743, -0.0005370089784264565, -0.0005046576261520386, -0.0004723062738776207, -0.0004399549216032028, -0.00040760356932878494, -0.00037525221705436707, -0.0003429008647799492, -0.0003105495125055313, -0.00027819816023111343, -0.00024584680795669556, -0.00021349545568227768, -0.0001811441034078598, -0.00014879275113344193, -0.00011644139885902405, -8.409004658460617e-05, -5.1738694310188293e-05, -1.9387342035770416e-05, 1.2964010238647461e-05, 4.531536251306534e-05, 7.766671478748322e-05, 0.00011001806706190109, 0.00014236941933631897, 0.00017472077161073685, 0.00020707212388515472, 0.0002394234761595726, 0.0002717748284339905, 0.00030412618070840836, 0.00033647753298282623, 0.0003688288852572441, 0.000401180237531662, 0.00043353158980607986, 0.00046588294208049774, 0.0004982342943549156, 0.0005305856466293335, 0.0005629369989037514, 0.0005952883511781693, 0.0006276397034525871, 0.000659991055727005, 0.0006923424080014229, 0.0007246937602758408, 0.0007570451125502586, 0.0007893964648246765, 0.0008217478170990944, 0.0008540991693735123, 0.0008864505216479301, 0.000918801873922348, 0.0009511532261967659, 0.0009835045784711838, 0.0010158559307456017, 0.0010482072830200195]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 14.0, 9.0, 10.0, 16.0, 10.0, 20.0, 21.0, 29.0, 29.0, 41.0, 35.0, 49.0, 35.0, 37.0, 59.0, 45.0, 46.0, 60.0, 41.0, 34.0, 43.0, 32.0, 27.0, 26.0, 31.0, 25.0, 22.0, 25.0, 22.0, 10.0, 14.0, 15.0, 15.0, 8.0, 9.0, 7.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.265625, -11.8897705078125, -11.513916015625, -11.1380615234375, -10.76220703125, -10.3863525390625, -10.010498046875, -9.6346435546875, -9.2587890625, -8.8829345703125, -8.507080078125, -8.1312255859375, -7.75537109375, -7.3795166015625, -7.003662109375, -6.6278076171875, -6.251953125, -5.8760986328125, -5.500244140625, -5.1243896484375, -4.74853515625, -4.3726806640625, -3.996826171875, -3.6209716796875, -3.2451171875, -2.8692626953125, -2.493408203125, -2.1175537109375, -1.74169921875, -1.3658447265625, -0.989990234375, -0.6141357421875, -0.23828125, 0.1375732421875, 0.513427734375, 0.8892822265625, 1.26513671875, 1.6409912109375, 2.016845703125, 2.3927001953125, 2.7685546875, 3.1444091796875, 3.520263671875, 3.8961181640625, 4.27197265625, 4.6478271484375, 5.023681640625, 5.3995361328125, 5.775390625, 6.1512451171875, 6.527099609375, 6.9029541015625, 7.27880859375, 7.6546630859375, 8.030517578125, 8.4063720703125, 8.7822265625, 9.1580810546875, 9.533935546875, 9.9097900390625, 10.28564453125, 10.6614990234375, 11.037353515625, 11.4132080078125, 11.7890625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 9.0, 6.0, 11.0, 15.0, 21.0, 26.0, 38.0, 58.0, 71.0, 110.0, 132.0, 199.0, 269.0, 404.0, 534.0, 814.0, 1103.0, 1642.0, 2506.0, 4085.0, 7337.0, 17586.0, 226620.0, 741260.0, 22083.0, 8599.0, 4509.0, 2637.0, 1771.0, 1228.0, 852.0, 579.0, 381.0, 301.0, 220.0, 145.0, 117.0, 76.0, 51.0, 47.0, 28.0, 22.0, 15.0, 10.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-104.875, -101.7060546875, -98.537109375, -95.3681640625, -92.19921875, -89.0302734375, -85.861328125, -82.6923828125, -79.5234375, -76.3544921875, -73.185546875, -70.0166015625, -66.84765625, -63.6787109375, -60.509765625, -57.3408203125, -54.171875, -51.0029296875, -47.833984375, -44.6650390625, -41.49609375, -38.3271484375, -35.158203125, -31.9892578125, -28.8203125, -25.6513671875, -22.482421875, -19.3134765625, -16.14453125, -12.9755859375, -9.806640625, -6.6376953125, -3.46875, -0.2998046875, 2.869140625, 6.0380859375, 9.20703125, 12.3759765625, 15.544921875, 18.7138671875, 21.8828125, 25.0517578125, 28.220703125, 31.3896484375, 34.55859375, 37.7275390625, 40.896484375, 44.0654296875, 47.234375, 50.4033203125, 53.572265625, 56.7412109375, 59.91015625, 63.0791015625, 66.248046875, 69.4169921875, 72.5859375, 75.7548828125, 78.923828125, 82.0927734375, 85.26171875, 88.4306640625, 91.599609375, 94.7685546875, 97.9375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 5.0, 6.0, 6.0, 5.0, 13.0, 16.0, 14.0, 22.0, 23.0, 35.0, 25.0, 25.0, 45.0, 60.0, 50.0, 63.0, 92.0, 324.0, 1637.0, 134.0, 75.0, 56.0, 38.0, 43.0, 42.0, 27.0, 26.0, 20.0, 25.0, 27.0, 16.0, 10.0, 16.0, 8.0, 4.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5625, -31.2705078125, -29.978515625, -28.6865234375, -27.39453125, -26.1025390625, -24.810546875, -23.5185546875, -22.2265625, -20.9345703125, -19.642578125, -18.3505859375, -17.05859375, -15.7666015625, -14.474609375, -13.1826171875, -11.890625, -10.5986328125, -9.306640625, -8.0146484375, -6.72265625, -5.4306640625, -4.138671875, -2.8466796875, -1.5546875, -0.2626953125, 1.029296875, 2.3212890625, 3.61328125, 4.9052734375, 6.197265625, 7.4892578125, 8.78125, 10.0732421875, 11.365234375, 12.6572265625, 13.94921875, 15.2412109375, 16.533203125, 17.8251953125, 19.1171875, 20.4091796875, 21.701171875, 22.9931640625, 24.28515625, 25.5771484375, 26.869140625, 28.1611328125, 29.453125, 30.7451171875, 32.037109375, 33.3291015625, 34.62109375, 35.9130859375, 37.205078125, 38.4970703125, 39.7890625, 41.0810546875, 42.373046875, 43.6650390625, 44.95703125, 46.2490234375, 47.541015625, 48.8330078125, 50.125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 6.0, 13.0, 11.0, 14.0, 20.0, 28.0, 27.0, 22.0, 32.0, 35.0, 54.0, 70.0, 113.0, 311.0, 1432.0, 3003330.0, 138553.0, 938.0, 270.0, 98.0, 74.0, 56.0, 24.0, 34.0, 29.0, 22.0, 18.0, 12.0, 17.0, 10.0, 6.0, 4.0, 5.0, 7.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-246.5, -240.3203125, -234.140625, -227.9609375, -221.78125, -215.6015625, -209.421875, -203.2421875, -197.0625, -190.8828125, -184.703125, -178.5234375, -172.34375, -166.1640625, -159.984375, -153.8046875, -147.625, -141.4453125, -135.265625, -129.0859375, -122.90625, -116.7265625, -110.546875, -104.3671875, -98.1875, -92.0078125, -85.828125, -79.6484375, -73.46875, -67.2890625, -61.109375, -54.9296875, -48.75, -42.5703125, -36.390625, -30.2109375, -24.03125, -17.8515625, -11.671875, -5.4921875, 0.6875, 6.8671875, 13.046875, 19.2265625, 25.40625, 31.5859375, 37.765625, 43.9453125, 50.125, 56.3046875, 62.484375, 68.6640625, 74.84375, 81.0234375, 87.203125, 93.3828125, 99.5625, 105.7421875, 111.921875, 118.1015625, 124.28125, 130.4609375, 136.640625, 142.8203125, 149.0]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 965.0, 51.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.88095092773438, -160.1182403564453, -132.35552978515625, -104.59283447265625, -76.83012390136719, -49.067413330078125, -21.304718017578125, 6.4579925537109375, 34.220703125, 61.9834098815918, 89.7461166381836, 117.50881958007812, 145.2715301513672, 173.03424072265625, 200.79693603515625, 228.5596466064453, 256.3223571777344, 284.0850524902344, 311.8477783203125, 339.6104736328125, 367.3731689453125, 395.1358947753906, 422.8985900878906, 450.66131591796875, 478.42401123046875, 506.18670654296875, 533.9494018554688, 561.712158203125, 589.474853515625, 617.237548828125, 645.000244140625, 672.762939453125, 700.525634765625, 728.288330078125, 756.051025390625, 783.813720703125, 811.5764770507812, 839.3391723632812, 867.1018676757812, 894.8645629882812, 922.6273193359375, 950.3900146484375, 978.1527099609375, 1005.9154052734375, 1033.6781005859375, 1061.44091796875, 1089.20361328125, 1116.96630859375, 1144.72900390625, 1172.49169921875, 1200.25439453125, 1228.01708984375, 1255.77978515625, 1283.54248046875, 1311.30517578125, 1339.0679931640625, 1366.83056640625, 1394.59326171875, 1422.35595703125, 1450.11865234375, 1477.88134765625, 1505.64404296875, 1533.40673828125, 1561.1695556640625, 1588.9322509765625]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 7.0, 6.0, 18.0, 17.0, 17.0, 17.0, 16.0, 15.0, 23.0, 32.0, 35.0, 30.0, 33.0, 33.0, 32.0, 32.0, 37.0, 31.0, 39.0, 38.0, 38.0, 42.0, 30.0, 32.0, 42.0, 37.0, 37.0, 38.0, 24.0, 29.0, 27.0, 16.0, 11.0, 15.0, 9.0, 13.0, 14.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 4.0], "bins": [-106.12589263916016, -102.885009765625, -99.64412689208984, -96.40324401855469, -93.16236114501953, -89.92147827148438, -86.68058776855469, -83.43971252441406, -80.19882202148438, -76.95793914794922, -73.71705627441406, -70.4761734008789, -67.23529052734375, -63.994407653808594, -60.75352096557617, -57.512638092041016, -54.271759033203125, -51.03087615966797, -47.78999328613281, -44.549110412597656, -41.3082275390625, -38.067344665527344, -34.82645797729492, -31.585575103759766, -28.34469223022461, -25.103809356689453, -21.862926483154297, -18.622041702270508, -15.381158828735352, -12.140275955200195, -8.899391174316406, -5.65850830078125, -2.4176254272460938, 0.8232579231262207, 4.064141273498535, 7.305025100708008, 10.545907974243164, 13.78679084777832, 17.02767562866211, 20.268558502197266, 23.509441375732422, 26.750324249267578, 29.991207122802734, 33.232093811035156, 36.47297668457031, 39.71385955810547, 42.954742431640625, 46.19562530517578, 49.43650817871094, 52.677391052246094, 55.91827392578125, 59.159156799316406, 62.40003967285156, 65.64092254638672, 68.88180541992188, 72.12269592285156, 75.36357116699219, 78.60445404052734, 81.8453369140625, 85.08621978759766, 88.32710266113281, 91.56798553466797, 94.80886840820312, 98.04975891113281, 101.29064178466797]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 9.0, 9.0, 6.0, 13.0, 10.0, 20.0, 16.0, 15.0, 22.0, 28.0, 39.0, 32.0, 34.0, 39.0, 42.0, 37.0, 47.0, 49.0, 51.0, 51.0, 47.0, 40.0, 30.0, 32.0, 33.0, 30.0, 25.0, 21.0, 24.0, 19.0, 21.0, 19.0, 19.0, 11.0, 13.0, 7.0, 7.0, 13.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.53125, -12.14599609375, -11.7607421875, -11.37548828125, -10.990234375, -10.60498046875, -10.2197265625, -9.83447265625, -9.44921875, -9.06396484375, -8.6787109375, -8.29345703125, -7.908203125, -7.52294921875, -7.1376953125, -6.75244140625, -6.3671875, -5.98193359375, -5.5966796875, -5.21142578125, -4.826171875, -4.44091796875, -4.0556640625, -3.67041015625, -3.28515625, -2.89990234375, -2.5146484375, -2.12939453125, -1.744140625, -1.35888671875, -0.9736328125, -0.58837890625, -0.203125, 0.18212890625, 0.5673828125, 0.95263671875, 1.337890625, 1.72314453125, 2.1083984375, 2.49365234375, 2.87890625, 3.26416015625, 3.6494140625, 4.03466796875, 4.419921875, 4.80517578125, 5.1904296875, 5.57568359375, 5.9609375, 6.34619140625, 6.7314453125, 7.11669921875, 7.501953125, 7.88720703125, 8.2724609375, 8.65771484375, 9.04296875, 9.42822265625, 9.8134765625, 10.19873046875, 10.583984375, 10.96923828125, 11.3544921875, 11.73974609375, 12.125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 11.0, 19.0, 18.0, 30.0, 32.0, 65.0, 81.0, 117.0, 213.0, 351.0, 700.0, 1368.0, 3024.0, 7151.0, 19199.0, 75717.0, 3449431.0, 577683.0, 37507.0, 12064.0, 4933.0, 2147.0, 1038.0, 530.0, 309.0, 179.0, 111.0, 60.0, 44.0, 33.0, 33.0, 11.0, 21.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.875, -91.79296875, -88.7109375, -85.62890625, -82.546875, -79.46484375, -76.3828125, -73.30078125, -70.21875, -67.13671875, -64.0546875, -60.97265625, -57.890625, -54.80859375, -51.7265625, -48.64453125, -45.5625, -42.48046875, -39.3984375, -36.31640625, -33.234375, -30.15234375, -27.0703125, -23.98828125, -20.90625, -17.82421875, -14.7421875, -11.66015625, -8.578125, -5.49609375, -2.4140625, 0.66796875, 3.75, 6.83203125, 9.9140625, 12.99609375, 16.078125, 19.16015625, 22.2421875, 25.32421875, 28.40625, 31.48828125, 34.5703125, 37.65234375, 40.734375, 43.81640625, 46.8984375, 49.98046875, 53.0625, 56.14453125, 59.2265625, 62.30859375, 65.390625, 68.47265625, 71.5546875, 74.63671875, 77.71875, 80.80078125, 83.8828125, 86.96484375, 90.046875, 93.12890625, 96.2109375, 99.29296875, 102.375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 8.0, 16.0, 28.0, 29.0, 33.0, 72.0, 111.0, 160.0, 338.0, 721.0, 1043.0, 634.0, 333.0, 173.0, 116.0, 80.0, 47.0, 37.0, 22.0, 17.0, 13.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-133.0, -130.0068359375, -127.013671875, -124.0205078125, -121.02734375, -118.0341796875, -115.041015625, -112.0478515625, -109.0546875, -106.0615234375, -103.068359375, -100.0751953125, -97.08203125, -94.0888671875, -91.095703125, -88.1025390625, -85.109375, -82.1162109375, -79.123046875, -76.1298828125, -73.13671875, -70.1435546875, -67.150390625, -64.1572265625, -61.1640625, -58.1708984375, -55.177734375, -52.1845703125, -49.19140625, -46.1982421875, -43.205078125, -40.2119140625, -37.21875, -34.2255859375, -31.232421875, -28.2392578125, -25.24609375, -22.2529296875, -19.259765625, -16.2666015625, -13.2734375, -10.2802734375, -7.287109375, -4.2939453125, -1.30078125, 1.6923828125, 4.685546875, 7.6787109375, 10.671875, 13.6650390625, 16.658203125, 19.6513671875, 22.64453125, 25.6376953125, 28.630859375, 31.6240234375, 34.6171875, 37.6103515625, 40.603515625, 43.5966796875, 46.58984375, 49.5830078125, 52.576171875, 55.5693359375, 58.5625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 4.0, 17.0, 11.0, 25.0, 36.0, 57.0, 87.0, 146.0, 235.0, 438.0, 1595.0, 4185999.0, 4519.0, 461.0, 243.0, 145.0, 91.0, 52.0, 42.0, 23.0, 22.0, 4.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.5, -278.6953125, -262.890625, -247.0859375, -231.28125, -215.4765625, -199.671875, -183.8671875, -168.0625, -152.2578125, -136.453125, -120.6484375, -104.84375, -89.0390625, -73.234375, -57.4296875, -41.625, -25.8203125, -10.015625, 5.7890625, 21.59375, 37.3984375, 53.203125, 69.0078125, 84.8125, 100.6171875, 116.421875, 132.2265625, 148.03125, 163.8359375, 179.640625, 195.4453125, 211.25, 227.0546875, 242.859375, 258.6640625, 274.46875, 290.2734375, 306.078125, 321.8828125, 337.6875, 353.4921875, 369.296875, 385.1015625, 400.90625, 416.7109375, 432.515625, 448.3203125, 464.125, 479.9296875, 495.734375, 511.5390625, 527.34375, 543.1484375, 558.953125, 574.7578125, 590.5625, 606.3671875, 622.171875, 637.9765625, 653.78125, 669.5859375, 685.390625, 701.1953125, 717.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 965.0, 46.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.7090606689453, -161.59178161621094, -117.4745101928711, -73.35723876953125, -29.239959716796875, 14.8773193359375, 58.99458312988281, 103.11186218261719, 147.22914123535156, 191.34642028808594, 235.46368408203125, 279.5809631347656, 323.6982421875, 367.8155212402344, 411.93280029296875, 456.050048828125, 500.1673583984375, 544.2846069335938, 588.4019165039062, 632.5191650390625, 676.636474609375, 720.7537231445312, 764.8709716796875, 808.98828125, 853.1055297851562, 897.2227783203125, 941.340087890625, 985.4573364257812, 1029.5745849609375, 1073.69189453125, 1117.8092041015625, 1161.926513671875, 1206.0438232421875, 1250.1611328125, 1294.2783203125, 1338.3956298828125, 1382.512939453125, 1426.6302490234375, 1470.7474365234375, 1514.86474609375, 1558.9820556640625, 1603.099365234375, 1647.216552734375, 1691.3338623046875, 1735.451171875, 1779.5684814453125, 1823.6856689453125, 1867.802978515625, 1911.920166015625, 1956.0374755859375, 2000.1546630859375, 2044.27197265625, 2088.38916015625, 2132.506591796875, 2176.623779296875, 2220.7412109375, 2264.8583984375, 2308.9755859375, 2353.093017578125, 2397.210205078125, 2441.327392578125, 2485.44482421875, 2529.56201171875, 2573.67919921875, 2617.796630859375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 8.0, 16.0, 4.0, 8.0, 13.0, 21.0, 17.0, 17.0, 23.0, 18.0, 31.0, 25.0, 30.0, 29.0, 34.0, 31.0, 31.0, 39.0, 45.0, 33.0, 40.0, 41.0, 30.0, 36.0, 34.0, 30.0, 35.0, 38.0, 32.0, 26.0, 24.0, 25.0, 15.0, 12.0, 12.0, 17.0, 14.0, 9.0, 10.0, 7.0, 10.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-190.62664794921875, -184.52056884765625, -178.4144744873047, -172.3083953857422, -166.2023162841797, -160.09622192382812, -153.99014282226562, -147.88406372070312, -141.77798461914062, -135.67190551757812, -129.56581115722656, -123.45973205566406, -117.35365295410156, -111.24756622314453, -105.1414794921875, -99.035400390625, -92.92930603027344, -86.8232192993164, -80.7171401977539, -74.61105346679688, -68.50497436523438, -62.398887634277344, -56.29280090332031, -50.18671798706055, -44.08063507080078, -37.974552154541016, -31.868467330932617, -25.76238250732422, -19.656299591064453, -13.550216674804688, -7.444129943847656, -1.3380470275878906, 4.768035888671875, 10.874119758605957, 16.98020362854004, 23.086288452148438, 29.192371368408203, 35.29845428466797, 41.404541015625, 47.510623931884766, 53.61670684814453, 59.7227897644043, 65.82887268066406, 71.9349594116211, 78.04104614257812, 84.14712524414062, 90.25321197509766, 96.35929870605469, 102.46537780761719, 108.57146453857422, 114.67754364013672, 120.78363037109375, 126.88970947265625, 132.99578857421875, 139.1018829345703, 145.2079620361328, 151.31405639648438, 157.42013549804688, 163.52622985839844, 169.63230895996094, 175.73838806152344, 181.844482421875, 187.9505615234375, 194.056640625, 200.1627197265625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 6.0, 10.0, 11.0, 8.0, 18.0, 11.0, 16.0, 13.0, 29.0, 27.0, 35.0, 23.0, 36.0, 46.0, 42.0, 39.0, 39.0, 34.0, 53.0, 43.0, 38.0, 38.0, 29.0, 47.0, 36.0, 32.0, 32.0, 16.0, 27.0, 25.0, 24.0, 20.0, 15.0, 14.0, 14.0, 14.0, 6.0, 5.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8125, -11.4326171875, -11.052734375, -10.6728515625, -10.29296875, -9.9130859375, -9.533203125, -9.1533203125, -8.7734375, -8.3935546875, -8.013671875, -7.6337890625, -7.25390625, -6.8740234375, -6.494140625, -6.1142578125, -5.734375, -5.3544921875, -4.974609375, -4.5947265625, -4.21484375, -3.8349609375, -3.455078125, -3.0751953125, -2.6953125, -2.3154296875, -1.935546875, -1.5556640625, -1.17578125, -0.7958984375, -0.416015625, -0.0361328125, 0.34375, 0.7236328125, 1.103515625, 1.4833984375, 1.86328125, 2.2431640625, 2.623046875, 3.0029296875, 3.3828125, 3.7626953125, 4.142578125, 4.5224609375, 4.90234375, 5.2822265625, 5.662109375, 6.0419921875, 6.421875, 6.8017578125, 7.181640625, 7.5615234375, 7.94140625, 8.3212890625, 8.701171875, 9.0810546875, 9.4609375, 9.8408203125, 10.220703125, 10.6005859375, 10.98046875, 11.3603515625, 11.740234375, 12.1201171875, 12.5]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 12.0, 23.0, 33.0, 48.0, 74.0, 94.0, 112.0, 170.0, 231.0, 348.0, 515.0, 723.0, 1066.0, 1478.0, 2155.0, 3224.0, 4649.0, 7028.0, 10497.0, 16119.0, 25510.0, 41766.0, 70963.0, 130026.0, 324674.0, 176295.0, 90161.0, 51611.0, 31025.0, 19407.0, 12534.0, 8385.0, 5537.0, 3747.0, 2563.0, 1833.0, 1204.0, 806.0, 555.0, 408.0, 271.0, 202.0, 159.0, 95.0, 75.0, 41.0, 32.0, 19.0, 17.0, 9.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0], "bins": [-3.0703125, -2.9764404296875, -2.882568359375, -2.7886962890625, -2.69482421875, -2.6009521484375, -2.507080078125, -2.4132080078125, -2.3193359375, -2.2254638671875, -2.131591796875, -2.0377197265625, -1.94384765625, -1.8499755859375, -1.756103515625, -1.6622314453125, -1.568359375, -1.4744873046875, -1.380615234375, -1.2867431640625, -1.19287109375, -1.0989990234375, -1.005126953125, -0.9112548828125, -0.8173828125, -0.7235107421875, -0.629638671875, -0.5357666015625, -0.44189453125, -0.3480224609375, -0.254150390625, -0.1602783203125, -0.06640625, 0.0274658203125, 0.121337890625, 0.2152099609375, 0.30908203125, 0.4029541015625, 0.496826171875, 0.5906982421875, 0.6845703125, 0.7784423828125, 0.872314453125, 0.9661865234375, 1.06005859375, 1.1539306640625, 1.247802734375, 1.3416748046875, 1.435546875, 1.5294189453125, 1.623291015625, 1.7171630859375, 1.81103515625, 1.9049072265625, 1.998779296875, 2.0926513671875, 2.1865234375, 2.2803955078125, 2.374267578125, 2.4681396484375, 2.56201171875, 2.6558837890625, 2.749755859375, 2.8436279296875, 2.9375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0, 8.0, 10.0, 11.0, 13.0, 15.0, 20.0, 15.0, 17.0, 29.0, 27.0, 28.0, 25.0, 21.0, 40.0, 34.0, 40.0, 40.0, 31.0, 44.0, 1062.0, 33.0, 30.0, 38.0, 41.0, 32.0, 26.0, 36.0, 32.0, 29.0, 27.0, 28.0, 25.0, 20.0, 10.0, 20.0, 10.0, 10.0, 7.0, 5.0, 6.0, 3.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-7.0703125, -6.84478759765625, -6.6192626953125, -6.39373779296875, -6.168212890625, -5.94268798828125, -5.7171630859375, -5.49163818359375, -5.26611328125, -5.04058837890625, -4.8150634765625, -4.58953857421875, -4.364013671875, -4.13848876953125, -3.9129638671875, -3.68743896484375, -3.4619140625, -3.23638916015625, -3.0108642578125, -2.78533935546875, -2.559814453125, -2.33428955078125, -2.1087646484375, -1.88323974609375, -1.65771484375, -1.43218994140625, -1.2066650390625, -0.98114013671875, -0.755615234375, -0.53009033203125, -0.3045654296875, -0.07904052734375, 0.146484375, 0.37200927734375, 0.5975341796875, 0.82305908203125, 1.048583984375, 1.27410888671875, 1.4996337890625, 1.72515869140625, 1.95068359375, 2.17620849609375, 2.4017333984375, 2.62725830078125, 2.852783203125, 3.07830810546875, 3.3038330078125, 3.52935791015625, 3.7548828125, 3.98040771484375, 4.2059326171875, 4.43145751953125, 4.656982421875, 4.88250732421875, 5.1080322265625, 5.33355712890625, 5.55908203125, 5.78460693359375, 6.0101318359375, 6.23565673828125, 6.461181640625, 6.68670654296875, 6.9122314453125, 7.13775634765625, 7.36328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 10.0, 15.0, 21.0, 22.0, 44.0, 61.0, 69.0, 94.0, 152.0, 174.0, 256.0, 375.0, 502.0, 696.0, 1066.0, 1584.0, 2265.0, 3276.0, 4994.0, 7697.0, 11808.0, 18278.0, 28867.0, 45562.0, 73710.0, 129329.0, 1359204.0, 166797.0, 89500.0, 54136.0, 34237.0, 21429.0, 13881.0, 8889.0, 5830.0, 3848.0, 2641.0, 1793.0, 1220.0, 788.0, 570.0, 420.0, 306.0, 202.0, 132.0, 96.0, 70.0, 60.0, 38.0, 40.0, 21.0, 20.0, 7.0, 5.0, 4.0, 4.0, 5.0, 5.0], "bins": [-2.892578125, -2.8040771484375, -2.715576171875, -2.6270751953125, -2.53857421875, -2.4500732421875, -2.361572265625, -2.2730712890625, -2.1845703125, -2.0960693359375, -2.007568359375, -1.9190673828125, -1.83056640625, -1.7420654296875, -1.653564453125, -1.5650634765625, -1.4765625, -1.3880615234375, -1.299560546875, -1.2110595703125, -1.12255859375, -1.0340576171875, -0.945556640625, -0.8570556640625, -0.7685546875, -0.6800537109375, -0.591552734375, -0.5030517578125, -0.41455078125, -0.3260498046875, -0.237548828125, -0.1490478515625, -0.060546875, 0.0279541015625, 0.116455078125, 0.2049560546875, 0.29345703125, 0.3819580078125, 0.470458984375, 0.5589599609375, 0.6474609375, 0.7359619140625, 0.824462890625, 0.9129638671875, 1.00146484375, 1.0899658203125, 1.178466796875, 1.2669677734375, 1.35546875, 1.4439697265625, 1.532470703125, 1.6209716796875, 1.70947265625, 1.7979736328125, 1.886474609375, 1.9749755859375, 2.0634765625, 2.1519775390625, 2.240478515625, 2.3289794921875, 2.41748046875, 2.5059814453125, 2.594482421875, 2.6829833984375, 2.771484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 10.0, 7.0, 6.0, 7.0, 14.0, 17.0, 32.0, 34.0, 33.0, 37.0, 54.0, 65.0, 78.0, 70.0, 93.0, 67.0, 84.0, 58.0, 51.0, 36.0, 29.0, 25.0, 17.0, 20.0, 16.0, 9.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0025463104248046875, -0.00247858464717865, -0.0024108588695526123, -0.0023431330919265747, -0.002275407314300537, -0.0022076815366744995, -0.002139955759048462, -0.0020722299814224243, -0.0020045042037963867, -0.0019367784261703491, -0.0018690526485443115, -0.001801326870918274, -0.0017336010932922363, -0.0016658753156661987, -0.0015981495380401611, -0.0015304237604141235, -0.001462697982788086, -0.0013949722051620483, -0.0013272464275360107, -0.0012595206499099731, -0.0011917948722839355, -0.001124069094657898, -0.0010563433170318604, -0.0009886175394058228, -0.0009208917617797852, -0.0008531659841537476, -0.00078544020652771, -0.0007177144289016724, -0.0006499886512756348, -0.0005822628736495972, -0.0005145370960235596, -0.00044681131839752197, -0.0003790855407714844, -0.0003113597631454468, -0.00024363398551940918, -0.00017590820789337158, -0.00010818243026733398, -4.045665264129639e-05, 2.726912498474121e-05, 9.499490261077881e-05, 0.0001627206802368164, 0.000230446457862854, 0.0002981722354888916, 0.0003658980131149292, 0.0004336237907409668, 0.0005013495683670044, 0.000569075345993042, 0.0006368011236190796, 0.0007045269012451172, 0.0007722526788711548, 0.0008399784564971924, 0.00090770423412323, 0.0009754300117492676, 0.0010431557893753052, 0.0011108815670013428, 0.0011786073446273804, 0.001246333122253418, 0.0013140588998794556, 0.0013817846775054932, 0.0014495104551315308, 0.0015172362327575684, 0.001584962010383606, 0.0016526877880096436, 0.0017204135656356812, 0.0017881393432617188]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 11.0, 10.0, 12.0, 17.0, 17.0, 22.0, 45.0, 44.0, 78.0, 155.0, 269.0, 528.0, 2847.0, 1042416.0, 1085.0, 339.0, 210.0, 118.0, 79.0, 73.0, 32.0, 33.0, 29.0, 12.0, 15.0, 7.0, 12.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044891357421875, -0.04318571090698242, -0.041480064392089844, -0.039774417877197266, -0.03806877136230469, -0.03636312484741211, -0.03465747833251953, -0.03295183181762695, -0.031246185302734375, -0.029540538787841797, -0.02783489227294922, -0.02612924575805664, -0.024423599243164062, -0.022717952728271484, -0.021012306213378906, -0.019306659698486328, -0.01760101318359375, -0.015895366668701172, -0.014189720153808594, -0.012484073638916016, -0.010778427124023438, -0.00907278060913086, -0.007367134094238281, -0.005661487579345703, -0.003955841064453125, -0.002250194549560547, -0.0005445480346679688, 0.0011610984802246094, 0.0028667449951171875, 0.004572391510009766, 0.006278038024902344, 0.007983684539794922, 0.0096893310546875, 0.011394977569580078, 0.013100624084472656, 0.014806270599365234, 0.016511917114257812, 0.01821756362915039, 0.01992321014404297, 0.021628856658935547, 0.023334503173828125, 0.025040149688720703, 0.02674579620361328, 0.02845144271850586, 0.030157089233398438, 0.031862735748291016, 0.033568382263183594, 0.03527402877807617, 0.03697967529296875, 0.03868532180786133, 0.040390968322753906, 0.042096614837646484, 0.04380226135253906, 0.04550790786743164, 0.04721355438232422, 0.0489192008972168, 0.050624847412109375, 0.05233049392700195, 0.05403614044189453, 0.05574178695678711, 0.05744743347167969, 0.059153079986572266, 0.060858726501464844, 0.06256437301635742, 0.06427001953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 566.0, 444.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009770093485713005, -0.009537297300994396, -0.009304500184953213, -0.009071704000234604, -0.00883890688419342, -0.008606110699474812, -0.008373313583433628, -0.00814051739871502, -0.007907720282673836, -0.00767492363229394, -0.007442126981914043, -0.007209330331534147, -0.006976533681154251, -0.006743737496435642, -0.006510940846055746, -0.00627814419567585, -0.006045348010957241, -0.005812551360577345, -0.005579754710197449, -0.005346958059817553, -0.005114161409437656, -0.0048813652247190475, -0.004648568574339151, -0.004415771923959255, -0.004182975273579359, -0.003950178623199463, -0.0037173819728195667, -0.003484585555270314, -0.003251788904890418, -0.003018992254510522, -0.0027861958369612694, -0.002553399186581373, -0.0023206030018627644, -0.002087806351482868, -0.0018550098175182939, -0.0016222132835537195, -0.0013894166331738234, -0.0011566199827939272, -0.0009238234488293529, -0.0006910269148647785, -0.00045823026448488235, -0.0002254336723126471, 7.362919859588146e-06, 0.0002401595120318234, 0.00047295610420405865, 0.0007057527545839548, 0.0009385492885485291, 0.0011713458225131035, 0.0014041424728929996, 0.0016369391232728958, 0.0018697356572374701, 0.0021025321912020445, 0.0023353288415819407, 0.002568125491961837, 0.0028009219095110893, 0.0030337185598909855, 0.0032665152102708817, 0.003499311860650778, 0.003732108511030674, 0.00396490516141057, 0.004197701811790466, 0.004430497996509075, 0.004663294646888971, 0.0048960912972688675, 0.005128887947648764]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 6.0, 11.0, 10.0, 10.0, 18.0, 7.0, 19.0, 12.0, 13.0, 33.0, 29.0, 23.0, 33.0, 32.0, 44.0, 39.0, 42.0, 46.0, 50.0, 41.0, 47.0, 36.0, 44.0, 37.0, 29.0, 39.0, 37.0, 29.0, 21.0, 27.0, 35.0, 17.0, 17.0, 14.0, 15.0, 10.0, 7.0, 11.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007814168930053711, -0.0007513733580708504, -0.0007213298231363297, -0.0006912862882018089, -0.0006612427532672882, -0.0006311992183327675, -0.0006011556833982468, -0.000571112148463726, -0.0005410686135292053, -0.0005110250785946846, -0.0004809815436601639, -0.00045093800872564316, -0.00042089447379112244, -0.0003908509388566017, -0.000360807403922081, -0.00033076386898756027, -0.00030072033405303955, -0.00027067679911851883, -0.0002406332641839981, -0.0002105897292494774, -0.00018054619431495667, -0.00015050265938043594, -0.00012045912444591522, -9.04155895113945e-05, -6.037205457687378e-05, -3.0328519642353058e-05, -2.849847078323364e-07, 2.9758550226688385e-05, 5.9802085161209106e-05, 8.984562009572983e-05, 0.00011988915503025055, 0.00014993268996477127, 0.000179976224899292, 0.00021001975983381271, 0.00024006329476833344, 0.00027010682970285416, 0.0003001503646373749, 0.0003301938995718956, 0.0003602374345064163, 0.00039028096944093704, 0.00042032450437545776, 0.0004503680393099785, 0.0004804115742444992, 0.0005104551091790199, 0.0005404986441135406, 0.0005705421790480614, 0.0006005857139825821, 0.0006306292489171028, 0.0006606727838516235, 0.0006907163187861443, 0.000720759853720665, 0.0007508033886551857, 0.0007808469235897064, 0.0008108904585242271, 0.0008409339934587479, 0.0008709775283932686, 0.0009010210633277893, 0.00093106459826231, 0.0009611081331968307, 0.0009911516681313515, 0.0010211952030658722, 0.001051238738000393, 0.0010812822729349136, 0.0011113258078694344, 0.001141369342803955]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 6.0, 10.0, 11.0, 8.0, 18.0, 11.0, 16.0, 13.0, 29.0, 27.0, 35.0, 23.0, 36.0, 46.0, 42.0, 39.0, 39.0, 34.0, 53.0, 43.0, 38.0, 38.0, 29.0, 47.0, 36.0, 32.0, 32.0, 16.0, 27.0, 25.0, 24.0, 20.0, 15.0, 14.0, 14.0, 14.0, 6.0, 5.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8125, -11.4326171875, -11.052734375, -10.6728515625, -10.29296875, -9.9130859375, -9.533203125, -9.1533203125, -8.7734375, -8.3935546875, -8.013671875, -7.6337890625, -7.25390625, -6.8740234375, -6.494140625, -6.1142578125, -5.734375, -5.3544921875, -4.974609375, -4.5947265625, -4.21484375, -3.8349609375, -3.455078125, -3.0751953125, -2.6953125, -2.3154296875, -1.935546875, -1.5556640625, -1.17578125, -0.7958984375, -0.416015625, -0.0361328125, 0.34375, 0.7236328125, 1.103515625, 1.4833984375, 1.86328125, 2.2431640625, 2.623046875, 3.0029296875, 3.3828125, 3.7626953125, 4.142578125, 4.5224609375, 4.90234375, 5.2822265625, 5.662109375, 6.0419921875, 6.421875, 6.8017578125, 7.181640625, 7.5615234375, 7.94140625, 8.3212890625, 8.701171875, 9.0810546875, 9.4609375, 9.8408203125, 10.220703125, 10.6005859375, 10.98046875, 11.3603515625, 11.740234375, 12.1201171875, 12.5]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 2.0, 13.0, 18.0, 17.0, 26.0, 23.0, 39.0, 45.0, 79.0, 100.0, 120.0, 141.0, 252.0, 340.0, 533.0, 857.0, 1662.0, 3137.0, 7068.0, 17239.0, 50656.0, 191777.0, 520245.0, 176462.0, 47493.0, 16342.0, 6684.0, 3002.0, 1545.0, 829.0, 540.0, 358.0, 235.0, 170.0, 131.0, 74.0, 66.0, 57.0, 45.0, 39.0, 13.0, 23.0, 13.0, 8.0, 5.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.9375, -10.5899658203125, -10.242431640625, -9.8948974609375, -9.54736328125, -9.1998291015625, -8.852294921875, -8.5047607421875, -8.1572265625, -7.8096923828125, -7.462158203125, -7.1146240234375, -6.76708984375, -6.4195556640625, -6.072021484375, -5.7244873046875, -5.376953125, -5.0294189453125, -4.681884765625, -4.3343505859375, -3.98681640625, -3.6392822265625, -3.291748046875, -2.9442138671875, -2.5966796875, -2.2491455078125, -1.901611328125, -1.5540771484375, -1.20654296875, -0.8590087890625, -0.511474609375, -0.1639404296875, 0.18359375, 0.5311279296875, 0.878662109375, 1.2261962890625, 1.57373046875, 1.9212646484375, 2.268798828125, 2.6163330078125, 2.9638671875, 3.3114013671875, 3.658935546875, 4.0064697265625, 4.35400390625, 4.7015380859375, 5.049072265625, 5.3966064453125, 5.744140625, 6.0916748046875, 6.439208984375, 6.7867431640625, 7.13427734375, 7.4818115234375, 7.829345703125, 8.1768798828125, 8.5244140625, 8.8719482421875, 9.219482421875, 9.5670166015625, 9.91455078125, 10.2620849609375, 10.609619140625, 10.9571533203125, 11.3046875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 6.0, 11.0, 13.0, 13.0, 18.0, 21.0, 21.0, 33.0, 38.0, 40.0, 35.0, 38.0, 45.0, 59.0, 62.0, 174.0, 1860.0, 128.0, 56.0, 59.0, 40.0, 37.0, 35.0, 33.0, 24.0, 22.0, 24.0, 16.0, 15.0, 19.0, 12.0, 10.0, 3.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.28125, -39.7734375, -38.265625, -36.7578125, -35.25, -33.7421875, -32.234375, -30.7265625, -29.21875, -27.7109375, -26.203125, -24.6953125, -23.1875, -21.6796875, -20.171875, -18.6640625, -17.15625, -15.6484375, -14.140625, -12.6328125, -11.125, -9.6171875, -8.109375, -6.6015625, -5.09375, -3.5859375, -2.078125, -0.5703125, 0.9375, 2.4453125, 3.953125, 5.4609375, 6.96875, 8.4765625, 9.984375, 11.4921875, 13.0, 14.5078125, 16.015625, 17.5234375, 19.03125, 20.5390625, 22.046875, 23.5546875, 25.0625, 26.5703125, 28.078125, 29.5859375, 31.09375, 32.6015625, 34.109375, 35.6171875, 37.125, 38.6328125, 40.140625, 41.6484375, 43.15625, 44.6640625, 46.171875, 47.6796875, 49.1875, 50.6953125, 52.203125, 53.7109375, 55.21875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 8.0, 4.0, 9.0, 12.0, 19.0, 14.0, 22.0, 18.0, 25.0, 35.0, 42.0, 54.0, 83.0, 118.0, 223.0, 645.0, 3284.0, 3115359.0, 23787.0, 1020.0, 348.0, 148.0, 98.0, 62.0, 59.0, 38.0, 38.0, 29.0, 19.0, 15.0, 16.0, 10.0, 14.0, 6.0, 7.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-127.375, -123.9033203125, -120.431640625, -116.9599609375, -113.48828125, -110.0166015625, -106.544921875, -103.0732421875, -99.6015625, -96.1298828125, -92.658203125, -89.1865234375, -85.71484375, -82.2431640625, -78.771484375, -75.2998046875, -71.828125, -68.3564453125, -64.884765625, -61.4130859375, -57.94140625, -54.4697265625, -50.998046875, -47.5263671875, -44.0546875, -40.5830078125, -37.111328125, -33.6396484375, -30.16796875, -26.6962890625, -23.224609375, -19.7529296875, -16.28125, -12.8095703125, -9.337890625, -5.8662109375, -2.39453125, 1.0771484375, 4.548828125, 8.0205078125, 11.4921875, 14.9638671875, 18.435546875, 21.9072265625, 25.37890625, 28.8505859375, 32.322265625, 35.7939453125, 39.265625, 42.7373046875, 46.208984375, 49.6806640625, 53.15234375, 56.6240234375, 60.095703125, 63.5673828125, 67.0390625, 70.5107421875, 73.982421875, 77.4541015625, 80.92578125, 84.3974609375, 87.869140625, 91.3408203125, 94.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 167.0, 739.0, 102.0, 4.0, 0.0, 1.0, 1.0], "bins": [-299.4395751953125, -294.3131408691406, -289.18670654296875, -284.0602722167969, -278.933837890625, -273.8074035644531, -268.68096923828125, -263.5545349121094, -258.4281005859375, -253.30166625976562, -248.17523193359375, -243.04879760742188, -237.92236328125, -232.79592895507812, -227.66949462890625, -222.54306030273438, -217.41664123535156, -212.2902069091797, -207.1637725830078, -202.03733825683594, -196.91090393066406, -191.7844696044922, -186.6580352783203, -181.5316162109375, -176.40518188476562, -171.27874755859375, -166.15231323242188, -161.02587890625, -155.89944458007812, -150.77301025390625, -145.64657592773438, -140.5201416015625, -135.39369201660156, -130.2672576904297, -125.14082336425781, -120.01438903808594, -114.88795471191406, -109.76152038574219, -104.63509368896484, -99.50865936279297, -94.3822250366211, -89.25579071044922, -84.12935638427734, -79.00292205810547, -73.87649536132812, -68.75006103515625, -63.623626708984375, -58.4971923828125, -53.370758056640625, -48.24432373046875, -43.117889404296875, -37.991458892822266, -32.86502456665039, -27.738590240478516, -22.612157821655273, -17.48572540283203, -12.359292984008789, -7.2328596115112305, -2.106426239013672, 3.0200071334838867, 8.146440505981445, 13.27287483215332, 18.399307250976562, 23.525739669799805, 28.65217399597168]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 7.0, 5.0, 6.0, 7.0, 7.0, 9.0, 9.0, 14.0, 22.0, 22.0, 26.0, 28.0, 31.0, 26.0, 28.0, 32.0, 33.0, 35.0, 34.0, 46.0, 47.0, 49.0, 51.0, 53.0, 48.0, 40.0, 27.0, 46.0, 26.0, 35.0, 31.0, 21.0, 12.0, 21.0, 18.0, 11.0, 6.0, 8.0, 3.0, 5.0, 9.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.95472717285156, -114.65241241455078, -110.35009765625, -106.04778289794922, -101.74546813964844, -97.44316101074219, -93.1408462524414, -88.83853149414062, -84.53621673583984, -80.23390197753906, -75.93158721923828, -71.6292724609375, -67.32696533203125, -63.0246467590332, -58.72233581542969, -54.420021057128906, -50.117706298828125, -45.815391540527344, -41.51307678222656, -37.21076583862305, -32.908451080322266, -28.606136322021484, -24.303823471069336, -20.001510620117188, -15.699195861816406, -11.396882057189941, -7.094568252563477, -2.7922544479370117, 1.5100593566894531, 5.812374114990234, 10.114686965942383, 14.416999816894531, 18.719314575195312, 23.021629333496094, 27.323942184448242, 31.62625503540039, 35.92856979370117, 40.23088455200195, 44.53319549560547, 48.83551025390625, 53.13782501220703, 57.44013977050781, 61.742454528808594, 66.04476928710938, 70.34707641601562, 74.64939880371094, 78.95170593261719, 83.25402069091797, 87.55633544921875, 91.85865020751953, 96.16096496582031, 100.4632797241211, 104.76559448242188, 109.06790161132812, 113.3702163696289, 117.67253112792969, 121.97484588623047, 126.27716064453125, 130.5794677734375, 134.8817901611328, 139.18409729003906, 143.48641967773438, 147.78872680664062, 152.09103393554688, 156.3933563232422]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 15.0, 9.0, 14.0, 12.0, 17.0, 9.0, 22.0, 32.0, 34.0, 20.0, 20.0, 47.0, 45.0, 37.0, 40.0, 33.0, 45.0, 52.0, 38.0, 34.0, 41.0, 37.0, 39.0, 31.0, 34.0, 24.0, 27.0, 20.0, 27.0, 26.0, 14.0, 17.0, 14.0, 13.0, 15.0, 6.0, 3.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7265625, -11.345947265625, -10.96533203125, -10.584716796875, -10.2041015625, -9.823486328125, -9.44287109375, -9.062255859375, -8.681640625, -8.301025390625, -7.92041015625, -7.539794921875, -7.1591796875, -6.778564453125, -6.39794921875, -6.017333984375, -5.63671875, -5.256103515625, -4.87548828125, -4.494873046875, -4.1142578125, -3.733642578125, -3.35302734375, -2.972412109375, -2.591796875, -2.211181640625, -1.83056640625, -1.449951171875, -1.0693359375, -0.688720703125, -0.30810546875, 0.072509765625, 0.453125, 0.833740234375, 1.21435546875, 1.594970703125, 1.9755859375, 2.356201171875, 2.73681640625, 3.117431640625, 3.498046875, 3.878662109375, 4.25927734375, 4.639892578125, 5.0205078125, 5.401123046875, 5.78173828125, 6.162353515625, 6.54296875, 6.923583984375, 7.30419921875, 7.684814453125, 8.0654296875, 8.446044921875, 8.82666015625, 9.207275390625, 9.587890625, 9.968505859375, 10.34912109375, 10.729736328125, 11.1103515625, 11.490966796875, 11.87158203125, 12.252197265625, 12.6328125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 5.0, 9.0, 8.0, 12.0, 20.0, 21.0, 28.0, 42.0, 39.0, 70.0, 86.0, 146.0, 314.0, 691.0, 2314.0, 14351.0, 237616.0, 2777751.0, 1098985.0, 54052.0, 5400.0, 1243.0, 447.0, 204.0, 119.0, 78.0, 52.0, 26.0, 28.0, 24.0, 28.0, 21.0, 9.0, 11.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.53125, -37.31787109375, -36.1044921875, -34.89111328125, -33.677734375, -32.46435546875, -31.2509765625, -30.03759765625, -28.82421875, -27.61083984375, -26.3974609375, -25.18408203125, -23.970703125, -22.75732421875, -21.5439453125, -20.33056640625, -19.1171875, -17.90380859375, -16.6904296875, -15.47705078125, -14.263671875, -13.05029296875, -11.8369140625, -10.62353515625, -9.41015625, -8.19677734375, -6.9833984375, -5.77001953125, -4.556640625, -3.34326171875, -2.1298828125, -0.91650390625, 0.296875, 1.51025390625, 2.7236328125, 3.93701171875, 5.150390625, 6.36376953125, 7.5771484375, 8.79052734375, 10.00390625, 11.21728515625, 12.4306640625, 13.64404296875, 14.857421875, 16.07080078125, 17.2841796875, 18.49755859375, 19.7109375, 20.92431640625, 22.1376953125, 23.35107421875, 24.564453125, 25.77783203125, 26.9912109375, 28.20458984375, 29.41796875, 30.63134765625, 31.8447265625, 33.05810546875, 34.271484375, 35.48486328125, 36.6982421875, 37.91162109375, 39.125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 5.0, 6.0, 21.0, 17.0, 47.0, 60.0, 81.0, 149.0, 244.0, 391.0, 798.0, 860.0, 580.0, 308.0, 176.0, 120.0, 65.0, 66.0, 25.0, 21.0, 11.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-110.0, -107.51025390625, -105.0205078125, -102.53076171875, -100.041015625, -97.55126953125, -95.0615234375, -92.57177734375, -90.08203125, -87.59228515625, -85.1025390625, -82.61279296875, -80.123046875, -77.63330078125, -75.1435546875, -72.65380859375, -70.1640625, -67.67431640625, -65.1845703125, -62.69482421875, -60.205078125, -57.71533203125, -55.2255859375, -52.73583984375, -50.24609375, -47.75634765625, -45.2666015625, -42.77685546875, -40.287109375, -37.79736328125, -35.3076171875, -32.81787109375, -30.328125, -27.83837890625, -25.3486328125, -22.85888671875, -20.369140625, -17.87939453125, -15.3896484375, -12.89990234375, -10.41015625, -7.92041015625, -5.4306640625, -2.94091796875, -0.451171875, 2.03857421875, 4.5283203125, 7.01806640625, 9.5078125, 11.99755859375, 14.4873046875, 16.97705078125, 19.466796875, 21.95654296875, 24.4462890625, 26.93603515625, 29.42578125, 31.91552734375, 34.4052734375, 36.89501953125, 39.384765625, 41.87451171875, 44.3642578125, 46.85400390625, 49.34375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 10.0, 5.0, 11.0, 19.0, 45.0, 43.0, 81.0, 133.0, 174.0, 303.0, 627.0, 3990.0, 4176317.0, 10989.0, 649.0, 306.0, 217.0, 118.0, 72.0, 62.0, 32.0, 22.0, 17.0, 10.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.375, -186.728515625, -178.08203125, -169.435546875, -160.7890625, -152.142578125, -143.49609375, -134.849609375, -126.203125, -117.556640625, -108.91015625, -100.263671875, -91.6171875, -82.970703125, -74.32421875, -65.677734375, -57.03125, -48.384765625, -39.73828125, -31.091796875, -22.4453125, -13.798828125, -5.15234375, 3.494140625, 12.140625, 20.787109375, 29.43359375, 38.080078125, 46.7265625, 55.373046875, 64.01953125, 72.666015625, 81.3125, 89.958984375, 98.60546875, 107.251953125, 115.8984375, 124.544921875, 133.19140625, 141.837890625, 150.484375, 159.130859375, 167.77734375, 176.423828125, 185.0703125, 193.716796875, 202.36328125, 211.009765625, 219.65625, 228.302734375, 236.94921875, 245.595703125, 254.2421875, 262.888671875, 271.53515625, 280.181640625, 288.828125, 297.474609375, 306.12109375, 314.767578125, 323.4140625, 332.060546875, 340.70703125, 349.353515625, 358.0]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 29.0, 418.0, 528.0, 40.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1027.7467041015625, -1009.7408447265625, -991.7349853515625, -973.7291259765625, -955.7232666015625, -937.7174072265625, -919.7115478515625, -901.7056884765625, -883.6998291015625, -865.6939697265625, -847.6881103515625, -829.6822509765625, -811.6763916015625, -793.6705322265625, -775.6646728515625, -757.6588134765625, -739.6529541015625, -721.6470947265625, -703.6412353515625, -685.6353759765625, -667.6295166015625, -649.6236572265625, -631.6177978515625, -613.6119384765625, -595.6060791015625, -577.6002197265625, -559.5943603515625, -541.5885009765625, -523.5826416015625, -505.5767822265625, -487.5709228515625, -469.5650634765625, -451.55914306640625, -433.55328369140625, -415.54742431640625, -397.54156494140625, -379.53570556640625, -361.52984619140625, -343.52398681640625, -325.51812744140625, -307.51226806640625, -289.50640869140625, -271.50054931640625, -253.49468994140625, -235.48883056640625, -217.48297119140625, -199.47711181640625, -181.47125244140625, -163.46539306640625, -145.45953369140625, -127.45367431640625, -109.44781494140625, -91.44195556640625, -73.43609619140625, -55.43023681640625, -37.42437744140625, -19.41851806640625, -1.41265869140625, 16.59320068359375, 34.59906005859375, 52.60491943359375, 70.61077880859375, 88.61663818359375, 106.62249755859375, 124.62835693359375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 10.0, 4.0, 10.0, 15.0, 13.0, 10.0, 22.0, 12.0, 28.0, 21.0, 26.0, 27.0, 32.0, 35.0, 47.0, 29.0, 41.0, 38.0, 61.0, 44.0, 35.0, 49.0, 25.0, 45.0, 46.0, 40.0, 30.0, 29.0, 22.0, 25.0, 18.0, 22.0, 20.0, 14.0, 8.0, 13.0, 9.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-203.5912628173828, -197.81182861328125, -192.03237915039062, -186.25294494628906, -180.4735107421875, -174.69406127929688, -168.9146270751953, -163.13519287109375, -157.35574340820312, -151.57630920410156, -145.79685974121094, -140.01742553710938, -134.2379913330078, -128.45855712890625, -122.67910766601562, -116.89967346191406, -111.1202392578125, -105.3407974243164, -99.56136322021484, -93.78192138671875, -88.00248718261719, -82.2230453491211, -76.443603515625, -70.66416931152344, -64.88472747802734, -59.105289459228516, -53.32585144042969, -47.546409606933594, -41.766971588134766, -35.98753356933594, -30.208091735839844, -24.428653717041016, -18.649215698242188, -12.869776725769043, -7.090337753295898, -1.3108978271484375, 4.468540191650391, 10.247978210449219, 16.027420043945312, 21.80685806274414, 27.58629608154297, 33.3657341003418, 39.145172119140625, 44.92461395263672, 50.70405197143555, 56.483489990234375, 62.26293182373047, 68.04237365722656, 73.82180786132812, 79.60124969482422, 85.38068389892578, 91.16012573242188, 96.93955993652344, 102.71900177001953, 108.49844360351562, 114.27787780761719, 120.05731964111328, 125.83676147460938, 131.61619567871094, 137.3956298828125, 143.17507934570312, 148.9545135498047, 154.73394775390625, 160.51339721679688, 166.29283142089844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 8.0, 8.0, 11.0, 5.0, 18.0, 14.0, 17.0, 26.0, 25.0, 30.0, 32.0, 31.0, 37.0, 37.0, 36.0, 52.0, 37.0, 34.0, 46.0, 38.0, 37.0, 46.0, 40.0, 39.0, 41.0, 21.0, 18.0, 31.0, 26.0, 20.0, 21.0, 15.0, 20.0, 17.0, 7.0, 12.0, 6.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.015625, -12.626953125, -12.23828125, -11.849609375, -11.4609375, -11.072265625, -10.68359375, -10.294921875, -9.90625, -9.517578125, -9.12890625, -8.740234375, -8.3515625, -7.962890625, -7.57421875, -7.185546875, -6.796875, -6.408203125, -6.01953125, -5.630859375, -5.2421875, -4.853515625, -4.46484375, -4.076171875, -3.6875, -3.298828125, -2.91015625, -2.521484375, -2.1328125, -1.744140625, -1.35546875, -0.966796875, -0.578125, -0.189453125, 0.19921875, 0.587890625, 0.9765625, 1.365234375, 1.75390625, 2.142578125, 2.53125, 2.919921875, 3.30859375, 3.697265625, 4.0859375, 4.474609375, 4.86328125, 5.251953125, 5.640625, 6.029296875, 6.41796875, 6.806640625, 7.1953125, 7.583984375, 7.97265625, 8.361328125, 8.75, 9.138671875, 9.52734375, 9.916015625, 10.3046875, 10.693359375, 11.08203125, 11.470703125, 11.859375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 15.0, 25.0, 29.0, 42.0, 50.0, 89.0, 112.0, 194.0, 222.0, 414.0, 590.0, 908.0, 1434.0, 2237.0, 3684.0, 5956.0, 9895.0, 16784.0, 28497.0, 49177.0, 91328.0, 197561.0, 344813.0, 133526.0, 67486.0, 37911.0, 21909.0, 12975.0, 7759.0, 4790.0, 2917.0, 1849.0, 1161.0, 719.0, 488.0, 340.0, 186.0, 143.0, 90.0, 61.0, 58.0, 34.0, 17.0, 28.0, 10.0, 10.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.560546875, -3.4466552734375, -3.332763671875, -3.2188720703125, -3.10498046875, -2.9910888671875, -2.877197265625, -2.7633056640625, -2.6494140625, -2.5355224609375, -2.421630859375, -2.3077392578125, -2.19384765625, -2.0799560546875, -1.966064453125, -1.8521728515625, -1.73828125, -1.6243896484375, -1.510498046875, -1.3966064453125, -1.28271484375, -1.1688232421875, -1.054931640625, -0.9410400390625, -0.8271484375, -0.7132568359375, -0.599365234375, -0.4854736328125, -0.37158203125, -0.2576904296875, -0.143798828125, -0.0299072265625, 0.083984375, 0.1978759765625, 0.311767578125, 0.4256591796875, 0.53955078125, 0.6534423828125, 0.767333984375, 0.8812255859375, 0.9951171875, 1.1090087890625, 1.222900390625, 1.3367919921875, 1.45068359375, 1.5645751953125, 1.678466796875, 1.7923583984375, 1.90625, 2.0201416015625, 2.134033203125, 2.2479248046875, 2.36181640625, 2.4757080078125, 2.589599609375, 2.7034912109375, 2.8173828125, 2.9312744140625, 3.045166015625, 3.1590576171875, 3.27294921875, 3.3868408203125, 3.500732421875, 3.6146240234375, 3.728515625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 8.0, 11.0, 16.0, 23.0, 29.0, 21.0, 23.0, 28.0, 25.0, 48.0, 32.0, 29.0, 43.0, 43.0, 50.0, 1067.0, 51.0, 37.0, 29.0, 48.0, 37.0, 36.0, 34.0, 30.0, 24.0, 23.0, 26.0, 21.0, 18.0, 17.0, 12.0, 9.0, 17.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37109375, -7.12322998046875, -6.8753662109375, -6.62750244140625, -6.379638671875, -6.13177490234375, -5.8839111328125, -5.63604736328125, -5.38818359375, -5.14031982421875, -4.8924560546875, -4.64459228515625, -4.396728515625, -4.14886474609375, -3.9010009765625, -3.65313720703125, -3.4052734375, -3.15740966796875, -2.9095458984375, -2.66168212890625, -2.413818359375, -2.16595458984375, -1.9180908203125, -1.67022705078125, -1.42236328125, -1.17449951171875, -0.9266357421875, -0.67877197265625, -0.430908203125, -0.18304443359375, 0.0648193359375, 0.31268310546875, 0.560546875, 0.80841064453125, 1.0562744140625, 1.30413818359375, 1.552001953125, 1.79986572265625, 2.0477294921875, 2.29559326171875, 2.54345703125, 2.79132080078125, 3.0391845703125, 3.28704833984375, 3.534912109375, 3.78277587890625, 4.0306396484375, 4.27850341796875, 4.5263671875, 4.77423095703125, 5.0220947265625, 5.26995849609375, 5.517822265625, 5.76568603515625, 6.0135498046875, 6.26141357421875, 6.50927734375, 6.75714111328125, 7.0050048828125, 7.25286865234375, 7.500732421875, 7.74859619140625, 7.9964599609375, 8.24432373046875, 8.4921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 13.0, 19.0, 34.0, 33.0, 61.0, 87.0, 133.0, 199.0, 263.0, 394.0, 614.0, 945.0, 1499.0, 2228.0, 3684.0, 5749.0, 9126.0, 15274.0, 25024.0, 41732.0, 72409.0, 136221.0, 1402852.0, 169743.0, 85580.0, 48338.0, 28859.0, 17517.0, 10526.0, 6609.0, 4125.0, 2434.0, 1599.0, 1084.0, 692.0, 476.0, 294.0, 203.0, 144.0, 98.0, 64.0, 47.0, 30.0, 26.0, 10.0, 12.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.33984375, -3.237518310546875, -3.13519287109375, -3.032867431640625, -2.9305419921875, -2.828216552734375, -2.72589111328125, -2.623565673828125, -2.521240234375, -2.418914794921875, -2.31658935546875, -2.214263916015625, -2.1119384765625, -2.009613037109375, -1.90728759765625, -1.804962158203125, -1.70263671875, -1.600311279296875, -1.49798583984375, -1.395660400390625, -1.2933349609375, -1.191009521484375, -1.08868408203125, -0.986358642578125, -0.884033203125, -0.781707763671875, -0.67938232421875, -0.577056884765625, -0.4747314453125, -0.372406005859375, -0.27008056640625, -0.167755126953125, -0.0654296875, 0.036895751953125, 0.13922119140625, 0.241546630859375, 0.3438720703125, 0.446197509765625, 0.54852294921875, 0.650848388671875, 0.753173828125, 0.855499267578125, 0.95782470703125, 1.060150146484375, 1.1624755859375, 1.264801025390625, 1.36712646484375, 1.469451904296875, 1.57177734375, 1.674102783203125, 1.77642822265625, 1.878753662109375, 1.9810791015625, 2.083404541015625, 2.18572998046875, 2.288055419921875, 2.390380859375, 2.492706298828125, 2.59503173828125, 2.697357177734375, 2.7996826171875, 2.902008056640625, 3.00433349609375, 3.106658935546875, 3.208984375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 4.0, 5.0, 5.0, 9.0, 11.0, 7.0, 21.0, 18.0, 23.0, 36.0, 58.0, 86.0, 110.0, 133.0, 110.0, 96.0, 73.0, 55.0, 27.0, 19.0, 16.0, 15.0, 7.0, 9.0, 9.0, 4.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003131866455078125, -0.0030262768268585205, -0.002920687198638916, -0.0028150975704193115, -0.002709507942199707, -0.0026039183139801025, -0.002498328685760498, -0.0023927390575408936, -0.002287149429321289, -0.0021815598011016846, -0.00207597017288208, -0.0019703805446624756, -0.001864790916442871, -0.0017592012882232666, -0.0016536116600036621, -0.0015480220317840576, -0.0014424324035644531, -0.0013368427753448486, -0.0012312531471252441, -0.0011256635189056396, -0.0010200738906860352, -0.0009144842624664307, -0.0008088946342468262, -0.0007033050060272217, -0.0005977153778076172, -0.0004921257495880127, -0.0003865361213684082, -0.0002809464931488037, -0.00017535686492919922, -6.976723670959473e-05, 3.5822391510009766e-05, 0.00014141201972961426, 0.00024700164794921875, 0.00035259127616882324, 0.00045818090438842773, 0.0005637705326080322, 0.0006693601608276367, 0.0007749497890472412, 0.0008805394172668457, 0.0009861290454864502, 0.0010917186737060547, 0.0011973083019256592, 0.0013028979301452637, 0.0014084875583648682, 0.0015140771865844727, 0.0016196668148040771, 0.0017252564430236816, 0.0018308460712432861, 0.0019364356994628906, 0.002042025327682495, 0.0021476149559020996, 0.002253204584121704, 0.0023587942123413086, 0.002464383840560913, 0.0025699734687805176, 0.002675563097000122, 0.0027811527252197266, 0.002886742353439331, 0.0029923319816589355, 0.00309792160987854, 0.0032035112380981445, 0.003309100866317749, 0.0034146904945373535, 0.003520280122756958, 0.0036258697509765625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 3.0, 3.0, 6.0, 5.0, 9.0, 16.0, 10.0, 22.0, 30.0, 37.0, 77.0, 134.0, 209.0, 691.0, 1045091.0, 1520.0, 300.0, 137.0, 74.0, 51.0, 29.0, 25.0, 7.0, 9.0, 8.0, 5.0, 10.0, 9.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1070556640625, -0.10413646697998047, -0.10121726989746094, -0.0982980728149414, -0.09537887573242188, -0.09245967864990234, -0.08954048156738281, -0.08662128448486328, -0.08370208740234375, -0.08078289031982422, -0.07786369323730469, -0.07494449615478516, -0.07202529907226562, -0.0691061019897461, -0.06618690490722656, -0.06326770782470703, -0.0603485107421875, -0.05742931365966797, -0.05451011657714844, -0.051590919494628906, -0.048671722412109375, -0.045752525329589844, -0.04283332824707031, -0.03991413116455078, -0.03699493408203125, -0.03407573699951172, -0.031156539916992188, -0.028237342834472656, -0.025318145751953125, -0.022398948669433594, -0.019479751586914062, -0.01656055450439453, -0.013641357421875, -0.010722160339355469, -0.0078029632568359375, -0.004883766174316406, -0.001964569091796875, 0.0009546279907226562, 0.0038738250732421875, 0.006793022155761719, 0.00971221923828125, 0.012631416320800781, 0.015550613403320312, 0.018469810485839844, 0.021389007568359375, 0.024308204650878906, 0.027227401733398438, 0.03014659881591797, 0.0330657958984375, 0.03598499298095703, 0.03890419006347656, 0.041823387145996094, 0.044742584228515625, 0.047661781311035156, 0.05058097839355469, 0.05350017547607422, 0.05641937255859375, 0.05933856964111328, 0.06225776672363281, 0.06517696380615234, 0.06809616088867188, 0.0710153579711914, 0.07393455505371094, 0.07685375213623047, 0.07977294921875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 528.0, 485.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001317107817158103, -0.000987539766356349, -0.0006579716573469341, -0.00032840354833751917, 1.164502464234829e-06, 0.0003307325532659888, 0.0006603007204830647, 0.0009898687712848186, 0.0013194368220865726, 0.0016490048728883266, 0.0019785729236900806, 0.0023081409744918346, 0.0026377090252935886, 0.0029672770760953426, 0.0032968453597277403, 0.0036264134105294943, 0.003955981694161892, 0.004285549744963646, 0.0046151177957654, 0.004944685846567154, 0.005274253897368908, 0.005603821948170662, 0.005933389998972416, 0.00626295804977417, 0.006592526100575924, 0.006922094151377678, 0.007251662202179432, 0.007581230252981186, 0.00791079830378294, 0.008240366354584694, 0.008569934405386448, 0.008899502456188202, 0.009229070506989956, 0.00955863855779171, 0.009888206608593464, 0.010217774659395218, 0.010547342710196972, 0.010876910760998726, 0.01120647881180048, 0.011536046862602234, 0.011865614913403988, 0.012195182964205742, 0.012524751015007496, 0.01285431906580925, 0.013183887116611004, 0.013513455167412758, 0.013843023218214512, 0.014172591269016266, 0.014502160251140594, 0.014831728301942348, 0.015161296352744102, 0.015490864403545856, 0.01582043245434761, 0.01615000143647194, 0.01647956855595112, 0.016809137538075447, 0.017138704657554626, 0.017468273639678955, 0.017797840759158134, 0.018127409741282463, 0.018456976860761642, 0.01878654584288597, 0.01911611296236515, 0.01944568194448948, 0.01977524906396866]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 7.0, 12.0, 11.0, 18.0, 19.0, 16.0, 25.0, 19.0, 27.0, 17.0, 26.0, 43.0, 34.0, 38.0, 42.0, 38.0, 47.0, 40.0, 44.0, 33.0, 40.0, 36.0, 43.0, 36.0, 27.0, 24.0, 24.0, 28.0, 25.0, 21.0, 29.0, 21.0, 21.0, 9.0, 12.0, 5.0, 7.0, 6.0, 10.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.001367330551147461, -0.0013268524780869484, -0.0012863744050264359, -0.0012458963319659233, -0.0012054182589054108, -0.0011649401858448982, -0.0011244621127843857, -0.0010839840397238731, -0.0010435059666633606, -0.001003027893602848, -0.0009625498205423355, -0.000922071747481823, -0.0008815936744213104, -0.0008411156013607979, -0.0008006375283002853, -0.0007601594552397728, -0.0007196813821792603, -0.0006792033091187477, -0.0006387252360582352, -0.0005982471629977226, -0.0005577690899372101, -0.0005172910168766975, -0.000476812943816185, -0.00043633487075567245, -0.0003958567976951599, -0.00035537872463464737, -0.0003149006515741348, -0.0002744225785136223, -0.00023394450545310974, -0.0001934664323925972, -0.00015298835933208466, -0.00011251028627157211, -7.203221321105957e-05, -3.155414015054703e-05, 8.923932909965515e-06, 4.940200597047806e-05, 8.98800790309906e-05, 0.00013035815209150314, 0.00017083622515201569, 0.00021131429821252823, 0.00025179237127304077, 0.0002922704443335533, 0.00033274851739406586, 0.0003732265904545784, 0.00041370466351509094, 0.0004541827365756035, 0.000494660809636116, 0.0005351388826966286, 0.0005756169557571411, 0.0006160950288176537, 0.0006565731018781662, 0.0006970511749386787, 0.0007375292479991913, 0.0007780073210597038, 0.0008184853941202164, 0.0008589634671807289, 0.0008994415402412415, 0.000939919613301754, 0.0009803976863622665, 0.001020875759422779, 0.0010613538324832916, 0.0011018319055438042, 0.0011423099786043167, 0.0011827880516648293, 0.0012232661247253418]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 8.0, 8.0, 11.0, 5.0, 18.0, 14.0, 17.0, 26.0, 25.0, 30.0, 32.0, 31.0, 37.0, 37.0, 36.0, 52.0, 37.0, 34.0, 46.0, 38.0, 37.0, 46.0, 40.0, 39.0, 41.0, 21.0, 18.0, 31.0, 26.0, 20.0, 21.0, 15.0, 20.0, 17.0, 7.0, 12.0, 6.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.015625, -12.626953125, -12.23828125, -11.849609375, -11.4609375, -11.072265625, -10.68359375, -10.294921875, -9.90625, -9.517578125, -9.12890625, -8.740234375, -8.3515625, -7.962890625, -7.57421875, -7.185546875, -6.796875, -6.408203125, -6.01953125, -5.630859375, -5.2421875, -4.853515625, -4.46484375, -4.076171875, -3.6875, -3.298828125, -2.91015625, -2.521484375, -2.1328125, -1.744140625, -1.35546875, -0.966796875, -0.578125, -0.189453125, 0.19921875, 0.587890625, 0.9765625, 1.365234375, 1.75390625, 2.142578125, 2.53125, 2.919921875, 3.30859375, 3.697265625, 4.0859375, 4.474609375, 4.86328125, 5.251953125, 5.640625, 6.029296875, 6.41796875, 6.806640625, 7.1953125, 7.583984375, 7.97265625, 8.361328125, 8.75, 9.138671875, 9.52734375, 9.916015625, 10.3046875, 10.693359375, 11.08203125, 11.470703125, 11.859375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 7.0, 8.0, 10.0, 14.0, 15.0, 23.0, 37.0, 47.0, 70.0, 88.0, 161.0, 196.0, 285.0, 440.0, 676.0, 1093.0, 1821.0, 3187.0, 6024.0, 12424.0, 28663.0, 77378.0, 264226.0, 444911.0, 127583.0, 43150.0, 17410.0, 8211.0, 4101.0, 2369.0, 1365.0, 837.0, 554.0, 346.0, 265.0, 163.0, 108.0, 92.0, 61.0, 31.0, 33.0, 20.0, 15.0, 15.0, 10.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.421875, -8.152099609375, -7.88232421875, -7.612548828125, -7.3427734375, -7.072998046875, -6.80322265625, -6.533447265625, -6.263671875, -5.993896484375, -5.72412109375, -5.454345703125, -5.1845703125, -4.914794921875, -4.64501953125, -4.375244140625, -4.10546875, -3.835693359375, -3.56591796875, -3.296142578125, -3.0263671875, -2.756591796875, -2.48681640625, -2.217041015625, -1.947265625, -1.677490234375, -1.40771484375, -1.137939453125, -0.8681640625, -0.598388671875, -0.32861328125, -0.058837890625, 0.2109375, 0.480712890625, 0.75048828125, 1.020263671875, 1.2900390625, 1.559814453125, 1.82958984375, 2.099365234375, 2.369140625, 2.638916015625, 2.90869140625, 3.178466796875, 3.4482421875, 3.718017578125, 3.98779296875, 4.257568359375, 4.52734375, 4.797119140625, 5.06689453125, 5.336669921875, 5.6064453125, 5.876220703125, 6.14599609375, 6.415771484375, 6.685546875, 6.955322265625, 7.22509765625, 7.494873046875, 7.7646484375, 8.034423828125, 8.30419921875, 8.573974609375, 8.84375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 2.0, 5.0, 5.0, 13.0, 10.0, 15.0, 17.0, 10.0, 19.0, 28.0, 23.0, 28.0, 34.0, 36.0, 25.0, 40.0, 44.0, 55.0, 63.0, 151.0, 1858.0, 96.0, 61.0, 40.0, 49.0, 31.0, 41.0, 37.0, 29.0, 26.0, 21.0, 24.0, 17.0, 15.0, 11.0, 10.0, 11.0, 13.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-43.84375, -42.52978515625, -41.2158203125, -39.90185546875, -38.587890625, -37.27392578125, -35.9599609375, -34.64599609375, -33.33203125, -32.01806640625, -30.7041015625, -29.39013671875, -28.076171875, -26.76220703125, -25.4482421875, -24.13427734375, -22.8203125, -21.50634765625, -20.1923828125, -18.87841796875, -17.564453125, -16.25048828125, -14.9365234375, -13.62255859375, -12.30859375, -10.99462890625, -9.6806640625, -8.36669921875, -7.052734375, -5.73876953125, -4.4248046875, -3.11083984375, -1.796875, -0.48291015625, 0.8310546875, 2.14501953125, 3.458984375, 4.77294921875, 6.0869140625, 7.40087890625, 8.71484375, 10.02880859375, 11.3427734375, 12.65673828125, 13.970703125, 15.28466796875, 16.5986328125, 17.91259765625, 19.2265625, 20.54052734375, 21.8544921875, 23.16845703125, 24.482421875, 25.79638671875, 27.1103515625, 28.42431640625, 29.73828125, 31.05224609375, 32.3662109375, 33.68017578125, 34.994140625, 36.30810546875, 37.6220703125, 38.93603515625, 40.25]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 10.0, 14.0, 12.0, 9.0, 18.0, 15.0, 25.0, 25.0, 28.0, 33.0, 58.0, 81.0, 128.0, 204.0, 366.0, 896.0, 5380.0, 2953548.0, 180902.0, 2380.0, 638.0, 302.0, 165.0, 103.0, 71.0, 44.0, 48.0, 37.0, 25.0, 24.0, 15.0, 17.0, 16.0, 10.0, 14.0, 5.0, 4.0, 4.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-70.375, -68.0927734375, -65.810546875, -63.5283203125, -61.24609375, -58.9638671875, -56.681640625, -54.3994140625, -52.1171875, -49.8349609375, -47.552734375, -45.2705078125, -42.98828125, -40.7060546875, -38.423828125, -36.1416015625, -33.859375, -31.5771484375, -29.294921875, -27.0126953125, -24.73046875, -22.4482421875, -20.166015625, -17.8837890625, -15.6015625, -13.3193359375, -11.037109375, -8.7548828125, -6.47265625, -4.1904296875, -1.908203125, 0.3740234375, 2.65625, 4.9384765625, 7.220703125, 9.5029296875, 11.78515625, 14.0673828125, 16.349609375, 18.6318359375, 20.9140625, 23.1962890625, 25.478515625, 27.7607421875, 30.04296875, 32.3251953125, 34.607421875, 36.8896484375, 39.171875, 41.4541015625, 43.736328125, 46.0185546875, 48.30078125, 50.5830078125, 52.865234375, 55.1474609375, 57.4296875, 59.7119140625, 61.994140625, 64.2763671875, 66.55859375, 68.8408203125, 71.123046875, 73.4052734375, 75.6875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 11.0, 993.0, 14.0, 0.0, 1.0], "bins": [-910.322265625, -895.2715454101562, -880.2208251953125, -865.1701049804688, -850.119384765625, -835.0686645507812, -820.0179443359375, -804.9672241210938, -789.91650390625, -774.8657836914062, -759.8150634765625, -744.7643432617188, -729.713623046875, -714.6629028320312, -699.6121826171875, -684.5614624023438, -669.5108032226562, -654.4600830078125, -639.4093627929688, -624.358642578125, -609.3079223632812, -594.2572021484375, -579.2064819335938, -564.15576171875, -549.1050415039062, -534.0543212890625, -519.0036010742188, -503.952880859375, -488.90216064453125, -473.8514404296875, -458.80072021484375, -443.7500305175781, -428.6993103027344, -413.6485900878906, -398.5978698730469, -383.5471496582031, -368.4964294433594, -353.44573974609375, -338.39501953125, -323.34429931640625, -308.2935791015625, -293.24285888671875, -278.192138671875, -263.14141845703125, -248.09071350097656, -233.0399932861328, -217.98927307128906, -202.93856811523438, -187.8878173828125, -172.83709716796875, -157.786376953125, -142.73565673828125, -127.68495178222656, -112.63423156738281, -97.58351135253906, -82.53279876708984, -67.48208618164062, -52.43136978149414, -37.380653381347656, -22.329933166503906, -7.279216766357422, 7.7714996337890625, 22.822219848632812, 37.87293243408203, 52.92365264892578]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 7.0, 12.0, 13.0, 15.0, 11.0, 17.0, 20.0, 28.0, 35.0, 25.0, 30.0, 25.0, 31.0, 39.0, 42.0, 32.0, 46.0, 27.0, 36.0, 31.0, 44.0, 37.0, 35.0, 38.0, 45.0, 32.0, 31.0, 32.0, 18.0, 19.0, 25.0, 17.0, 11.0, 18.0, 8.0, 7.0, 9.0, 2.0, 7.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-134.83187866210938, -130.77552795410156, -126.71917724609375, -122.66283416748047, -118.60648345947266, -114.55013275146484, -110.49378967285156, -106.43743896484375, -102.38108825683594, -98.32473754882812, -94.26838684082031, -90.21204376220703, -86.15569305419922, -82.0993423461914, -78.04299926757812, -73.98664855957031, -69.9302978515625, -65.87394714355469, -61.81760025024414, -57.761253356933594, -53.70490264892578, -49.64855194091797, -45.59220504760742, -41.535858154296875, -37.47950744628906, -33.42315673828125, -29.366809844970703, -25.310461044311523, -21.254112243652344, -17.197763442993164, -13.141414642333984, -9.085065841674805, -5.028717041015625, -0.9723682403564453, 3.0839805603027344, 7.140329360961914, 11.196678161621094, 15.253026962280273, 19.309375762939453, 23.365724563598633, 27.422073364257812, 31.478422164916992, 35.53477096557617, 39.59111785888672, 43.64746856689453, 47.703819274902344, 51.76016616821289, 55.81651306152344, 59.87286376953125, 63.92921447753906, 67.98556518554688, 72.04190826416016, 76.09825897216797, 80.15460968017578, 84.21095275878906, 88.26730346679688, 92.32365417480469, 96.3800048828125, 100.43635559082031, 104.4926986694336, 108.5490493774414, 112.60540008544922, 116.6617431640625, 120.71809387207031, 124.77444458007812]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 7.0, 6.0, 6.0, 9.0, 11.0, 11.0, 14.0, 23.0, 18.0, 27.0, 28.0, 31.0, 34.0, 26.0, 36.0, 42.0, 42.0, 45.0, 41.0, 39.0, 36.0, 41.0, 35.0, 54.0, 33.0, 35.0, 40.0, 18.0, 24.0, 23.0, 22.0, 26.0, 21.0, 19.0, 17.0, 7.0, 12.0, 7.0, 3.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.0859375, -12.68896484375, -12.2919921875, -11.89501953125, -11.498046875, -11.10107421875, -10.7041015625, -10.30712890625, -9.91015625, -9.51318359375, -9.1162109375, -8.71923828125, -8.322265625, -7.92529296875, -7.5283203125, -7.13134765625, -6.734375, -6.33740234375, -5.9404296875, -5.54345703125, -5.146484375, -4.74951171875, -4.3525390625, -3.95556640625, -3.55859375, -3.16162109375, -2.7646484375, -2.36767578125, -1.970703125, -1.57373046875, -1.1767578125, -0.77978515625, -0.3828125, 0.01416015625, 0.4111328125, 0.80810546875, 1.205078125, 1.60205078125, 1.9990234375, 2.39599609375, 2.79296875, 3.18994140625, 3.5869140625, 3.98388671875, 4.380859375, 4.77783203125, 5.1748046875, 5.57177734375, 5.96875, 6.36572265625, 6.7626953125, 7.15966796875, 7.556640625, 7.95361328125, 8.3505859375, 8.74755859375, 9.14453125, 9.54150390625, 9.9384765625, 10.33544921875, 10.732421875, 11.12939453125, 11.5263671875, 11.92333984375, 12.3203125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 12.0, 11.0, 13.0, 13.0, 15.0, 24.0, 22.0, 20.0, 33.0, 26.0, 46.0, 28.0, 34.0, 45.0, 151.0, 985.0, 81544.0, 4049290.0, 60646.0, 810.0, 119.0, 64.0, 38.0, 46.0, 25.0, 24.0, 15.0, 28.0, 22.0, 15.0, 21.0, 21.0, 9.0, 16.0, 6.0, 6.0, 4.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.3125, -83.5703125, -80.828125, -78.0859375, -75.34375, -72.6015625, -69.859375, -67.1171875, -64.375, -61.6328125, -58.890625, -56.1484375, -53.40625, -50.6640625, -47.921875, -45.1796875, -42.4375, -39.6953125, -36.953125, -34.2109375, -31.46875, -28.7265625, -25.984375, -23.2421875, -20.5, -17.7578125, -15.015625, -12.2734375, -9.53125, -6.7890625, -4.046875, -1.3046875, 1.4375, 4.1796875, 6.921875, 9.6640625, 12.40625, 15.1484375, 17.890625, 20.6328125, 23.375, 26.1171875, 28.859375, 31.6015625, 34.34375, 37.0859375, 39.828125, 42.5703125, 45.3125, 48.0546875, 50.796875, 53.5390625, 56.28125, 59.0234375, 61.765625, 64.5078125, 67.25, 69.9921875, 72.734375, 75.4765625, 78.21875, 80.9609375, 83.703125, 86.4453125, 89.1875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 11.0, 26.0, 27.0, 47.0, 72.0, 113.0, 205.0, 390.0, 745.0, 955.0, 662.0, 335.0, 208.0, 95.0, 64.0, 37.0, 29.0, 16.0, 14.0, 13.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.40625, -61.09130859375, -58.7763671875, -56.46142578125, -54.146484375, -51.83154296875, -49.5166015625, -47.20166015625, -44.88671875, -42.57177734375, -40.2568359375, -37.94189453125, -35.626953125, -33.31201171875, -30.9970703125, -28.68212890625, -26.3671875, -24.05224609375, -21.7373046875, -19.42236328125, -17.107421875, -14.79248046875, -12.4775390625, -10.16259765625, -7.84765625, -5.53271484375, -3.2177734375, -0.90283203125, 1.412109375, 3.72705078125, 6.0419921875, 8.35693359375, 10.671875, 12.98681640625, 15.3017578125, 17.61669921875, 19.931640625, 22.24658203125, 24.5615234375, 26.87646484375, 29.19140625, 31.50634765625, 33.8212890625, 36.13623046875, 38.451171875, 40.76611328125, 43.0810546875, 45.39599609375, 47.7109375, 50.02587890625, 52.3408203125, 54.65576171875, 56.970703125, 59.28564453125, 61.6005859375, 63.91552734375, 66.23046875, 68.54541015625, 70.8603515625, 73.17529296875, 75.490234375, 77.80517578125, 80.1201171875, 82.43505859375, 84.75]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 22.0, 28.0, 40.0, 62.0, 84.0, 131.0, 231.0, 403.0, 1102.0, 3986590.0, 203941.0, 778.0, 368.0, 157.0, 112.0, 74.0, 70.0, 35.0, 21.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-377.0, -366.49609375, -355.9921875, -345.48828125, -334.984375, -324.48046875, -313.9765625, -303.47265625, -292.96875, -282.46484375, -271.9609375, -261.45703125, -250.953125, -240.44921875, -229.9453125, -219.44140625, -208.9375, -198.43359375, -187.9296875, -177.42578125, -166.921875, -156.41796875, -145.9140625, -135.41015625, -124.90625, -114.40234375, -103.8984375, -93.39453125, -82.890625, -72.38671875, -61.8828125, -51.37890625, -40.875, -30.37109375, -19.8671875, -9.36328125, 1.140625, 11.64453125, 22.1484375, 32.65234375, 43.15625, 53.66015625, 64.1640625, 74.66796875, 85.171875, 95.67578125, 106.1796875, 116.68359375, 127.1875, 137.69140625, 148.1953125, 158.69921875, 169.203125, 179.70703125, 190.2109375, 200.71484375, 211.21875, 221.72265625, 232.2265625, 242.73046875, 253.234375, 263.73828125, 274.2421875, 284.74609375, 295.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 66.0, 649.0, 282.0, 20.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1067.28857421875, -1047.4288330078125, -1027.569091796875, -1007.7092895507812, -987.8494873046875, -967.98974609375, -948.1299438476562, -928.2702026367188, -908.410400390625, -888.5506591796875, -868.6908569335938, -848.8311157226562, -828.9713134765625, -809.111572265625, -789.2517700195312, -769.3920288085938, -749.5322875976562, -729.6725463867188, -709.812744140625, -689.9530029296875, -670.0932006835938, -650.2334594726562, -630.3736572265625, -610.513916015625, -590.6541748046875, -570.79443359375, -550.9346313476562, -531.0748901367188, -511.215087890625, -491.3553466796875, -471.4955749511719, -451.63580322265625, -431.77606201171875, -411.9162902832031, -392.0565185546875, -372.1967468261719, -352.33697509765625, -332.47723388671875, -312.6174621582031, -292.7576904296875, -272.89788818359375, -253.03811645507812, -233.1783447265625, -213.31858825683594, -193.4588165283203, -173.5990447998047, -153.73928833007812, -133.8795166015625, -114.01976013183594, -94.15998840332031, -74.30022430419922, -54.44045639038086, -34.5806884765625, -14.720916748046875, 5.138847351074219, 24.998611450195312, 44.85838317871094, 64.71815490722656, 84.57791900634766, 104.43768310546875, 124.29745483398438, 144.1572265625, 164.01699829101562, 183.8767547607422, 203.7365264892578]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 10.0, 7.0, 5.0, 6.0, 7.0, 16.0, 14.0, 14.0, 23.0, 24.0, 30.0, 34.0, 27.0, 38.0, 28.0, 43.0, 46.0, 38.0, 33.0, 36.0, 40.0, 35.0, 37.0, 41.0, 35.0, 32.0, 34.0, 46.0, 28.0, 32.0, 21.0, 23.0, 13.0, 16.0, 12.0, 16.0, 15.0, 14.0, 9.0, 4.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-123.61080932617188, -119.3019790649414, -114.99315643310547, -110.684326171875, -106.37549591064453, -102.06666564941406, -97.75784301757812, -93.44901275634766, -89.14018249511719, -84.83135223388672, -80.52252960205078, -76.21369934082031, -71.90486907958984, -67.59603881835938, -63.28721618652344, -58.97838592529297, -54.66956329345703, -50.36073684692383, -46.05190658569336, -41.743080139160156, -37.43424987792969, -33.125423431396484, -28.81659698486328, -24.507768630981445, -20.19894027709961, -15.890111923217773, -11.581284523010254, -7.272457122802734, -2.9636287689208984, 1.3451995849609375, 5.654026031494141, 9.962854385375977, 14.271682739257812, 18.58051109313965, 22.889339447021484, 27.198165893554688, 31.506994247436523, 35.81582260131836, 40.12464904785156, 44.43347930908203, 48.742305755615234, 53.05113220214844, 57.359962463378906, 61.66878890991211, 65.97761535644531, 70.28644561767578, 74.59527587890625, 78.90409851074219, 83.21292877197266, 87.52175903320312, 91.83058166503906, 96.13941192626953, 100.4482421875, 104.75706481933594, 109.0658950805664, 113.37472534179688, 117.68354797363281, 121.99237823486328, 126.30120086669922, 130.6100311279297, 134.91885375976562, 139.22769165039062, 143.53651428222656, 147.8453369140625, 152.1541748046875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 4.0, 11.0, 11.0, 9.0, 12.0, 22.0, 23.0, 18.0, 28.0, 34.0, 27.0, 43.0, 38.0, 37.0, 42.0, 44.0, 36.0, 49.0, 44.0, 45.0, 40.0, 40.0, 39.0, 37.0, 33.0, 21.0, 25.0, 22.0, 25.0, 19.0, 16.0, 20.0, 15.0, 10.0, 15.0, 5.0, 4.0, 7.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.71875, -13.3016357421875, -12.884521484375, -12.4674072265625, -12.05029296875, -11.6331787109375, -11.216064453125, -10.7989501953125, -10.3818359375, -9.9647216796875, -9.547607421875, -9.1304931640625, -8.71337890625, -8.2962646484375, -7.879150390625, -7.4620361328125, -7.044921875, -6.6278076171875, -6.210693359375, -5.7935791015625, -5.37646484375, -4.9593505859375, -4.542236328125, -4.1251220703125, -3.7080078125, -3.2908935546875, -2.873779296875, -2.4566650390625, -2.03955078125, -1.6224365234375, -1.205322265625, -0.7882080078125, -0.37109375, 0.0460205078125, 0.463134765625, 0.8802490234375, 1.29736328125, 1.7144775390625, 2.131591796875, 2.5487060546875, 2.9658203125, 3.3829345703125, 3.800048828125, 4.2171630859375, 4.63427734375, 5.0513916015625, 5.468505859375, 5.8856201171875, 6.302734375, 6.7198486328125, 7.136962890625, 7.5540771484375, 7.97119140625, 8.3883056640625, 8.805419921875, 9.2225341796875, 9.6396484375, 10.0567626953125, 10.473876953125, 10.8909912109375, 11.30810546875, 11.7252197265625, 12.142333984375, 12.5594482421875, 12.9765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 13.0, 19.0, 34.0, 41.0, 59.0, 86.0, 118.0, 189.0, 252.0, 409.0, 588.0, 848.0, 1240.0, 1872.0, 2777.0, 4169.0, 6187.0, 9540.0, 14560.0, 22686.0, 35791.0, 59348.0, 102670.0, 219376.0, 277147.0, 113562.0, 64951.0, 39414.0, 24566.0, 15705.0, 10062.0, 6759.0, 4337.0, 3012.0, 1974.0, 1302.0, 899.0, 609.0, 438.0, 296.0, 192.0, 134.0, 96.0, 70.0, 47.0, 42.0, 18.0, 11.0, 10.0, 10.0, 2.0, 5.0, 3.0, 1.0, 2.0], "bins": [-3.302734375, -3.202911376953125, -3.10308837890625, -3.003265380859375, -2.9034423828125, -2.803619384765625, -2.70379638671875, -2.603973388671875, -2.504150390625, -2.404327392578125, -2.30450439453125, -2.204681396484375, -2.1048583984375, -2.005035400390625, -1.90521240234375, -1.805389404296875, -1.70556640625, -1.605743408203125, -1.50592041015625, -1.406097412109375, -1.3062744140625, -1.206451416015625, -1.10662841796875, -1.006805419921875, -0.906982421875, -0.807159423828125, -0.70733642578125, -0.607513427734375, -0.5076904296875, -0.407867431640625, -0.30804443359375, -0.208221435546875, -0.1083984375, -0.008575439453125, 0.09124755859375, 0.191070556640625, 0.2908935546875, 0.390716552734375, 0.49053955078125, 0.590362548828125, 0.690185546875, 0.790008544921875, 0.88983154296875, 0.989654541015625, 1.0894775390625, 1.189300537109375, 1.28912353515625, 1.388946533203125, 1.48876953125, 1.588592529296875, 1.68841552734375, 1.788238525390625, 1.8880615234375, 1.987884521484375, 2.08770751953125, 2.187530517578125, 2.287353515625, 2.387176513671875, 2.48699951171875, 2.586822509765625, 2.6866455078125, 2.786468505859375, 2.88629150390625, 2.986114501953125, 3.0859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 7.0, 5.0, 6.0, 8.0, 9.0, 8.0, 16.0, 23.0, 19.0, 14.0, 20.0, 35.0, 34.0, 31.0, 24.0, 40.0, 33.0, 45.0, 26.0, 31.0, 45.0, 1074.0, 40.0, 37.0, 32.0, 37.0, 26.0, 32.0, 29.0, 34.0, 26.0, 31.0, 27.0, 14.0, 15.0, 10.0, 13.0, 9.0, 6.0, 9.0, 11.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-8.3359375, -8.08477783203125, -7.8336181640625, -7.58245849609375, -7.331298828125, -7.08013916015625, -6.8289794921875, -6.57781982421875, -6.32666015625, -6.07550048828125, -5.8243408203125, -5.57318115234375, -5.322021484375, -5.07086181640625, -4.8197021484375, -4.56854248046875, -4.3173828125, -4.06622314453125, -3.8150634765625, -3.56390380859375, -3.312744140625, -3.06158447265625, -2.8104248046875, -2.55926513671875, -2.30810546875, -2.05694580078125, -1.8057861328125, -1.55462646484375, -1.303466796875, -1.05230712890625, -0.8011474609375, -0.54998779296875, -0.298828125, -0.04766845703125, 0.2034912109375, 0.45465087890625, 0.705810546875, 0.95697021484375, 1.2081298828125, 1.45928955078125, 1.71044921875, 1.96160888671875, 2.2127685546875, 2.46392822265625, 2.715087890625, 2.96624755859375, 3.2174072265625, 3.46856689453125, 3.7197265625, 3.97088623046875, 4.2220458984375, 4.47320556640625, 4.724365234375, 4.97552490234375, 5.2266845703125, 5.47784423828125, 5.72900390625, 5.98016357421875, 6.2313232421875, 6.48248291015625, 6.733642578125, 6.98480224609375, 7.2359619140625, 7.48712158203125, 7.73828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 4.0, 7.0, 11.0, 19.0, 16.0, 21.0, 34.0, 62.0, 76.0, 104.0, 145.0, 202.0, 283.0, 357.0, 567.0, 833.0, 1128.0, 1619.0, 2502.0, 3785.0, 5422.0, 8223.0, 13116.0, 20035.0, 32275.0, 52300.0, 87215.0, 161583.0, 1376248.0, 130273.0, 74403.0, 44959.0, 27860.0, 17576.0, 11215.0, 7360.0, 4956.0, 3294.0, 2161.0, 1422.0, 1029.0, 735.0, 509.0, 348.0, 206.0, 175.0, 135.0, 100.0, 69.0, 48.0, 39.0, 22.0, 17.0, 6.0, 10.0, 5.0, 9.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.142578125, -3.042327880859375, -2.94207763671875, -2.841827392578125, -2.7415771484375, -2.641326904296875, -2.54107666015625, -2.440826416015625, -2.340576171875, -2.240325927734375, -2.14007568359375, -2.039825439453125, -1.9395751953125, -1.839324951171875, -1.73907470703125, -1.638824462890625, -1.53857421875, -1.438323974609375, -1.33807373046875, -1.237823486328125, -1.1375732421875, -1.037322998046875, -0.93707275390625, -0.836822509765625, -0.736572265625, -0.636322021484375, -0.53607177734375, -0.435821533203125, -0.3355712890625, -0.235321044921875, -0.13507080078125, -0.034820556640625, 0.0654296875, 0.165679931640625, 0.26593017578125, 0.366180419921875, 0.4664306640625, 0.566680908203125, 0.66693115234375, 0.767181396484375, 0.867431640625, 0.967681884765625, 1.06793212890625, 1.168182373046875, 1.2684326171875, 1.368682861328125, 1.46893310546875, 1.569183349609375, 1.66943359375, 1.769683837890625, 1.86993408203125, 1.970184326171875, 2.0704345703125, 2.170684814453125, 2.27093505859375, 2.371185302734375, 2.471435546875, 2.571685791015625, 2.67193603515625, 2.772186279296875, 2.8724365234375, 2.972686767578125, 3.07293701171875, 3.173187255859375, 3.2734375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 8.0, 14.0, 9.0, 24.0, 23.0, 24.0, 30.0, 34.0, 57.0, 47.0, 94.0, 101.0, 109.0, 97.0, 63.0, 54.0, 41.0, 40.0, 33.0, 19.0, 13.0, 13.0, 6.0, 12.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002468109130859375, -0.0023861825466156006, -0.002304255962371826, -0.0022223293781280518, -0.0021404027938842773, -0.002058476209640503, -0.0019765496253967285, -0.001894623041152954, -0.0018126964569091797, -0.0017307698726654053, -0.0016488432884216309, -0.0015669167041778564, -0.001484990119934082, -0.0014030635356903076, -0.0013211369514465332, -0.0012392103672027588, -0.0011572837829589844, -0.00107535719871521, -0.0009934306144714355, -0.0009115040302276611, -0.0008295774459838867, -0.0007476508617401123, -0.0006657242774963379, -0.0005837976932525635, -0.0005018711090087891, -0.00041994452476501465, -0.00033801794052124023, -0.0002560913562774658, -0.0001741647720336914, -9.223818778991699e-05, -1.0311603546142578e-05, 7.161498069763184e-05, 0.00015354156494140625, 0.00023546814918518066, 0.0003173947334289551, 0.0003993213176727295, 0.0004812479019165039, 0.0005631744861602783, 0.0006451010704040527, 0.0007270276546478271, 0.0008089542388916016, 0.000890880823135376, 0.0009728074073791504, 0.0010547339916229248, 0.0011366605758666992, 0.0012185871601104736, 0.001300513744354248, 0.0013824403285980225, 0.0014643669128417969, 0.0015462934970855713, 0.0016282200813293457, 0.0017101466655731201, 0.0017920732498168945, 0.001873999834060669, 0.0019559264183044434, 0.0020378530025482178, 0.002119779586791992, 0.0022017061710357666, 0.002283632755279541, 0.0023655593395233154, 0.00244748592376709, 0.0025294125080108643, 0.0026113390922546387, 0.002693265676498413, 0.0027751922607421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 9.0, 5.0, 11.0, 12.0, 19.0, 31.0, 41.0, 56.0, 70.0, 116.0, 218.0, 494.0, 877506.0, 168908.0, 471.0, 210.0, 101.0, 85.0, 52.0, 34.0, 21.0, 20.0, 13.0, 10.0, 9.0, 6.0, 4.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07684326171875, -0.0746450424194336, -0.07244682312011719, -0.07024860382080078, -0.06805038452148438, -0.06585216522216797, -0.06365394592285156, -0.061455726623535156, -0.05925750732421875, -0.057059288024902344, -0.05486106872558594, -0.05266284942626953, -0.050464630126953125, -0.04826641082763672, -0.04606819152832031, -0.043869972229003906, -0.0416717529296875, -0.039473533630371094, -0.03727531433105469, -0.03507709503173828, -0.032878875732421875, -0.03068065643310547, -0.028482437133789062, -0.026284217834472656, -0.02408599853515625, -0.021887779235839844, -0.019689559936523438, -0.01749134063720703, -0.015293121337890625, -0.013094902038574219, -0.010896682739257812, -0.008698463439941406, -0.006500244140625, -0.004302024841308594, -0.0021038055419921875, 9.441375732421875e-05, 0.002292633056640625, 0.004490852355957031, 0.0066890716552734375, 0.008887290954589844, 0.01108551025390625, 0.013283729553222656, 0.015481948852539062, 0.01768016815185547, 0.019878387451171875, 0.02207660675048828, 0.024274826049804688, 0.026473045349121094, 0.0286712646484375, 0.030869483947753906, 0.03306770324707031, 0.03526592254638672, 0.037464141845703125, 0.03966236114501953, 0.04186058044433594, 0.044058799743652344, 0.04625701904296875, 0.048455238342285156, 0.05065345764160156, 0.05285167694091797, 0.055049896240234375, 0.05724811553955078, 0.05944633483886719, 0.061644554138183594, 0.0638427734375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 18.0, 683.0, 315.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002351014409214258, -0.0021123590413480997, -0.001873703789897263, -0.0016350485384464264, -0.001396393170580268, -0.0011577378027141094, -0.0009190825512632728, -0.0006804272998124361, -0.0004417719319462776, -0.00020311662228778005, 3.5538687370717525e-05, 0.0002741939970292151, 0.0005128493066877127, 0.0007515046745538712, 0.0009901599260047078, 0.0012288151774555445, 0.001467470545321703, 0.0017061259131878614, 0.001944781164638698, 0.0021834364160895348, 0.0024220917839556932, 0.0026607471518218517, 0.0028994022868573666, 0.003138057654723525, 0.0033767130225896835, 0.003615368390455842, 0.0038540237583220005, 0.004092678893357515, 0.0043313344940543175, 0.004569989629089832, 0.004808644764125347, 0.005047299899160862, 0.005285955965518951, 0.005524611100554466, 0.005763266701251268, 0.006001921836286783, 0.006240577436983585, 0.0064792325720191, 0.006717887707054615, 0.00695654284209013, 0.007195198442786932, 0.007433853577822447, 0.007672509178519249, 0.007911164313554764, 0.008149819448590279, 0.008388474583625793, 0.008627130649983883, 0.008865785785019398, 0.009104440920054913, 0.009343096055090427, 0.009581751190125942, 0.009820407256484032, 0.010059062391519547, 0.010297717526555061, 0.010536372661590576, 0.010775027796626091, 0.011013682931661606, 0.01125233806669712, 0.011490993201732635, 0.011729649268090725, 0.01196830440312624, 0.012206959538161755, 0.01244561467319727, 0.012684269808232784, 0.012922925874590874]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 8.0, 9.0, 9.0, 12.0, 21.0, 17.0, 25.0, 26.0, 44.0, 27.0, 41.0, 43.0, 36.0, 35.0, 56.0, 51.0, 44.0, 54.0, 44.0, 49.0, 44.0, 47.0, 36.0, 41.0, 29.0, 25.0, 27.0, 14.0, 19.0, 19.0, 7.0, 9.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001042783260345459, -0.0010045096278190613, -0.0009662359952926636, -0.0009279623627662659, -0.0008896887302398682, -0.0008514150977134705, -0.0008131414651870728, -0.000774867832660675, -0.0007365942001342773, -0.0006983205676078796, -0.0006600469350814819, -0.0006217733025550842, -0.0005834996700286865, -0.0005452260375022888, -0.0005069524049758911, -0.0004686787724494934, -0.0004304051399230957, -0.000392131507396698, -0.0003538578748703003, -0.0003155842423439026, -0.0002773106098175049, -0.00023903697729110718, -0.00020076334476470947, -0.00016248971223831177, -0.00012421607971191406, -8.594244718551636e-05, -4.766881465911865e-05, -9.395182132720947e-06, 2.8878450393676758e-05, 6.715208292007446e-05, 0.00010542571544647217, 0.00014369934797286987, 0.00018197298049926758, 0.00022024661302566528, 0.000258520245552063, 0.0002967938780784607, 0.0003350675106048584, 0.0003733411431312561, 0.0004116147756576538, 0.0004498884081840515, 0.0004881620407104492, 0.0005264356732368469, 0.0005647093057632446, 0.0006029829382896423, 0.00064125657081604, 0.0006795302033424377, 0.0007178038358688354, 0.0007560774683952332, 0.0007943511009216309, 0.0008326247334480286, 0.0008708983659744263, 0.000909171998500824, 0.0009474456310272217, 0.0009857192635536194, 0.001023992896080017, 0.0010622665286064148, 0.0011005401611328125, 0.0011388137936592102, 0.001177087426185608, 0.0012153610587120056, 0.0012536346912384033, 0.001291908323764801, 0.0013301819562911987, 0.0013684555888175964, 0.0014067292213439941]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 4.0, 11.0, 11.0, 9.0, 12.0, 22.0, 23.0, 18.0, 28.0, 34.0, 27.0, 43.0, 38.0, 37.0, 42.0, 44.0, 36.0, 49.0, 44.0, 45.0, 40.0, 40.0, 39.0, 37.0, 33.0, 21.0, 25.0, 22.0, 25.0, 19.0, 16.0, 20.0, 15.0, 10.0, 15.0, 5.0, 4.0, 7.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.71875, -13.3016357421875, -12.884521484375, -12.4674072265625, -12.05029296875, -11.6331787109375, -11.216064453125, -10.7989501953125, -10.3818359375, -9.9647216796875, -9.547607421875, -9.1304931640625, -8.71337890625, -8.2962646484375, -7.879150390625, -7.4620361328125, -7.044921875, -6.6278076171875, -6.210693359375, -5.7935791015625, -5.37646484375, -4.9593505859375, -4.542236328125, -4.1251220703125, -3.7080078125, -3.2908935546875, -2.873779296875, -2.4566650390625, -2.03955078125, -1.6224365234375, -1.205322265625, -0.7882080078125, -0.37109375, 0.0460205078125, 0.463134765625, 0.8802490234375, 1.29736328125, 1.7144775390625, 2.131591796875, 2.5487060546875, 2.9658203125, 3.3829345703125, 3.800048828125, 4.2171630859375, 4.63427734375, 5.0513916015625, 5.468505859375, 5.8856201171875, 6.302734375, 6.7198486328125, 7.136962890625, 7.5540771484375, 7.97119140625, 8.3883056640625, 8.805419921875, 9.2225341796875, 9.6396484375, 10.0567626953125, 10.473876953125, 10.8909912109375, 11.30810546875, 11.7252197265625, 12.142333984375, 12.5594482421875, 12.9765625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 15.0, 31.0, 39.0, 66.0, 72.0, 116.0, 151.0, 228.0, 351.0, 527.0, 835.0, 1323.0, 2285.0, 4102.0, 8577.0, 20003.0, 58398.0, 240037.0, 516676.0, 129285.0, 37188.0, 13763.0, 6280.0, 3286.0, 1781.0, 1103.0, 655.0, 427.0, 278.0, 202.0, 127.0, 93.0, 67.0, 47.0, 29.0, 30.0, 22.0, 18.0, 8.0, 1.0, 1.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.796875, -7.53076171875, -7.2646484375, -6.99853515625, -6.732421875, -6.46630859375, -6.2001953125, -5.93408203125, -5.66796875, -5.40185546875, -5.1357421875, -4.86962890625, -4.603515625, -4.33740234375, -4.0712890625, -3.80517578125, -3.5390625, -3.27294921875, -3.0068359375, -2.74072265625, -2.474609375, -2.20849609375, -1.9423828125, -1.67626953125, -1.41015625, -1.14404296875, -0.8779296875, -0.61181640625, -0.345703125, -0.07958984375, 0.1865234375, 0.45263671875, 0.71875, 0.98486328125, 1.2509765625, 1.51708984375, 1.783203125, 2.04931640625, 2.3154296875, 2.58154296875, 2.84765625, 3.11376953125, 3.3798828125, 3.64599609375, 3.912109375, 4.17822265625, 4.4443359375, 4.71044921875, 4.9765625, 5.24267578125, 5.5087890625, 5.77490234375, 6.041015625, 6.30712890625, 6.5732421875, 6.83935546875, 7.10546875, 7.37158203125, 7.6376953125, 7.90380859375, 8.169921875, 8.43603515625, 8.7021484375, 8.96826171875, 9.234375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 3.0, 6.0, 7.0, 10.0, 8.0, 11.0, 26.0, 29.0, 25.0, 34.0, 29.0, 38.0, 41.0, 45.0, 59.0, 60.0, 156.0, 1939.0, 105.0, 63.0, 57.0, 47.0, 44.0, 38.0, 29.0, 28.0, 12.0, 18.0, 13.0, 10.0, 7.0, 12.0, 6.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-57.34375, -55.619140625, -53.89453125, -52.169921875, -50.4453125, -48.720703125, -46.99609375, -45.271484375, -43.546875, -41.822265625, -40.09765625, -38.373046875, -36.6484375, -34.923828125, -33.19921875, -31.474609375, -29.75, -28.025390625, -26.30078125, -24.576171875, -22.8515625, -21.126953125, -19.40234375, -17.677734375, -15.953125, -14.228515625, -12.50390625, -10.779296875, -9.0546875, -7.330078125, -5.60546875, -3.880859375, -2.15625, -0.431640625, 1.29296875, 3.017578125, 4.7421875, 6.466796875, 8.19140625, 9.916015625, 11.640625, 13.365234375, 15.08984375, 16.814453125, 18.5390625, 20.263671875, 21.98828125, 23.712890625, 25.4375, 27.162109375, 28.88671875, 30.611328125, 32.3359375, 34.060546875, 35.78515625, 37.509765625, 39.234375, 40.958984375, 42.68359375, 44.408203125, 46.1328125, 47.857421875, 49.58203125, 51.306640625, 53.03125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 6.0, 11.0, 8.0, 12.0, 12.0, 27.0, 20.0, 28.0, 47.0, 66.0, 104.0, 124.0, 270.0, 636.0, 3083.0, 3008460.0, 130075.0, 1514.0, 460.0, 242.0, 128.0, 78.0, 68.0, 47.0, 30.0, 32.0, 31.0, 13.0, 9.0, 13.0, 5.0, 6.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.3125, -84.482421875, -81.65234375, -78.822265625, -75.9921875, -73.162109375, -70.33203125, -67.501953125, -64.671875, -61.841796875, -59.01171875, -56.181640625, -53.3515625, -50.521484375, -47.69140625, -44.861328125, -42.03125, -39.201171875, -36.37109375, -33.541015625, -30.7109375, -27.880859375, -25.05078125, -22.220703125, -19.390625, -16.560546875, -13.73046875, -10.900390625, -8.0703125, -5.240234375, -2.41015625, 0.419921875, 3.25, 6.080078125, 8.91015625, 11.740234375, 14.5703125, 17.400390625, 20.23046875, 23.060546875, 25.890625, 28.720703125, 31.55078125, 34.380859375, 37.2109375, 40.041015625, 42.87109375, 45.701171875, 48.53125, 51.361328125, 54.19140625, 57.021484375, 59.8515625, 62.681640625, 65.51171875, 68.341796875, 71.171875, 74.001953125, 76.83203125, 79.662109375, 82.4921875, 85.322265625, 88.15234375, 90.982421875, 93.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 21.0, 57.0, 132.0, 217.0, 234.0, 178.0, 101.0, 42.0, 14.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.36103439331055, -54.66956329345703, -52.97808837890625, -51.286617279052734, -49.59514236450195, -47.90367126464844, -46.212196350097656, -44.52072525024414, -42.82925033569336, -41.137779235839844, -39.44630432128906, -37.75483322143555, -36.063358306884766, -34.37188720703125, -32.68041229248047, -30.988941192626953, -29.297468185424805, -27.605995178222656, -25.914522171020508, -24.22304916381836, -22.53157615661621, -20.840103149414062, -19.148632049560547, -17.457157135009766, -15.765685081481934, -14.074212074279785, -12.382739067077637, -10.691267013549805, -8.999794006347656, -7.308320999145508, -5.616847991943359, -3.925374984741211, -2.2339019775390625, -0.5424290895462036, 1.1490437984466553, 2.8405165672302246, 4.531989574432373, 6.223462104797363, 7.914935111999512, 9.60640811920166, 11.297881126403809, 12.989354133605957, 14.680827140808105, 16.372299194335938, 18.063772201538086, 19.755245208740234, 21.446718215942383, 23.13819122314453, 24.82966423034668, 26.521137237548828, 28.212610244750977, 29.904083251953125, 31.595556259155273, 33.28702926635742, 34.97850036621094, 36.66997528076172, 38.361446380615234, 40.05291748046875, 41.74439239501953, 43.43586349487305, 45.12733840942383, 46.818809509277344, 48.510284423828125, 50.20175552368164, 51.89323043823242]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 10.0, 4.0, 6.0, 6.0, 10.0, 7.0, 19.0, 17.0, 18.0, 24.0, 20.0, 27.0, 23.0, 26.0, 25.0, 18.0, 34.0, 35.0, 49.0, 30.0, 32.0, 38.0, 44.0, 36.0, 38.0, 37.0, 27.0, 34.0, 37.0, 36.0, 25.0, 22.0, 27.0, 29.0, 17.0, 13.0, 14.0, 12.0, 12.0, 12.0, 11.0, 10.0, 7.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-137.01206970214844, -132.70550537109375, -128.39894104003906, -124.09236907958984, -119.78579711914062, -115.47923278808594, -111.17266845703125, -106.86610412597656, -102.55953216552734, -98.25296783447266, -93.94639587402344, -89.63983154296875, -85.33326721191406, -81.02669525146484, -76.72013092041016, -72.41355895996094, -68.10699462890625, -63.8004264831543, -59.493858337402344, -55.187294006347656, -50.8807258605957, -46.57415771484375, -42.26759338378906, -37.96102523803711, -33.654457092285156, -29.347888946533203, -25.041322708129883, -20.734756469726562, -16.42818832397461, -12.121620178222656, -7.815053939819336, -3.5084877014160156, 0.798095703125, 5.104662895202637, 9.411230087280273, 13.71779727935791, 18.024364471435547, 22.3309326171875, 26.63749885559082, 30.94406509399414, 35.250633239746094, 39.55720138549805, 43.86376953125, 48.17033386230469, 52.47690200805664, 56.783470153808594, 61.09003448486328, 65.3966064453125, 69.70317077636719, 74.00973510742188, 78.3163070678711, 82.62287139892578, 86.929443359375, 91.23600769042969, 95.54257202148438, 99.84913635253906, 104.15570831298828, 108.46227264404297, 112.76884460449219, 117.07540893554688, 121.38197326660156, 125.68854522705078, 129.9951171875, 134.3016815185547, 138.60824584960938]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 6.0, 2.0, 6.0, 9.0, 14.0, 9.0, 18.0, 15.0, 26.0, 20.0, 24.0, 34.0, 31.0, 38.0, 37.0, 45.0, 32.0, 45.0, 43.0, 48.0, 46.0, 54.0, 29.0, 39.0, 37.0, 30.0, 33.0, 31.0, 23.0, 21.0, 25.0, 24.0, 14.0, 21.0, 10.0, 12.0, 11.0, 6.0, 4.0, 6.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.828125, -13.40625, -12.984375, -12.5625, -12.140625, -11.71875, -11.296875, -10.875, -10.453125, -10.03125, -9.609375, -9.1875, -8.765625, -8.34375, -7.921875, -7.5, -7.078125, -6.65625, -6.234375, -5.8125, -5.390625, -4.96875, -4.546875, -4.125, -3.703125, -3.28125, -2.859375, -2.4375, -2.015625, -1.59375, -1.171875, -0.75, -0.328125, 0.09375, 0.515625, 0.9375, 1.359375, 1.78125, 2.203125, 2.625, 3.046875, 3.46875, 3.890625, 4.3125, 4.734375, 5.15625, 5.578125, 6.0, 6.421875, 6.84375, 7.265625, 7.6875, 8.109375, 8.53125, 8.953125, 9.375, 9.796875, 10.21875, 10.640625, 11.0625, 11.484375, 11.90625, 12.328125, 12.75, 13.171875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 5.0, 7.0, 9.0, 12.0, 11.0, 23.0, 30.0, 51.0, 55.0, 81.0, 136.0, 210.0, 381.0, 1075.0, 2954.0, 13770.0, 97596.0, 737393.0, 2340929.0, 861999.0, 115145.0, 16868.0, 3362.0, 1050.0, 428.0, 220.0, 130.0, 104.0, 53.0, 48.0, 38.0, 21.0, 17.0, 15.0, 16.0, 12.0, 4.0, 8.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.65625, -24.891357421875, -24.12646484375, -23.361572265625, -22.5966796875, -21.831787109375, -21.06689453125, -20.302001953125, -19.537109375, -18.772216796875, -18.00732421875, -17.242431640625, -16.4775390625, -15.712646484375, -14.94775390625, -14.182861328125, -13.41796875, -12.653076171875, -11.88818359375, -11.123291015625, -10.3583984375, -9.593505859375, -8.82861328125, -8.063720703125, -7.298828125, -6.533935546875, -5.76904296875, -5.004150390625, -4.2392578125, -3.474365234375, -2.70947265625, -1.944580078125, -1.1796875, -0.414794921875, 0.35009765625, 1.114990234375, 1.8798828125, 2.644775390625, 3.40966796875, 4.174560546875, 4.939453125, 5.704345703125, 6.46923828125, 7.234130859375, 7.9990234375, 8.763916015625, 9.52880859375, 10.293701171875, 11.05859375, 11.823486328125, 12.58837890625, 13.353271484375, 14.1181640625, 14.883056640625, 15.64794921875, 16.412841796875, 17.177734375, 17.942626953125, 18.70751953125, 19.472412109375, 20.2373046875, 21.002197265625, 21.76708984375, 22.531982421875, 23.296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 11.0, 11.0, 18.0, 24.0, 26.0, 36.0, 43.0, 73.0, 94.0, 124.0, 185.0, 280.0, 392.0, 600.0, 601.0, 465.0, 331.0, 227.0, 152.0, 90.0, 64.0, 51.0, 37.0, 34.0, 24.0, 17.0, 17.0, 10.0, 5.0, 7.0, 5.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.53125, -46.0546875, -44.578125, -43.1015625, -41.625, -40.1484375, -38.671875, -37.1953125, -35.71875, -34.2421875, -32.765625, -31.2890625, -29.8125, -28.3359375, -26.859375, -25.3828125, -23.90625, -22.4296875, -20.953125, -19.4765625, -18.0, -16.5234375, -15.046875, -13.5703125, -12.09375, -10.6171875, -9.140625, -7.6640625, -6.1875, -4.7109375, -3.234375, -1.7578125, -0.28125, 1.1953125, 2.671875, 4.1484375, 5.625, 7.1015625, 8.578125, 10.0546875, 11.53125, 13.0078125, 14.484375, 15.9609375, 17.4375, 18.9140625, 20.390625, 21.8671875, 23.34375, 24.8203125, 26.296875, 27.7734375, 29.25, 30.7265625, 32.203125, 33.6796875, 35.15625, 36.6328125, 38.109375, 39.5859375, 41.0625, 42.5390625, 44.015625, 45.4921875, 46.96875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 15.0, 26.0, 25.0, 43.0, 42.0, 81.0, 108.0, 164.0, 275.0, 536.0, 3238.0, 4169474.0, 18522.0, 766.0, 335.0, 185.0, 129.0, 85.0, 67.0, 37.0, 33.0, 23.0, 13.0, 12.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-263.75, -255.41796875, -247.0859375, -238.75390625, -230.421875, -222.08984375, -213.7578125, -205.42578125, -197.09375, -188.76171875, -180.4296875, -172.09765625, -163.765625, -155.43359375, -147.1015625, -138.76953125, -130.4375, -122.10546875, -113.7734375, -105.44140625, -97.109375, -88.77734375, -80.4453125, -72.11328125, -63.78125, -55.44921875, -47.1171875, -38.78515625, -30.453125, -22.12109375, -13.7890625, -5.45703125, 2.875, 11.20703125, 19.5390625, 27.87109375, 36.203125, 44.53515625, 52.8671875, 61.19921875, 69.53125, 77.86328125, 86.1953125, 94.52734375, 102.859375, 111.19140625, 119.5234375, 127.85546875, 136.1875, 144.51953125, 152.8515625, 161.18359375, 169.515625, 177.84765625, 186.1796875, 194.51171875, 202.84375, 211.17578125, 219.5078125, 227.83984375, 236.171875, 244.50390625, 252.8359375, 261.16796875, 269.5]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 28.0, 73.0, 193.0, 291.0, 257.0, 116.0, 30.0, 15.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.45133209228516, -101.4977035522461, -93.54407501220703, -85.59043884277344, -77.63681030273438, -69.68318176269531, -61.72955322265625, -53.77592086791992, -45.82229232788086, -37.8686637878418, -29.91503143310547, -21.961402893066406, -14.007772445678711, -6.054141998291016, 1.8994865417480469, 9.853118896484375, 17.806747436523438, 25.760377883911133, 33.71400833129883, 41.66763687133789, 49.62126922607422, 57.57489776611328, 65.52852630615234, 73.48216247558594, 81.435791015625, 89.38941955566406, 97.34304809570312, 105.29667663574219, 113.25031280517578, 121.20394134521484, 129.15756225585938, 137.1112060546875, 145.06483459472656, 153.01846313476562, 160.9720916748047, 168.92572021484375, 176.8793487548828, 184.83297729492188, 192.78662109375, 200.74024963378906, 208.69387817382812, 216.6475067138672, 224.60113525390625, 232.5547637939453, 240.50839233398438, 248.4620361328125, 256.4156494140625, 264.3692932128906, 272.3229064941406, 280.27655029296875, 288.23016357421875, 296.1838073730469, 304.1374206542969, 312.091064453125, 320.044677734375, 327.9983215332031, 335.95196533203125, 343.9056091308594, 351.8592224121094, 359.8128662109375, 367.7664794921875, 375.7201232910156, 383.6737365722656, 391.62738037109375, 399.58099365234375]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 14.0, 6.0, 14.0, 7.0, 12.0, 14.0, 17.0, 25.0, 22.0, 16.0, 30.0, 33.0, 27.0, 36.0, 26.0, 37.0, 28.0, 50.0, 36.0, 38.0, 38.0, 32.0, 41.0, 31.0, 43.0, 43.0, 30.0, 23.0, 27.0, 29.0, 24.0, 23.0, 17.0, 19.0, 17.0, 6.0, 13.0, 11.0, 5.0, 11.0, 4.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-146.58441162109375, -142.41366577148438, -138.242919921875, -134.07217407226562, -129.9014129638672, -125.73066711425781, -121.55992126464844, -117.38917541503906, -113.21842956542969, -109.04768371582031, -104.8769302368164, -100.70618438720703, -96.53543853759766, -92.36468505859375, -88.19393920898438, -84.023193359375, -79.8524398803711, -75.68169403076172, -71.51094055175781, -67.34019470214844, -63.16944885253906, -58.99869918823242, -54.82794952392578, -50.657203674316406, -46.486454010009766, -42.315704345703125, -38.14495849609375, -33.97420883178711, -29.8034610748291, -25.632713317871094, -21.461963653564453, -17.291215896606445, -13.120468139648438, -8.94972038269043, -4.7789716720581055, -0.6082229614257812, 3.5625247955322266, 7.733272552490234, 11.904022216796875, 16.074769973754883, 20.24551773071289, 24.4162654876709, 28.587013244628906, 32.75776290893555, 36.92851257324219, 41.09925842285156, 45.2700080871582, 49.440757751464844, 53.61150360107422, 57.78225326538086, 61.952999114990234, 66.12374877929688, 70.29449462890625, 74.46524047851562, 78.63599395751953, 82.8067398071289, 86.97749328613281, 91.14823913574219, 95.3189926147461, 99.48973846435547, 103.66048431396484, 107.83123779296875, 112.00198364257812, 116.1727294921875, 120.34347534179688]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 8.0, 9.0, 6.0, 9.0, 15.0, 17.0, 12.0, 17.0, 12.0, 20.0, 33.0, 24.0, 45.0, 34.0, 44.0, 37.0, 34.0, 44.0, 51.0, 37.0, 52.0, 48.0, 40.0, 48.0, 33.0, 31.0, 34.0, 27.0, 25.0, 23.0, 17.0, 23.0, 14.0, 15.0, 14.0, 11.0, 7.0, 4.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.5625, -14.1263427734375, -13.690185546875, -13.2540283203125, -12.81787109375, -12.3817138671875, -11.945556640625, -11.5093994140625, -11.0732421875, -10.6370849609375, -10.200927734375, -9.7647705078125, -9.32861328125, -8.8924560546875, -8.456298828125, -8.0201416015625, -7.583984375, -7.1478271484375, -6.711669921875, -6.2755126953125, -5.83935546875, -5.4031982421875, -4.967041015625, -4.5308837890625, -4.0947265625, -3.6585693359375, -3.222412109375, -2.7862548828125, -2.35009765625, -1.9139404296875, -1.477783203125, -1.0416259765625, -0.60546875, -0.1693115234375, 0.266845703125, 0.7030029296875, 1.13916015625, 1.5753173828125, 2.011474609375, 2.4476318359375, 2.8837890625, 3.3199462890625, 3.756103515625, 4.1922607421875, 4.62841796875, 5.0645751953125, 5.500732421875, 5.9368896484375, 6.373046875, 6.8092041015625, 7.245361328125, 7.6815185546875, 8.11767578125, 8.5538330078125, 8.989990234375, 9.4261474609375, 9.8623046875, 10.2984619140625, 10.734619140625, 11.1707763671875, 11.60693359375, 12.0430908203125, 12.479248046875, 12.9154052734375, 13.3515625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 12.0, 21.0, 37.0, 32.0, 76.0, 85.0, 152.0, 190.0, 340.0, 472.0, 732.0, 1124.0, 1668.0, 2568.0, 3943.0, 6373.0, 10166.0, 16449.0, 26981.0, 45971.0, 82878.0, 167316.0, 351534.0, 146170.0, 74871.0, 42299.0, 24926.0, 15132.0, 9316.0, 5873.0, 3807.0, 2426.0, 1564.0, 1011.0, 657.0, 441.0, 303.0, 211.0, 135.0, 92.0, 60.0, 43.0, 28.0, 20.0, 13.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.83984375, -3.724945068359375, -3.61004638671875, -3.495147705078125, -3.3802490234375, -3.265350341796875, -3.15045166015625, -3.035552978515625, -2.920654296875, -2.805755615234375, -2.69085693359375, -2.575958251953125, -2.4610595703125, -2.346160888671875, -2.23126220703125, -2.116363525390625, -2.00146484375, -1.886566162109375, -1.77166748046875, -1.656768798828125, -1.5418701171875, -1.426971435546875, -1.31207275390625, -1.197174072265625, -1.082275390625, -0.967376708984375, -0.85247802734375, -0.737579345703125, -0.6226806640625, -0.507781982421875, -0.39288330078125, -0.277984619140625, -0.1630859375, -0.048187255859375, 0.06671142578125, 0.181610107421875, 0.2965087890625, 0.411407470703125, 0.52630615234375, 0.641204833984375, 0.756103515625, 0.871002197265625, 0.98590087890625, 1.100799560546875, 1.2156982421875, 1.330596923828125, 1.44549560546875, 1.560394287109375, 1.67529296875, 1.790191650390625, 1.90509033203125, 2.019989013671875, 2.1348876953125, 2.249786376953125, 2.36468505859375, 2.479583740234375, 2.594482421875, 2.709381103515625, 2.82427978515625, 2.939178466796875, 3.0540771484375, 3.168975830078125, 3.28387451171875, 3.398773193359375, 3.513671875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 9.0, 5.0, 9.0, 12.0, 13.0, 9.0, 28.0, 15.0, 24.0, 37.0, 25.0, 31.0, 19.0, 19.0, 34.0, 34.0, 38.0, 33.0, 41.0, 1071.0, 45.0, 50.0, 51.0, 44.0, 45.0, 30.0, 28.0, 32.0, 25.0, 26.0, 23.0, 18.0, 13.0, 14.0, 9.0, 11.0, 10.0, 12.0, 9.0, 10.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.25, -8.9835205078125, -8.717041015625, -8.4505615234375, -8.18408203125, -7.9176025390625, -7.651123046875, -7.3846435546875, -7.1181640625, -6.8516845703125, -6.585205078125, -6.3187255859375, -6.05224609375, -5.7857666015625, -5.519287109375, -5.2528076171875, -4.986328125, -4.7198486328125, -4.453369140625, -4.1868896484375, -3.92041015625, -3.6539306640625, -3.387451171875, -3.1209716796875, -2.8544921875, -2.5880126953125, -2.321533203125, -2.0550537109375, -1.78857421875, -1.5220947265625, -1.255615234375, -0.9891357421875, -0.72265625, -0.4561767578125, -0.189697265625, 0.0767822265625, 0.34326171875, 0.6097412109375, 0.876220703125, 1.1427001953125, 1.4091796875, 1.6756591796875, 1.942138671875, 2.2086181640625, 2.47509765625, 2.7415771484375, 3.008056640625, 3.2745361328125, 3.541015625, 3.8074951171875, 4.073974609375, 4.3404541015625, 4.60693359375, 4.8734130859375, 5.139892578125, 5.4063720703125, 5.6728515625, 5.9393310546875, 6.205810546875, 6.4722900390625, 6.73876953125, 7.0052490234375, 7.271728515625, 7.5382080078125, 7.8046875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 10.0, 6.0, 12.0, 21.0, 25.0, 33.0, 53.0, 77.0, 125.0, 175.0, 255.0, 356.0, 527.0, 819.0, 1208.0, 1914.0, 2899.0, 4540.0, 7279.0, 11503.0, 18977.0, 30817.0, 50601.0, 88060.0, 187114.0, 1393812.0, 124630.0, 66532.0, 39457.0, 24399.0, 14969.0, 9272.0, 5997.0, 3734.0, 2259.0, 1512.0, 1028.0, 677.0, 458.0, 302.0, 205.0, 142.0, 117.0, 65.0, 47.0, 41.0, 23.0, 20.0, 7.0, 7.0, 6.0, 7.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.4609375, -3.3502197265625, -3.239501953125, -3.1287841796875, -3.01806640625, -2.9073486328125, -2.796630859375, -2.6859130859375, -2.5751953125, -2.4644775390625, -2.353759765625, -2.2430419921875, -2.13232421875, -2.0216064453125, -1.910888671875, -1.8001708984375, -1.689453125, -1.5787353515625, -1.468017578125, -1.3572998046875, -1.24658203125, -1.1358642578125, -1.025146484375, -0.9144287109375, -0.8037109375, -0.6929931640625, -0.582275390625, -0.4715576171875, -0.36083984375, -0.2501220703125, -0.139404296875, -0.0286865234375, 0.08203125, 0.1927490234375, 0.303466796875, 0.4141845703125, 0.52490234375, 0.6356201171875, 0.746337890625, 0.8570556640625, 0.9677734375, 1.0784912109375, 1.189208984375, 1.2999267578125, 1.41064453125, 1.5213623046875, 1.632080078125, 1.7427978515625, 1.853515625, 1.9642333984375, 2.074951171875, 2.1856689453125, 2.29638671875, 2.4071044921875, 2.517822265625, 2.6285400390625, 2.7392578125, 2.8499755859375, 2.960693359375, 3.0714111328125, 3.18212890625, 3.2928466796875, 3.403564453125, 3.5142822265625, 3.625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 7.0, 17.0, 15.0, 17.0, 24.0, 39.0, 42.0, 67.0, 69.0, 135.0, 139.0, 113.0, 92.0, 58.0, 34.0, 36.0, 16.0, 18.0, 16.0, 11.0, 7.0, 10.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00275421142578125, -0.002669215202331543, -0.002584218978881836, -0.002499222755432129, -0.002414226531982422, -0.002329230308532715, -0.002244234085083008, -0.0021592378616333008, -0.0020742416381835938, -0.0019892454147338867, -0.0019042491912841797, -0.0018192529678344727, -0.0017342567443847656, -0.0016492605209350586, -0.0015642642974853516, -0.0014792680740356445, -0.0013942718505859375, -0.0013092756271362305, -0.0012242794036865234, -0.0011392831802368164, -0.0010542869567871094, -0.0009692907333374023, -0.0008842945098876953, -0.0007992982864379883, -0.0007143020629882812, -0.0006293058395385742, -0.0005443096160888672, -0.00045931339263916016, -0.0003743171691894531, -0.0002893209457397461, -0.00020432472229003906, -0.00011932849884033203, -3.4332275390625e-05, 5.066394805908203e-05, 0.00013566017150878906, 0.0002206563949584961, 0.0003056526184082031, 0.00039064884185791016, 0.0004756450653076172, 0.0005606412887573242, 0.0006456375122070312, 0.0007306337356567383, 0.0008156299591064453, 0.0009006261825561523, 0.0009856224060058594, 0.0010706186294555664, 0.0011556148529052734, 0.0012406110763549805, 0.0013256072998046875, 0.0014106035232543945, 0.0014955997467041016, 0.0015805959701538086, 0.0016655921936035156, 0.0017505884170532227, 0.0018355846405029297, 0.0019205808639526367, 0.0020055770874023438, 0.0020905733108520508, 0.002175569534301758, 0.002260565757751465, 0.002345561981201172, 0.002430558204650879, 0.002515554428100586, 0.002600550651550293, 0.002685546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 8.0, 12.0, 16.0, 24.0, 36.0, 35.0, 83.0, 138.0, 395.0, 6256.0, 1040400.0, 601.0, 244.0, 113.0, 53.0, 39.0, 28.0, 20.0, 13.0, 9.0, 5.0, 7.0, 7.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08197021484375, -0.079345703125, -0.07672119140625, -0.0740966796875, -0.07147216796875, -0.06884765625, -0.06622314453125, -0.0635986328125, -0.06097412109375, -0.058349609375, -0.05572509765625, -0.0531005859375, -0.05047607421875, -0.0478515625, -0.04522705078125, -0.0426025390625, -0.03997802734375, -0.037353515625, -0.03472900390625, -0.0321044921875, -0.02947998046875, -0.02685546875, -0.02423095703125, -0.0216064453125, -0.01898193359375, -0.016357421875, -0.01373291015625, -0.0111083984375, -0.00848388671875, -0.005859375, -0.00323486328125, -0.0006103515625, 0.00201416015625, 0.004638671875, 0.00726318359375, 0.0098876953125, 0.01251220703125, 0.01513671875, 0.01776123046875, 0.0203857421875, 0.02301025390625, 0.025634765625, 0.02825927734375, 0.0308837890625, 0.03350830078125, 0.0361328125, 0.03875732421875, 0.0413818359375, 0.04400634765625, 0.046630859375, 0.04925537109375, 0.0518798828125, 0.05450439453125, 0.05712890625, 0.05975341796875, 0.0623779296875, 0.06500244140625, 0.067626953125, 0.07025146484375, 0.0728759765625, 0.07550048828125, 0.078125, 0.08074951171875, 0.0833740234375, 0.08599853515625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [98.0, 893.0, 30.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044345547212287784, -0.00013266719179227948, 0.00017812108853831887, 0.0004889093688689172, 0.0007996976491995156, 0.0011104859877377748, 0.0014212741516530514, 0.001732062315568328, 0.002042850712314248, 0.0023536388762295246, 0.002664427272975445, 0.002975215669721365, 0.0032860038336366415, 0.003596791997551918, 0.003907580394297838, 0.004218368791043758, 0.004529157187789679, 0.004839945584535599, 0.005150733515620232, 0.005461521912366152, 0.005772310309112072, 0.006083098705857992, 0.006393887102603912, 0.006704675033688545, 0.007015463430434465, 0.007326251827180386, 0.0076370397582650185, 0.007947828620672226, 0.008258616551756859, 0.008569404482841492, 0.0088801933452487, 0.009190981276333332, 0.00950177013874054, 0.009812558069825172, 0.01012334693223238, 0.010434134863317013, 0.01074492372572422, 0.011055711656808853, 0.011366499587893486, 0.011677287518978119, 0.011988076381385326, 0.01229886431246996, 0.012609653174877167, 0.0129204411059618, 0.013231229037046432, 0.01354201789945364, 0.013852805830538273, 0.01416359469294548, 0.014474382624030113, 0.014785170555114746, 0.015095959417521954, 0.015406747348606586, 0.015717536211013794, 0.016028324142098427, 0.01633911207318306, 0.016649900004267693, 0.016960687935352325, 0.01727147586643696, 0.01758226379752159, 0.017893053591251373, 0.018203841522336006, 0.01851462945342064, 0.018825417384505272, 0.019136205315589905, 0.019446995109319687]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 0.0, 6.0, 5.0, 7.0, 6.0, 4.0, 8.0, 18.0, 19.0, 22.0, 10.0, 17.0, 27.0, 24.0, 31.0, 33.0, 37.0, 39.0, 35.0, 41.0, 37.0, 38.0, 33.0, 37.0, 47.0, 46.0, 40.0, 35.0, 38.0, 29.0, 36.0, 29.0, 22.0, 23.0, 11.0, 23.0, 15.0, 16.0, 9.0, 10.0, 9.0, 5.0, 5.0, 4.0, 7.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009142756462097168, -0.0008855815976858139, -0.000856887549161911, -0.0008281935006380081, -0.0007994994521141052, -0.0007708054035902023, -0.0007421113550662994, -0.0007134173065423965, -0.0006847232580184937, -0.0006560292094945908, -0.0006273351609706879, -0.000598641112446785, -0.0005699470639228821, -0.0005412530153989792, -0.0005125589668750763, -0.0004838649183511734, -0.0004551708698272705, -0.0004264768213033676, -0.0003977827727794647, -0.00036908872425556183, -0.00034039467573165894, -0.00031170062720775604, -0.00028300657868385315, -0.00025431253015995026, -0.00022561848163604736, -0.00019692443311214447, -0.00016823038458824158, -0.00013953633606433868, -0.00011084228754043579, -8.21482390165329e-05, -5.3454190492630005e-05, -2.4760141968727112e-05, 3.933906555175781e-06, 3.2627955079078674e-05, 6.132200360298157e-05, 9.001605212688446e-05, 0.00011871010065078735, 0.00014740414917469025, 0.00017609819769859314, 0.00020479224622249603, 0.00023348629474639893, 0.0002621803432703018, 0.0002908743917942047, 0.0003195684403181076, 0.0003482624888420105, 0.0003769565373659134, 0.0004056505858898163, 0.0004343446344137192, 0.00046303868293762207, 0.000491732731461525, 0.0005204267799854279, 0.0005491208285093307, 0.0005778148770332336, 0.0006065089255571365, 0.0006352029740810394, 0.0006638970226049423, 0.0006925910711288452, 0.0007212851196527481, 0.000749979168176651, 0.0007786732167005539, 0.0008073672652244568, 0.0008360613137483597, 0.0008647553622722626, 0.0008934494107961655, 0.0009221434593200684]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 8.0, 9.0, 6.0, 9.0, 15.0, 17.0, 12.0, 17.0, 12.0, 19.0, 34.0, 24.0, 45.0, 34.0, 44.0, 37.0, 34.0, 44.0, 51.0, 37.0, 52.0, 48.0, 40.0, 48.0, 33.0, 31.0, 34.0, 27.0, 25.0, 23.0, 17.0, 23.0, 14.0, 15.0, 14.0, 11.0, 7.0, 4.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.5625, -14.1263427734375, -13.690185546875, -13.2540283203125, -12.81787109375, -12.3817138671875, -11.945556640625, -11.5093994140625, -11.0732421875, -10.6370849609375, -10.200927734375, -9.7647705078125, -9.32861328125, -8.8924560546875, -8.456298828125, -8.0201416015625, -7.583984375, -7.1478271484375, -6.711669921875, -6.2755126953125, -5.83935546875, -5.4031982421875, -4.967041015625, -4.5308837890625, -4.0947265625, -3.6585693359375, -3.222412109375, -2.7862548828125, -2.35009765625, -1.9139404296875, -1.477783203125, -1.0416259765625, -0.60546875, -0.1693115234375, 0.266845703125, 0.7030029296875, 1.13916015625, 1.5753173828125, 2.011474609375, 2.4476318359375, 2.8837890625, 3.3199462890625, 3.756103515625, 4.1922607421875, 4.62841796875, 5.0645751953125, 5.500732421875, 5.9368896484375, 6.373046875, 6.8092041015625, 7.245361328125, 7.6815185546875, 8.11767578125, 8.5538330078125, 8.989990234375, 9.4261474609375, 9.8623046875, 10.2984619140625, 10.734619140625, 11.1707763671875, 11.60693359375, 12.0430908203125, 12.479248046875, 12.9154052734375, 13.3515625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 7.0, 12.0, 12.0, 20.0, 34.0, 30.0, 56.0, 93.0, 154.0, 293.0, 483.0, 910.0, 1612.0, 3190.0, 6663.0, 16346.0, 49238.0, 187190.0, 483830.0, 211518.0, 54649.0, 17736.0, 7203.0, 3336.0, 1674.0, 951.0, 536.0, 285.0, 173.0, 119.0, 67.0, 29.0, 25.0, 22.0, 13.0, 9.0, 3.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.0, -8.731689453125, -8.46337890625, -8.195068359375, -7.9267578125, -7.658447265625, -7.39013671875, -7.121826171875, -6.853515625, -6.585205078125, -6.31689453125, -6.048583984375, -5.7802734375, -5.511962890625, -5.24365234375, -4.975341796875, -4.70703125, -4.438720703125, -4.17041015625, -3.902099609375, -3.6337890625, -3.365478515625, -3.09716796875, -2.828857421875, -2.560546875, -2.292236328125, -2.02392578125, -1.755615234375, -1.4873046875, -1.218994140625, -0.95068359375, -0.682373046875, -0.4140625, -0.145751953125, 0.12255859375, 0.390869140625, 0.6591796875, 0.927490234375, 1.19580078125, 1.464111328125, 1.732421875, 2.000732421875, 2.26904296875, 2.537353515625, 2.8056640625, 3.073974609375, 3.34228515625, 3.610595703125, 3.87890625, 4.147216796875, 4.41552734375, 4.683837890625, 4.9521484375, 5.220458984375, 5.48876953125, 5.757080078125, 6.025390625, 6.293701171875, 6.56201171875, 6.830322265625, 7.0986328125, 7.366943359375, 7.63525390625, 7.903564453125, 8.171875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 13.0, 14.0, 12.0, 20.0, 22.0, 31.0, 25.0, 27.0, 24.0, 36.0, 34.0, 38.0, 50.0, 46.0, 87.0, 1726.0, 354.0, 69.0, 31.0, 47.0, 41.0, 38.0, 31.0, 41.0, 23.0, 29.0, 17.0, 14.0, 15.0, 22.0, 3.0, 9.0, 10.0, 6.0, 5.0, 5.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.78125, -48.21923828125, -46.6572265625, -45.09521484375, -43.533203125, -41.97119140625, -40.4091796875, -38.84716796875, -37.28515625, -35.72314453125, -34.1611328125, -32.59912109375, -31.037109375, -29.47509765625, -27.9130859375, -26.35107421875, -24.7890625, -23.22705078125, -21.6650390625, -20.10302734375, -18.541015625, -16.97900390625, -15.4169921875, -13.85498046875, -12.29296875, -10.73095703125, -9.1689453125, -7.60693359375, -6.044921875, -4.48291015625, -2.9208984375, -1.35888671875, 0.203125, 1.76513671875, 3.3271484375, 4.88916015625, 6.451171875, 8.01318359375, 9.5751953125, 11.13720703125, 12.69921875, 14.26123046875, 15.8232421875, 17.38525390625, 18.947265625, 20.50927734375, 22.0712890625, 23.63330078125, 25.1953125, 26.75732421875, 28.3193359375, 29.88134765625, 31.443359375, 33.00537109375, 34.5673828125, 36.12939453125, 37.69140625, 39.25341796875, 40.8154296875, 42.37744140625, 43.939453125, 45.50146484375, 47.0634765625, 48.62548828125, 50.1875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 7.0, 13.0, 5.0, 16.0, 16.0, 16.0, 20.0, 38.0, 42.0, 59.0, 70.0, 97.0, 157.0, 250.0, 533.0, 1684.0, 323725.0, 2814901.0, 2503.0, 587.0, 289.0, 203.0, 112.0, 68.0, 54.0, 34.0, 34.0, 37.0, 20.0, 20.0, 16.0, 15.0, 10.0, 7.0, 5.0, 3.0, 8.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.125, -78.515625, -75.90625, -73.296875, -70.6875, -68.078125, -65.46875, -62.859375, -60.25, -57.640625, -55.03125, -52.421875, -49.8125, -47.203125, -44.59375, -41.984375, -39.375, -36.765625, -34.15625, -31.546875, -28.9375, -26.328125, -23.71875, -21.109375, -18.5, -15.890625, -13.28125, -10.671875, -8.0625, -5.453125, -2.84375, -0.234375, 2.375, 4.984375, 7.59375, 10.203125, 12.8125, 15.421875, 18.03125, 20.640625, 23.25, 25.859375, 28.46875, 31.078125, 33.6875, 36.296875, 38.90625, 41.515625, 44.125, 46.734375, 49.34375, 51.953125, 54.5625, 57.171875, 59.78125, 62.390625, 65.0, 67.609375, 70.21875, 72.828125, 75.4375, 78.046875, 80.65625, 83.265625, 85.875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 200.0, 743.0, 62.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.77931213378906, -132.55543518066406, -125.3315658569336, -118.10769653320312, -110.88381958007812, -103.65994262695312, -96.43607330322266, -89.21220397949219, -81.98832702636719, -74.76445007324219, -67.54058074951172, -60.316707611083984, -53.09283447265625, -45.868961334228516, -38.64508819580078, -31.421215057373047, -24.197341918945312, -16.973468780517578, -9.749595642089844, -2.5257225036621094, 4.698150634765625, 11.92202377319336, 19.145896911621094, 26.369770050048828, 33.59364318847656, 40.8175163269043, 48.04138946533203, 55.265262603759766, 62.4891357421875, 69.7130126953125, 76.93688201904297, 84.16075134277344, 91.3846435546875, 98.6085205078125, 105.83238983154297, 113.05625915527344, 120.28013610839844, 127.50401306152344, 134.72787475585938, 141.95175170898438, 149.17562866210938, 156.39950561523438, 163.62338256835938, 170.8472442626953, 178.0711212158203, 185.2949981689453, 192.51885986328125, 199.74273681640625, 206.96661376953125, 214.19049072265625, 221.41436767578125, 228.6382293701172, 235.8621063232422, 243.0859832763672, 250.30984497070312, 257.5337219238281, 264.7575988769531, 271.9814758300781, 279.2053527832031, 286.4292297363281, 293.653076171875, 300.876953125, 308.100830078125, 315.32470703125, 322.548583984375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 3.0, 7.0, 4.0, 9.0, 7.0, 14.0, 7.0, 21.0, 20.0, 24.0, 26.0, 33.0, 29.0, 33.0, 44.0, 36.0, 44.0, 35.0, 39.0, 36.0, 57.0, 52.0, 48.0, 48.0, 37.0, 30.0, 25.0, 35.0, 28.0, 35.0, 19.0, 25.0, 14.0, 13.0, 8.0, 16.0, 10.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-165.99197387695312, -160.6900177001953, -155.3880615234375, -150.0861053466797, -144.78414916992188, -139.48219299316406, -134.18023681640625, -128.87828063964844, -123.57632446289062, -118.27436828613281, -112.972412109375, -107.67045593261719, -102.36849975585938, -97.06654357910156, -91.76458740234375, -86.46263122558594, -81.16067504882812, -75.85871887207031, -70.5567626953125, -65.25480651855469, -59.952850341796875, -54.65089416503906, -49.34893798828125, -44.04698181152344, -38.745025634765625, -33.44306945800781, -28.14111328125, -22.839157104492188, -17.537200927734375, -12.235244750976562, -6.93328857421875, -1.6313323974609375, 3.6706085205078125, 8.972564697265625, 14.274520874023438, 19.57647705078125, 24.878433227539062, 30.180389404296875, 35.48234558105469, 40.7843017578125, 46.08625793457031, 51.388214111328125, 56.69017028808594, 61.99212646484375, 67.29408264160156, 72.59603881835938, 77.89799499511719, 83.199951171875, 88.50190734863281, 93.80386352539062, 99.10581970214844, 104.40777587890625, 109.70973205566406, 115.01168823242188, 120.31364440917969, 125.6156005859375, 130.9175567626953, 136.21951293945312, 141.52146911621094, 146.82342529296875, 152.12538146972656, 157.42733764648438, 162.7292938232422, 168.03125, 173.3332061767578]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 10.0, 10.0, 5.0, 8.0, 9.0, 11.0, 17.0, 13.0, 17.0, 10.0, 20.0, 26.0, 31.0, 32.0, 36.0, 29.0, 45.0, 28.0, 40.0, 46.0, 45.0, 50.0, 41.0, 47.0, 34.0, 40.0, 32.0, 34.0, 28.0, 23.0, 25.0, 26.0, 18.0, 20.0, 19.0, 14.0, 10.0, 13.0, 8.0, 5.0, 7.0, 5.0, 4.0, 7.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-14.25, -13.8330078125, -13.416015625, -12.9990234375, -12.58203125, -12.1650390625, -11.748046875, -11.3310546875, -10.9140625, -10.4970703125, -10.080078125, -9.6630859375, -9.24609375, -8.8291015625, -8.412109375, -7.9951171875, -7.578125, -7.1611328125, -6.744140625, -6.3271484375, -5.91015625, -5.4931640625, -5.076171875, -4.6591796875, -4.2421875, -3.8251953125, -3.408203125, -2.9912109375, -2.57421875, -2.1572265625, -1.740234375, -1.3232421875, -0.90625, -0.4892578125, -0.072265625, 0.3447265625, 0.76171875, 1.1787109375, 1.595703125, 2.0126953125, 2.4296875, 2.8466796875, 3.263671875, 3.6806640625, 4.09765625, 4.5146484375, 4.931640625, 5.3486328125, 5.765625, 6.1826171875, 6.599609375, 7.0166015625, 7.43359375, 7.8505859375, 8.267578125, 8.6845703125, 9.1015625, 9.5185546875, 9.935546875, 10.3525390625, 10.76953125, 11.1865234375, 11.603515625, 12.0205078125, 12.4375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 7.0, 9.0, 5.0, 12.0, 14.0, 11.0, 19.0, 20.0, 26.0, 35.0, 46.0, 45.0, 55.0, 101.0, 175.0, 409.0, 1609.0, 15178.0, 331415.0, 3072804.0, 736416.0, 31809.0, 2742.0, 583.0, 215.0, 121.0, 92.0, 46.0, 34.0, 38.0, 18.0, 31.0, 23.0, 15.0, 17.0, 10.0, 9.0, 8.0, 9.0, 7.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-40.34375, -39.14404296875, -37.9443359375, -36.74462890625, -35.544921875, -34.34521484375, -33.1455078125, -31.94580078125, -30.74609375, -29.54638671875, -28.3466796875, -27.14697265625, -25.947265625, -24.74755859375, -23.5478515625, -22.34814453125, -21.1484375, -19.94873046875, -18.7490234375, -17.54931640625, -16.349609375, -15.14990234375, -13.9501953125, -12.75048828125, -11.55078125, -10.35107421875, -9.1513671875, -7.95166015625, -6.751953125, -5.55224609375, -4.3525390625, -3.15283203125, -1.953125, -0.75341796875, 0.4462890625, 1.64599609375, 2.845703125, 4.04541015625, 5.2451171875, 6.44482421875, 7.64453125, 8.84423828125, 10.0439453125, 11.24365234375, 12.443359375, 13.64306640625, 14.8427734375, 16.04248046875, 17.2421875, 18.44189453125, 19.6416015625, 20.84130859375, 22.041015625, 23.24072265625, 24.4404296875, 25.64013671875, 26.83984375, 28.03955078125, 29.2392578125, 30.43896484375, 31.638671875, 32.83837890625, 34.0380859375, 35.23779296875, 36.4375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 9.0, 10.0, 19.0, 25.0, 41.0, 49.0, 57.0, 90.0, 131.0, 171.0, 277.0, 376.0, 522.0, 565.0, 474.0, 338.0, 258.0, 190.0, 111.0, 88.0, 68.0, 59.0, 42.0, 25.0, 18.0, 14.0, 6.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-51.0625, -49.69873046875, -48.3349609375, -46.97119140625, -45.607421875, -44.24365234375, -42.8798828125, -41.51611328125, -40.15234375, -38.78857421875, -37.4248046875, -36.06103515625, -34.697265625, -33.33349609375, -31.9697265625, -30.60595703125, -29.2421875, -27.87841796875, -26.5146484375, -25.15087890625, -23.787109375, -22.42333984375, -21.0595703125, -19.69580078125, -18.33203125, -16.96826171875, -15.6044921875, -14.24072265625, -12.876953125, -11.51318359375, -10.1494140625, -8.78564453125, -7.421875, -6.05810546875, -4.6943359375, -3.33056640625, -1.966796875, -0.60302734375, 0.7607421875, 2.12451171875, 3.48828125, 4.85205078125, 6.2158203125, 7.57958984375, 8.943359375, 10.30712890625, 11.6708984375, 13.03466796875, 14.3984375, 15.76220703125, 17.1259765625, 18.48974609375, 19.853515625, 21.21728515625, 22.5810546875, 23.94482421875, 25.30859375, 26.67236328125, 28.0361328125, 29.39990234375, 30.763671875, 32.12744140625, 33.4912109375, 34.85498046875, 36.21875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 12.0, 12.0, 13.0, 24.0, 31.0, 55.0, 77.0, 81.0, 151.0, 216.0, 378.0, 927.0, 16052.0, 4169314.0, 5173.0, 758.0, 341.0, 210.0, 143.0, 86.0, 68.0, 52.0, 32.0, 13.0, 15.0, 14.0, 2.0, 14.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.125, -179.759765625, -172.39453125, -165.029296875, -157.6640625, -150.298828125, -142.93359375, -135.568359375, -128.203125, -120.837890625, -113.47265625, -106.107421875, -98.7421875, -91.376953125, -84.01171875, -76.646484375, -69.28125, -61.916015625, -54.55078125, -47.185546875, -39.8203125, -32.455078125, -25.08984375, -17.724609375, -10.359375, -2.994140625, 4.37109375, 11.736328125, 19.1015625, 26.466796875, 33.83203125, 41.197265625, 48.5625, 55.927734375, 63.29296875, 70.658203125, 78.0234375, 85.388671875, 92.75390625, 100.119140625, 107.484375, 114.849609375, 122.21484375, 129.580078125, 136.9453125, 144.310546875, 151.67578125, 159.041015625, 166.40625, 173.771484375, 181.13671875, 188.501953125, 195.8671875, 203.232421875, 210.59765625, 217.962890625, 225.328125, 232.693359375, 240.05859375, 247.423828125, 254.7890625, 262.154296875, 269.51953125, 276.884765625, 284.25]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 16.0, 25.0, 78.0, 151.0, 207.0, 223.0, 169.0, 76.0, 35.0, 17.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.46455383300781, -102.0787582397461, -95.69295501708984, -89.30715942382812, -82.92135620117188, -76.53556060791016, -70.14976501464844, -63.76396560668945, -57.37816619873047, -50.992366790771484, -44.6065673828125, -38.22077178955078, -31.834972381591797, -25.449172973632812, -19.063377380371094, -12.67757797241211, -6.291778564453125, 0.09401988983154297, 6.479818344116211, 12.865615844726562, 19.251415252685547, 25.63721466064453, 32.02301025390625, 38.408809661865234, 44.79460906982422, 51.1804084777832, 57.56620788574219, 63.952003479003906, 70.33779907226562, 76.72360229492188, 83.1093978881836, 89.49519348144531, 95.8809814453125, 102.26677703857422, 108.65258026123047, 115.03837585449219, 121.42417907714844, 127.80997467041016, 134.19577026367188, 140.58157348632812, 146.96737670898438, 153.35317993164062, 159.7389678955078, 166.12477111816406, 172.5105743408203, 178.8963623046875, 185.28216552734375, 191.66796875, 198.0537567138672, 204.43955993652344, 210.82534790039062, 217.21115112304688, 223.59695434570312, 229.98275756835938, 236.36854553222656, 242.7543487548828, 249.14013671875, 255.52593994140625, 261.9117431640625, 268.29754638671875, 274.6833190917969, 281.0691223144531, 287.4549255371094, 293.8407287597656, 300.2265319824219]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 4.0, 7.0, 9.0, 14.0, 12.0, 21.0, 20.0, 29.0, 22.0, 24.0, 33.0, 46.0, 41.0, 42.0, 42.0, 47.0, 50.0, 53.0, 52.0, 58.0, 45.0, 42.0, 34.0, 37.0, 33.0, 28.0, 33.0, 21.0, 20.0, 15.0, 16.0, 9.0, 13.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-162.5196533203125, -157.79641723632812, -153.07318115234375, -148.34994506835938, -143.626708984375, -138.90347290039062, -134.18023681640625, -129.45700073242188, -124.7337646484375, -120.01052856445312, -115.28729248046875, -110.56405639648438, -105.8408203125, -101.11758422851562, -96.39434814453125, -91.67111206054688, -86.94788360595703, -82.22464752197266, -77.50141143798828, -72.7781753540039, -68.05493927001953, -63.331703186035156, -58.60847091674805, -53.88523483276367, -49.1619987487793, -44.43876266479492, -39.71552658081055, -34.99229431152344, -30.26905632019043, -25.545820236206055, -20.822586059570312, -16.099349975585938, -11.376113891601562, -6.652878284454346, -1.929642677307129, 2.7935924530029297, 7.516828536987305, 12.24006462097168, 16.963298797607422, 21.686534881591797, 26.409770965576172, 31.133007049560547, 35.85624313354492, 40.57947540283203, 45.302711486816406, 50.02594757080078, 54.749183654785156, 59.47241973876953, 64.1956558227539, 68.91889190673828, 73.64212799072266, 78.36536407470703, 83.0886001586914, 87.81183624267578, 92.53506469726562, 97.25830078125, 101.98153686523438, 106.70477294921875, 111.42800903320312, 116.1512451171875, 120.87448120117188, 125.59771728515625, 130.32095336914062, 135.044189453125, 139.76742553710938]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 8.0, 7.0, 11.0, 9.0, 11.0, 19.0, 18.0, 14.0, 21.0, 29.0, 32.0, 31.0, 39.0, 29.0, 39.0, 43.0, 46.0, 41.0, 43.0, 42.0, 55.0, 39.0, 40.0, 33.0, 30.0, 33.0, 25.0, 25.0, 27.0, 28.0, 15.0, 17.0, 10.0, 13.0, 16.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.640625, -14.206298828125, -13.77197265625, -13.337646484375, -12.9033203125, -12.468994140625, -12.03466796875, -11.600341796875, -11.166015625, -10.731689453125, -10.29736328125, -9.863037109375, -9.4287109375, -8.994384765625, -8.56005859375, -8.125732421875, -7.69140625, -7.257080078125, -6.82275390625, -6.388427734375, -5.9541015625, -5.519775390625, -5.08544921875, -4.651123046875, -4.216796875, -3.782470703125, -3.34814453125, -2.913818359375, -2.4794921875, -2.045166015625, -1.61083984375, -1.176513671875, -0.7421875, -0.307861328125, 0.12646484375, 0.560791015625, 0.9951171875, 1.429443359375, 1.86376953125, 2.298095703125, 2.732421875, 3.166748046875, 3.60107421875, 4.035400390625, 4.4697265625, 4.904052734375, 5.33837890625, 5.772705078125, 6.20703125, 6.641357421875, 7.07568359375, 7.510009765625, 7.9443359375, 8.378662109375, 8.81298828125, 9.247314453125, 9.681640625, 10.115966796875, 10.55029296875, 10.984619140625, 11.4189453125, 11.853271484375, 12.28759765625, 12.721923828125, 13.15625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 7.0, 20.0, 34.0, 31.0, 57.0, 87.0, 113.0, 156.0, 232.0, 340.0, 465.0, 664.0, 980.0, 1376.0, 1982.0, 2947.0, 4098.0, 5863.0, 8669.0, 12875.0, 18888.0, 28531.0, 43839.0, 70135.0, 122292.0, 290517.0, 180886.0, 89904.0, 54911.0, 35202.0, 23032.0, 15585.0, 10384.0, 7259.0, 4918.0, 3371.0, 2390.0, 1664.0, 1165.0, 793.0, 564.0, 418.0, 286.0, 183.0, 134.0, 95.0, 65.0, 37.0, 21.0, 35.0, 19.0, 14.0, 5.0, 6.0, 3.0, 3.0, 1.0], "bins": [-3.08984375, -2.9954833984375, -2.901123046875, -2.8067626953125, -2.71240234375, -2.6180419921875, -2.523681640625, -2.4293212890625, -2.3349609375, -2.2406005859375, -2.146240234375, -2.0518798828125, -1.95751953125, -1.8631591796875, -1.768798828125, -1.6744384765625, -1.580078125, -1.4857177734375, -1.391357421875, -1.2969970703125, -1.20263671875, -1.1082763671875, -1.013916015625, -0.9195556640625, -0.8251953125, -0.7308349609375, -0.636474609375, -0.5421142578125, -0.44775390625, -0.3533935546875, -0.259033203125, -0.1646728515625, -0.0703125, 0.0240478515625, 0.118408203125, 0.2127685546875, 0.30712890625, 0.4014892578125, 0.495849609375, 0.5902099609375, 0.6845703125, 0.7789306640625, 0.873291015625, 0.9676513671875, 1.06201171875, 1.1563720703125, 1.250732421875, 1.3450927734375, 1.439453125, 1.5338134765625, 1.628173828125, 1.7225341796875, 1.81689453125, 1.9112548828125, 2.005615234375, 2.0999755859375, 2.1943359375, 2.2886962890625, 2.383056640625, 2.4774169921875, 2.57177734375, 2.6661376953125, 2.760498046875, 2.8548583984375, 2.94921875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 8.0, 11.0, 7.0, 12.0, 24.0, 32.0, 23.0, 28.0, 30.0, 36.0, 50.0, 40.0, 34.0, 37.0, 49.0, 1062.0, 43.0, 60.0, 53.0, 49.0, 52.0, 37.0, 37.0, 42.0, 32.0, 28.0, 17.0, 21.0, 16.0, 12.0, 8.0, 8.0, 4.0, 2.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.25, -9.9151611328125, -9.580322265625, -9.2454833984375, -8.91064453125, -8.5758056640625, -8.240966796875, -7.9061279296875, -7.5712890625, -7.2364501953125, -6.901611328125, -6.5667724609375, -6.23193359375, -5.8970947265625, -5.562255859375, -5.2274169921875, -4.892578125, -4.5577392578125, -4.222900390625, -3.8880615234375, -3.55322265625, -3.2183837890625, -2.883544921875, -2.5487060546875, -2.2138671875, -1.8790283203125, -1.544189453125, -1.2093505859375, -0.87451171875, -0.5396728515625, -0.204833984375, 0.1300048828125, 0.46484375, 0.7996826171875, 1.134521484375, 1.4693603515625, 1.80419921875, 2.1390380859375, 2.473876953125, 2.8087158203125, 3.1435546875, 3.4783935546875, 3.813232421875, 4.1480712890625, 4.48291015625, 4.8177490234375, 5.152587890625, 5.4874267578125, 5.822265625, 6.1571044921875, 6.491943359375, 6.8267822265625, 7.16162109375, 7.4964599609375, 7.831298828125, 8.1661376953125, 8.5009765625, 8.8358154296875, 9.170654296875, 9.5054931640625, 9.84033203125, 10.1751708984375, 10.510009765625, 10.8448486328125, 11.1796875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 6.0, 24.0, 37.0, 36.0, 54.0, 75.0, 114.0, 178.0, 267.0, 431.0, 601.0, 994.0, 1558.0, 2487.0, 4144.0, 6987.0, 12150.0, 21738.0, 39191.0, 72962.0, 145730.0, 1411201.0, 182996.0, 86884.0, 46238.0, 25446.0, 14216.0, 8114.0, 4629.0, 2867.0, 1786.0, 1070.0, 602.0, 404.0, 295.0, 203.0, 139.0, 84.0, 49.0, 40.0, 34.0, 17.0, 15.0, 11.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.390625, -4.256103515625, -4.12158203125, -3.987060546875, -3.8525390625, -3.718017578125, -3.58349609375, -3.448974609375, -3.314453125, -3.179931640625, -3.04541015625, -2.910888671875, -2.7763671875, -2.641845703125, -2.50732421875, -2.372802734375, -2.23828125, -2.103759765625, -1.96923828125, -1.834716796875, -1.7001953125, -1.565673828125, -1.43115234375, -1.296630859375, -1.162109375, -1.027587890625, -0.89306640625, -0.758544921875, -0.6240234375, -0.489501953125, -0.35498046875, -0.220458984375, -0.0859375, 0.048583984375, 0.18310546875, 0.317626953125, 0.4521484375, 0.586669921875, 0.72119140625, 0.855712890625, 0.990234375, 1.124755859375, 1.25927734375, 1.393798828125, 1.5283203125, 1.662841796875, 1.79736328125, 1.931884765625, 2.06640625, 2.200927734375, 2.33544921875, 2.469970703125, 2.6044921875, 2.739013671875, 2.87353515625, 3.008056640625, 3.142578125, 3.277099609375, 3.41162109375, 3.546142578125, 3.6806640625, 3.815185546875, 3.94970703125, 4.084228515625, 4.21875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 12.0, 12.0, 15.0, 31.0, 49.0, 64.0, 72.0, 117.0, 144.0, 129.0, 89.0, 69.0, 49.0, 45.0, 29.0, 20.0, 10.0, 3.0, 11.0, 4.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0047149658203125, -0.004557132720947266, -0.004399299621582031, -0.004241466522216797, -0.0040836334228515625, -0.003925800323486328, -0.0037679672241210938, -0.0036101341247558594, -0.003452301025390625, -0.0032944679260253906, -0.0031366348266601562, -0.002978801727294922, -0.0028209686279296875, -0.002663135528564453, -0.0025053024291992188, -0.0023474693298339844, -0.00218963623046875, -0.0020318031311035156, -0.0018739700317382812, -0.0017161369323730469, -0.0015583038330078125, -0.0014004707336425781, -0.0012426376342773438, -0.0010848045349121094, -0.000926971435546875, -0.0007691383361816406, -0.0006113052368164062, -0.0004534721374511719, -0.0002956390380859375, -0.00013780593872070312, 2.002716064453125e-05, 0.00017786026000976562, 0.000335693359375, 0.0004935264587402344, 0.0006513595581054688, 0.0008091926574707031, 0.0009670257568359375, 0.0011248588562011719, 0.0012826919555664062, 0.0014405250549316406, 0.001598358154296875, 0.0017561912536621094, 0.0019140243530273438, 0.002071857452392578, 0.0022296905517578125, 0.002387523651123047, 0.0025453567504882812, 0.0027031898498535156, 0.00286102294921875, 0.0030188560485839844, 0.0031766891479492188, 0.003334522247314453, 0.0034923553466796875, 0.003650188446044922, 0.0038080215454101562, 0.003965854644775391, 0.004123687744140625, 0.004281520843505859, 0.004439353942871094, 0.004597187042236328, 0.0047550201416015625, 0.004912853240966797, 0.005070686340332031, 0.005228519439697266, 0.0053863525390625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 7.0, 6.0, 11.0, 17.0, 17.0, 38.0, 39.0, 55.0, 112.0, 314.0, 11111.0, 1035982.0, 476.0, 130.0, 81.0, 40.0, 30.0, 24.0, 16.0, 11.0, 10.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14453125, -0.14029693603515625, -0.1360626220703125, -0.13182830810546875, -0.127593994140625, -0.12335968017578125, -0.1191253662109375, -0.11489105224609375, -0.11065673828125, -0.10642242431640625, -0.1021881103515625, -0.09795379638671875, -0.093719482421875, -0.08948516845703125, -0.0852508544921875, -0.08101654052734375, -0.0767822265625, -0.07254791259765625, -0.0683135986328125, -0.06407928466796875, -0.059844970703125, -0.05561065673828125, -0.0513763427734375, -0.04714202880859375, -0.04290771484375, -0.03867340087890625, -0.0344390869140625, -0.03020477294921875, -0.025970458984375, -0.02173614501953125, -0.0175018310546875, -0.01326751708984375, -0.009033203125, -0.00479888916015625, -0.0005645751953125, 0.00366973876953125, 0.007904052734375, 0.01213836669921875, 0.0163726806640625, 0.02060699462890625, 0.02484130859375, 0.02907562255859375, 0.0333099365234375, 0.03754425048828125, 0.041778564453125, 0.04601287841796875, 0.0502471923828125, 0.05448150634765625, 0.0587158203125, 0.06295013427734375, 0.0671844482421875, 0.07141876220703125, 0.075653076171875, 0.07988739013671875, 0.0841217041015625, 0.08835601806640625, 0.09259033203125, 0.09682464599609375, 0.1010589599609375, 0.10529327392578125, 0.109527587890625, 0.11376190185546875, 0.1179962158203125, 0.12223052978515625, 0.12646484375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 437.0, 544.0, 23.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004431617446243763, -0.004155469126999378, -0.0038793208077549934, -0.0036031727213412523, -0.0033270244020968676, -0.003050876082852483, -0.0027747279964387417, -0.002498579677194357, -0.002222431357949972, -0.0019462830387055874, -0.0016701348358765244, -0.0013939866330474615, -0.0011178383138030767, -0.000841689994558692, -0.000565541791729629, -0.0002893935889005661, -1.3245269656181335e-05, 0.0002629029913805425, 0.0005390512524172664, 0.0008151995134539902, 0.001091347774490714, 0.0013674960937350988, 0.0016436442965641618, 0.0019197924993932247, 0.0021959408186376095, 0.0024720891378819942, 0.002748237457126379, 0.00302438554354012, 0.003300533862784505, 0.0035766821820288897, 0.0038528302684426308, 0.0041289785876870155, 0.004405127838253975, 0.00468127615749836, 0.0049574244767427444, 0.005233572795987129, 0.005509721115231514, 0.005785869434475899, 0.006062017288058996, 0.006338165607303381, 0.006614313926547766, 0.0068904622457921505, 0.007166610565036535, 0.00744275888428092, 0.0077189067378640175, 0.007995055057108402, 0.008271203376352787, 0.008547351695597172, 0.008823500014841557, 0.009099648334085941, 0.009375796653330326, 0.00965194497257471, 0.009928093291819096, 0.01020424161106348, 0.010480389930307865, 0.010756537318229675, 0.01103268563747406, 0.011308833956718445, 0.01158498227596283, 0.011861130595207214, 0.012137278914451599, 0.012413427233695984, 0.012689575552940369, 0.012965723872184753, 0.013241872191429138]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 6.0, 14.0, 13.0, 17.0, 16.0, 22.0, 23.0, 36.0, 29.0, 40.0, 31.0, 35.0, 45.0, 37.0, 40.0, 49.0, 51.0, 45.0, 43.0, 39.0, 44.0, 36.0, 29.0, 33.0, 29.0, 25.0, 26.0, 18.0, 18.0, 27.0, 11.0, 10.0, 7.0, 12.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0016613006591796875, -0.001611512154340744, -0.0015617236495018005, -0.001511935144662857, -0.0014621466398239136, -0.00141235813498497, -0.0013625696301460266, -0.0013127811253070831, -0.0012629926204681396, -0.0012132041156291962, -0.0011634156107902527, -0.0011136271059513092, -0.0010638386011123657, -0.0010140500962734222, -0.0009642615914344788, -0.0009144730865955353, -0.0008646845817565918, -0.0008148960769176483, -0.0007651075720787048, -0.0007153190672397614, -0.0006655305624008179, -0.0006157420575618744, -0.0005659535527229309, -0.0005161650478839874, -0.00046637654304504395, -0.00041658803820610046, -0.000366799533367157, -0.0003170110285282135, -0.00026722252368927, -0.00021743401885032654, -0.00016764551401138306, -0.00011785700917243958, -6.80685043334961e-05, -1.8279999494552612e-05, 3.150850534439087e-05, 8.129701018333435e-05, 0.00013108551502227783, 0.0001808740198612213, 0.0002306625247001648, 0.0002804510295391083, 0.00033023953437805176, 0.00038002803921699524, 0.0004298165440559387, 0.0004796050488948822, 0.0005293935537338257, 0.0005791820585727692, 0.0006289705634117126, 0.0006787590682506561, 0.0007285475730895996, 0.0007783360779285431, 0.0008281245827674866, 0.00087791308760643, 0.0009277015924453735, 0.000977490097284317, 0.0010272786021232605, 0.001077067106962204, 0.0011268556118011475, 0.001176644116640091, 0.0012264326214790344, 0.001276221126317978, 0.0013260096311569214, 0.0013757981359958649, 0.0014255866408348083, 0.0014753751456737518, 0.0015251636505126953]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 8.0, 7.0, 11.0, 9.0, 11.0, 19.0, 18.0, 14.0, 21.0, 29.0, 32.0, 32.0, 38.0, 29.0, 39.0, 43.0, 46.0, 41.0, 43.0, 42.0, 55.0, 39.0, 40.0, 33.0, 30.0, 33.0, 25.0, 25.0, 27.0, 28.0, 15.0, 17.0, 10.0, 13.0, 16.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.640625, -14.206298828125, -13.77197265625, -13.337646484375, -12.9033203125, -12.468994140625, -12.03466796875, -11.600341796875, -11.166015625, -10.731689453125, -10.29736328125, -9.863037109375, -9.4287109375, -8.994384765625, -8.56005859375, -8.125732421875, -7.69140625, -7.257080078125, -6.82275390625, -6.388427734375, -5.9541015625, -5.519775390625, -5.08544921875, -4.651123046875, -4.216796875, -3.782470703125, -3.34814453125, -2.913818359375, -2.4794921875, -2.045166015625, -1.61083984375, -1.176513671875, -0.7421875, -0.307861328125, 0.12646484375, 0.560791015625, 0.9951171875, 1.429443359375, 1.86376953125, 2.298095703125, 2.732421875, 3.166748046875, 3.60107421875, 4.035400390625, 4.4697265625, 4.904052734375, 5.33837890625, 5.772705078125, 6.20703125, 6.641357421875, 7.07568359375, 7.510009765625, 7.9443359375, 8.378662109375, 8.81298828125, 9.247314453125, 9.681640625, 10.115966796875, 10.55029296875, 10.984619140625, 11.4189453125, 11.853271484375, 12.28759765625, 12.721923828125, 13.15625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 7.0, 17.0, 17.0, 25.0, 45.0, 66.0, 82.0, 127.0, 182.0, 244.0, 338.0, 571.0, 785.0, 1230.0, 1817.0, 2835.0, 4568.0, 7781.0, 13210.0, 26343.0, 62595.0, 211819.0, 480762.0, 136955.0, 46510.0, 20998.0, 10942.0, 6473.0, 3737.0, 2454.0, 1614.0, 1087.0, 772.0, 493.0, 301.0, 233.0, 179.0, 98.0, 67.0, 41.0, 45.0, 20.0, 16.0, 18.0, 12.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-9.109375, -8.8441162109375, -8.578857421875, -8.3135986328125, -8.04833984375, -7.7830810546875, -7.517822265625, -7.2525634765625, -6.9873046875, -6.7220458984375, -6.456787109375, -6.1915283203125, -5.92626953125, -5.6610107421875, -5.395751953125, -5.1304931640625, -4.865234375, -4.5999755859375, -4.334716796875, -4.0694580078125, -3.80419921875, -3.5389404296875, -3.273681640625, -3.0084228515625, -2.7431640625, -2.4779052734375, -2.212646484375, -1.9473876953125, -1.68212890625, -1.4168701171875, -1.151611328125, -0.8863525390625, -0.62109375, -0.3558349609375, -0.090576171875, 0.1746826171875, 0.43994140625, 0.7052001953125, 0.970458984375, 1.2357177734375, 1.5009765625, 1.7662353515625, 2.031494140625, 2.2967529296875, 2.56201171875, 2.8272705078125, 3.092529296875, 3.3577880859375, 3.623046875, 3.8883056640625, 4.153564453125, 4.4188232421875, 4.68408203125, 4.9493408203125, 5.214599609375, 5.4798583984375, 5.7451171875, 6.0103759765625, 6.275634765625, 6.5408935546875, 6.80615234375, 7.0714111328125, 7.336669921875, 7.6019287109375, 7.8671875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 10.0, 16.0, 16.0, 21.0, 25.0, 33.0, 23.0, 30.0, 47.0, 47.0, 43.0, 47.0, 69.0, 208.0, 1840.0, 103.0, 48.0, 52.0, 62.0, 46.0, 35.0, 30.0, 29.0, 26.0, 27.0, 22.0, 14.0, 10.0, 7.0, 7.0, 8.0, 6.0, 11.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-66.3125, -64.53369140625, -62.7548828125, -60.97607421875, -59.197265625, -57.41845703125, -55.6396484375, -53.86083984375, -52.08203125, -50.30322265625, -48.5244140625, -46.74560546875, -44.966796875, -43.18798828125, -41.4091796875, -39.63037109375, -37.8515625, -36.07275390625, -34.2939453125, -32.51513671875, -30.736328125, -28.95751953125, -27.1787109375, -25.39990234375, -23.62109375, -21.84228515625, -20.0634765625, -18.28466796875, -16.505859375, -14.72705078125, -12.9482421875, -11.16943359375, -9.390625, -7.61181640625, -5.8330078125, -4.05419921875, -2.275390625, -0.49658203125, 1.2822265625, 3.06103515625, 4.83984375, 6.61865234375, 8.3974609375, 10.17626953125, 11.955078125, 13.73388671875, 15.5126953125, 17.29150390625, 19.0703125, 20.84912109375, 22.6279296875, 24.40673828125, 26.185546875, 27.96435546875, 29.7431640625, 31.52197265625, 33.30078125, 35.07958984375, 36.8583984375, 38.63720703125, 40.416015625, 42.19482421875, 43.9736328125, 45.75244140625, 47.53125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 8.0, 6.0, 10.0, 10.0, 10.0, 14.0, 18.0, 31.0, 37.0, 31.0, 68.0, 84.0, 94.0, 195.0, 325.0, 623.0, 3437.0, 2885184.0, 252023.0, 2112.0, 501.0, 290.0, 177.0, 123.0, 67.0, 40.0, 50.0, 30.0, 21.0, 23.0, 16.0, 15.0, 11.0, 6.0, 5.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.125, -94.7294921875, -91.333984375, -87.9384765625, -84.54296875, -81.1474609375, -77.751953125, -74.3564453125, -70.9609375, -67.5654296875, -64.169921875, -60.7744140625, -57.37890625, -53.9833984375, -50.587890625, -47.1923828125, -43.796875, -40.4013671875, -37.005859375, -33.6103515625, -30.21484375, -26.8193359375, -23.423828125, -20.0283203125, -16.6328125, -13.2373046875, -9.841796875, -6.4462890625, -3.05078125, 0.3447265625, 3.740234375, 7.1357421875, 10.53125, 13.9267578125, 17.322265625, 20.7177734375, 24.11328125, 27.5087890625, 30.904296875, 34.2998046875, 37.6953125, 41.0908203125, 44.486328125, 47.8818359375, 51.27734375, 54.6728515625, 58.068359375, 61.4638671875, 64.859375, 68.2548828125, 71.650390625, 75.0458984375, 78.44140625, 81.8369140625, 85.232421875, 88.6279296875, 92.0234375, 95.4189453125, 98.814453125, 102.2099609375, 105.60546875, 109.0009765625, 112.396484375, 115.7919921875, 119.1875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 233.0, 768.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-710.3665771484375, -697.4947509765625, -684.6229248046875, -671.7510986328125, -658.8792724609375, -646.0074462890625, -633.1355590820312, -620.2637329101562, -607.3919067382812, -594.5200805664062, -581.6482543945312, -568.7764282226562, -555.9046020507812, -543.03271484375, -530.160888671875, -517.2890625, -504.417236328125, -491.54541015625, -478.673583984375, -465.8017272949219, -452.9299011230469, -440.0580749511719, -427.1862487792969, -414.31439208984375, -401.4425964355469, -388.5707702636719, -375.6989440917969, -362.82708740234375, -349.95526123046875, -337.08343505859375, -324.21160888671875, -311.33978271484375, -298.46795654296875, -285.59613037109375, -272.72430419921875, -259.8524475097656, -246.98062133789062, -234.10879516601562, -221.23696899414062, -208.36512756347656, -195.4932861328125, -182.6214599609375, -169.74961853027344, -156.87779235839844, -144.00595092773438, -131.13412475585938, -118.26229095458984, -105.39045715332031, -92.51862335205078, -79.64678955078125, -66.77495574951172, -53.90312576293945, -41.03129196166992, -28.159461975097656, -15.287628173828125, -2.4157943725585938, 10.456039428710938, 23.32787322998047, 36.19970703125, 49.071537017822266, 61.9433708190918, 74.81520080566406, 87.6870346069336, 100.55886840820312, 113.43070220947266]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 6.0, 10.0, 5.0, 11.0, 14.0, 14.0, 17.0, 14.0, 12.0, 20.0, 19.0, 32.0, 32.0, 38.0, 21.0, 33.0, 31.0, 41.0, 34.0, 43.0, 38.0, 35.0, 39.0, 32.0, 34.0, 38.0, 23.0, 35.0, 30.0, 31.0, 35.0, 18.0, 17.0, 20.0, 21.0, 14.0, 25.0, 12.0, 9.0, 5.0, 10.0, 8.0, 6.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-128.62646484375, -124.45686340332031, -120.28726959228516, -116.11767578125, -111.94807434082031, -107.77847290039062, -103.60887908935547, -99.43928527832031, -95.26968383789062, -91.10008239746094, -86.93048858642578, -82.76089477539062, -78.59129333496094, -74.42169189453125, -70.2520980834961, -66.08250427246094, -61.91290283203125, -57.74330520629883, -53.573707580566406, -49.404109954833984, -45.23451232910156, -41.06491470336914, -36.89531707763672, -32.7257194519043, -28.556121826171875, -24.386524200439453, -20.21692657470703, -16.04732894897461, -11.877731323242188, -7.708133697509766, -3.5385360717773438, 0.6310615539550781, 4.8006744384765625, 8.970272064208984, 13.139869689941406, 17.309467315673828, 21.47906494140625, 25.648662567138672, 29.818260192871094, 33.987857818603516, 38.15745544433594, 42.32705307006836, 46.49665069580078, 50.6662483215332, 54.835845947265625, 59.00544357299805, 63.17504119873047, 67.34463500976562, 71.51423645019531, 75.683837890625, 79.85343170166016, 84.02302551269531, 88.192626953125, 92.36222839355469, 96.53182220458984, 100.701416015625, 104.87101745605469, 109.04061889648438, 113.21021270751953, 117.37980651855469, 121.54940795898438, 125.71900939941406, 129.88861083984375, 134.05819702148438, 138.22779846191406]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 10.0, 10.0, 8.0, 6.0, 13.0, 12.0, 14.0, 17.0, 16.0, 23.0, 22.0, 32.0, 37.0, 35.0, 28.0, 33.0, 45.0, 46.0, 38.0, 46.0, 36.0, 47.0, 52.0, 39.0, 29.0, 27.0, 35.0, 21.0, 33.0, 30.0, 25.0, 20.0, 15.0, 15.0, 18.0, 13.0, 8.0, 8.0, 6.0, 10.0, 7.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.34375, -13.90966796875, -13.4755859375, -13.04150390625, -12.607421875, -12.17333984375, -11.7392578125, -11.30517578125, -10.87109375, -10.43701171875, -10.0029296875, -9.56884765625, -9.134765625, -8.70068359375, -8.2666015625, -7.83251953125, -7.3984375, -6.96435546875, -6.5302734375, -6.09619140625, -5.662109375, -5.22802734375, -4.7939453125, -4.35986328125, -3.92578125, -3.49169921875, -3.0576171875, -2.62353515625, -2.189453125, -1.75537109375, -1.3212890625, -0.88720703125, -0.453125, -0.01904296875, 0.4150390625, 0.84912109375, 1.283203125, 1.71728515625, 2.1513671875, 2.58544921875, 3.01953125, 3.45361328125, 3.8876953125, 4.32177734375, 4.755859375, 5.18994140625, 5.6240234375, 6.05810546875, 6.4921875, 6.92626953125, 7.3603515625, 7.79443359375, 8.228515625, 8.66259765625, 9.0966796875, 9.53076171875, 9.96484375, 10.39892578125, 10.8330078125, 11.26708984375, 11.701171875, 12.13525390625, 12.5693359375, 13.00341796875, 13.4375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 7.0, 9.0, 18.0, 18.0, 25.0, 40.0, 45.0, 68.0, 87.0, 125.0, 219.0, 367.0, 693.0, 1482.0, 3563.0, 9964.0, 33948.0, 129501.0, 482920.0, 1354361.0, 1441849.0, 536168.0, 142249.0, 37947.0, 11188.0, 3943.0, 1534.0, 786.0, 414.0, 262.0, 146.0, 86.0, 56.0, 60.0, 36.0, 31.0, 23.0, 14.0, 6.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.1875, -14.6982421875, -14.208984375, -13.7197265625, -13.23046875, -12.7412109375, -12.251953125, -11.7626953125, -11.2734375, -10.7841796875, -10.294921875, -9.8056640625, -9.31640625, -8.8271484375, -8.337890625, -7.8486328125, -7.359375, -6.8701171875, -6.380859375, -5.8916015625, -5.40234375, -4.9130859375, -4.423828125, -3.9345703125, -3.4453125, -2.9560546875, -2.466796875, -1.9775390625, -1.48828125, -0.9990234375, -0.509765625, -0.0205078125, 0.46875, 0.9580078125, 1.447265625, 1.9365234375, 2.42578125, 2.9150390625, 3.404296875, 3.8935546875, 4.3828125, 4.8720703125, 5.361328125, 5.8505859375, 6.33984375, 6.8291015625, 7.318359375, 7.8076171875, 8.296875, 8.7861328125, 9.275390625, 9.7646484375, 10.25390625, 10.7431640625, 11.232421875, 11.7216796875, 12.2109375, 12.7001953125, 13.189453125, 13.6787109375, 14.16796875, 14.6572265625, 15.146484375, 15.6357421875, 16.125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 8.0, 12.0, 7.0, 17.0, 18.0, 31.0, 30.0, 41.0, 56.0, 69.0, 91.0, 110.0, 177.0, 231.0, 285.0, 366.0, 503.0, 482.0, 403.0, 294.0, 229.0, 136.0, 122.0, 79.0, 52.0, 64.0, 41.0, 37.0, 24.0, 16.0, 15.0, 4.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.59375, -41.40966796875, -40.2255859375, -39.04150390625, -37.857421875, -36.67333984375, -35.4892578125, -34.30517578125, -33.12109375, -31.93701171875, -30.7529296875, -29.56884765625, -28.384765625, -27.20068359375, -26.0166015625, -24.83251953125, -23.6484375, -22.46435546875, -21.2802734375, -20.09619140625, -18.912109375, -17.72802734375, -16.5439453125, -15.35986328125, -14.17578125, -12.99169921875, -11.8076171875, -10.62353515625, -9.439453125, -8.25537109375, -7.0712890625, -5.88720703125, -4.703125, -3.51904296875, -2.3349609375, -1.15087890625, 0.033203125, 1.21728515625, 2.4013671875, 3.58544921875, 4.76953125, 5.95361328125, 7.1376953125, 8.32177734375, 9.505859375, 10.68994140625, 11.8740234375, 13.05810546875, 14.2421875, 15.42626953125, 16.6103515625, 17.79443359375, 18.978515625, 20.16259765625, 21.3466796875, 22.53076171875, 23.71484375, 24.89892578125, 26.0830078125, 27.26708984375, 28.451171875, 29.63525390625, 30.8193359375, 32.00341796875, 33.1875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 4.0, 11.0, 8.0, 13.0, 9.0, 22.0, 41.0, 60.0, 65.0, 73.0, 100.0, 172.0, 302.0, 529.0, 3428.0, 4156319.0, 31215.0, 827.0, 367.0, 216.0, 129.0, 107.0, 73.0, 44.0, 22.0, 38.0, 22.0, 26.0, 13.0, 7.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.375, -201.107421875, -193.83984375, -186.572265625, -179.3046875, -172.037109375, -164.76953125, -157.501953125, -150.234375, -142.966796875, -135.69921875, -128.431640625, -121.1640625, -113.896484375, -106.62890625, -99.361328125, -92.09375, -84.826171875, -77.55859375, -70.291015625, -63.0234375, -55.755859375, -48.48828125, -41.220703125, -33.953125, -26.685546875, -19.41796875, -12.150390625, -4.8828125, 2.384765625, 9.65234375, 16.919921875, 24.1875, 31.455078125, 38.72265625, 45.990234375, 53.2578125, 60.525390625, 67.79296875, 75.060546875, 82.328125, 89.595703125, 96.86328125, 104.130859375, 111.3984375, 118.666015625, 125.93359375, 133.201171875, 140.46875, 147.736328125, 155.00390625, 162.271484375, 169.5390625, 176.806640625, 184.07421875, 191.341796875, 198.609375, 205.876953125, 213.14453125, 220.412109375, 227.6796875, 234.947265625, 242.21484375, 249.482421875, 256.75]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 43.0, 409.0, 488.0, 70.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-924.8982543945312, -905.6610717773438, -886.4239501953125, -867.186767578125, -847.9495849609375, -828.71240234375, -809.4752807617188, -790.2380981445312, -771.0009765625, -751.7637939453125, -732.5266723632812, -713.2894897460938, -694.0523071289062, -674.815185546875, -655.5780029296875, -636.3408203125, -617.1036376953125, -597.866455078125, -578.6293334960938, -559.3921508789062, -540.1549682617188, -520.9178466796875, -501.6806640625, -482.4434814453125, -463.2063293457031, -443.96917724609375, -424.73199462890625, -405.4948425292969, -386.2576904296875, -367.0205078125, -347.7833557128906, -328.54620361328125, -309.3089599609375, -290.0718078613281, -270.8346252441406, -251.59747314453125, -232.3603057861328, -213.12313842773438, -193.885986328125, -174.64881896972656, -155.41165161132812, -136.1744842529297, -116.93732452392578, -97.70016479492188, -78.46299743652344, -59.225830078125, -39.988670349121094, -20.751510620117188, -1.51434326171875, 17.722820281982422, 36.959983825683594, 56.197147369384766, 75.43431091308594, 94.67147827148438, 113.90863800048828, 133.1457977294922, 152.38296508789062, 171.62013244628906, 190.8572998046875, 210.09445190429688, 229.3316192626953, 248.56878662109375, 267.8059387207031, 287.0430908203125, 306.2802734375]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 4.0, 14.0, 15.0, 13.0, 23.0, 24.0, 25.0, 23.0, 26.0, 29.0, 40.0, 36.0, 36.0, 45.0, 34.0, 38.0, 39.0, 39.0, 42.0, 41.0, 48.0, 36.0, 30.0, 32.0, 17.0, 22.0, 28.0, 16.0, 24.0, 25.0, 24.0, 14.0, 14.0, 10.0, 10.0, 9.0, 8.0, 6.0, 4.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-115.96331787109375, -112.01614379882812, -108.0689697265625, -104.12178802490234, -100.17461395263672, -96.2274398803711, -92.28025817871094, -88.33308410644531, -84.38591003417969, -80.43873596191406, -76.49156188964844, -72.54438018798828, -68.59720611572266, -64.65003204345703, -60.70285415649414, -56.75567626953125, -52.808502197265625, -48.861328125, -44.91415023803711, -40.96697235107422, -37.019798278808594, -33.07262420654297, -29.125446319580078, -25.17827033996582, -21.231094360351562, -17.283918380737305, -13.336742401123047, -9.389566421508789, -5.442390441894531, -1.4952144622802734, 2.4519615173339844, 6.399137496948242, 10.3463134765625, 14.293489456176758, 18.240665435791016, 22.187841415405273, 26.13501739501953, 30.08219337463379, 34.02936935424805, 37.97654724121094, 41.92372131347656, 45.87089538574219, 49.81807327270508, 53.76525115966797, 57.712425231933594, 61.65959930419922, 65.60678100585938, 69.553955078125, 73.50112915039062, 77.44830322265625, 81.39547729492188, 85.34265899658203, 89.28983306884766, 93.23700714111328, 97.18418884277344, 101.13136291503906, 105.07853698730469, 109.02571105957031, 112.97288513183594, 116.9200668334961, 120.86724090576172, 124.81441497802734, 128.7615966796875, 132.70877075195312, 136.65594482421875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 14.0, 4.0, 11.0, 12.0, 15.0, 18.0, 21.0, 25.0, 19.0, 35.0, 38.0, 39.0, 35.0, 40.0, 32.0, 40.0, 58.0, 51.0, 41.0, 35.0, 42.0, 43.0, 24.0, 33.0, 34.0, 27.0, 27.0, 23.0, 21.0, 20.0, 19.0, 16.0, 14.0, 9.0, 9.0, 6.0, 10.0, 3.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.05712890625, -13.5986328125, -13.14013671875, -12.681640625, -12.22314453125, -11.7646484375, -11.30615234375, -10.84765625, -10.38916015625, -9.9306640625, -9.47216796875, -9.013671875, -8.55517578125, -8.0966796875, -7.63818359375, -7.1796875, -6.72119140625, -6.2626953125, -5.80419921875, -5.345703125, -4.88720703125, -4.4287109375, -3.97021484375, -3.51171875, -3.05322265625, -2.5947265625, -2.13623046875, -1.677734375, -1.21923828125, -0.7607421875, -0.30224609375, 0.15625, 0.61474609375, 1.0732421875, 1.53173828125, 1.990234375, 2.44873046875, 2.9072265625, 3.36572265625, 3.82421875, 4.28271484375, 4.7412109375, 5.19970703125, 5.658203125, 6.11669921875, 6.5751953125, 7.03369140625, 7.4921875, 7.95068359375, 8.4091796875, 8.86767578125, 9.326171875, 9.78466796875, 10.2431640625, 10.70166015625, 11.16015625, 11.61865234375, 12.0771484375, 12.53564453125, 12.994140625, 13.45263671875, 13.9111328125, 14.36962890625, 14.828125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 11.0, 17.0, 10.0, 19.0, 31.0, 46.0, 64.0, 83.0, 139.0, 152.0, 226.0, 329.0, 423.0, 641.0, 853.0, 1259.0, 1725.0, 2360.0, 3500.0, 5043.0, 7091.0, 10305.0, 15270.0, 22915.0, 34995.0, 55716.0, 94396.0, 190049.0, 289636.0, 118014.0, 67698.0, 41478.0, 26720.0, 17736.0, 12051.0, 8298.0, 5683.0, 3958.0, 2767.0, 1946.0, 1441.0, 992.0, 658.0, 550.0, 358.0, 271.0, 173.0, 150.0, 92.0, 63.0, 43.0, 49.0, 18.0, 17.0, 5.0, 13.0, 10.0, 2.0, 3.0, 5.0], "bins": [-3.3046875, -3.2020263671875, -3.099365234375, -2.9967041015625, -2.89404296875, -2.7913818359375, -2.688720703125, -2.5860595703125, -2.4833984375, -2.3807373046875, -2.278076171875, -2.1754150390625, -2.07275390625, -1.9700927734375, -1.867431640625, -1.7647705078125, -1.662109375, -1.5594482421875, -1.456787109375, -1.3541259765625, -1.25146484375, -1.1488037109375, -1.046142578125, -0.9434814453125, -0.8408203125, -0.7381591796875, -0.635498046875, -0.5328369140625, -0.43017578125, -0.3275146484375, -0.224853515625, -0.1221923828125, -0.01953125, 0.0831298828125, 0.185791015625, 0.2884521484375, 0.39111328125, 0.4937744140625, 0.596435546875, 0.6990966796875, 0.8017578125, 0.9044189453125, 1.007080078125, 1.1097412109375, 1.21240234375, 1.3150634765625, 1.417724609375, 1.5203857421875, 1.623046875, 1.7257080078125, 1.828369140625, 1.9310302734375, 2.03369140625, 2.1363525390625, 2.239013671875, 2.3416748046875, 2.4443359375, 2.5469970703125, 2.649658203125, 2.7523193359375, 2.85498046875, 2.9576416015625, 3.060302734375, 3.1629638671875, 3.265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 9.0, 4.0, 11.0, 13.0, 12.0, 13.0, 14.0, 13.0, 21.0, 22.0, 25.0, 28.0, 38.0, 42.0, 39.0, 40.0, 38.0, 38.0, 34.0, 54.0, 1060.0, 27.0, 41.0, 37.0, 34.0, 33.0, 22.0, 30.0, 32.0, 23.0, 15.0, 22.0, 29.0, 17.0, 12.0, 13.0, 12.0, 7.0, 7.0, 10.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.93359375, -7.66949462890625, -7.4053955078125, -7.14129638671875, -6.877197265625, -6.61309814453125, -6.3489990234375, -6.08489990234375, -5.82080078125, -5.55670166015625, -5.2926025390625, -5.02850341796875, -4.764404296875, -4.50030517578125, -4.2362060546875, -3.97210693359375, -3.7080078125, -3.44390869140625, -3.1798095703125, -2.91571044921875, -2.651611328125, -2.38751220703125, -2.1234130859375, -1.85931396484375, -1.59521484375, -1.33111572265625, -1.0670166015625, -0.80291748046875, -0.538818359375, -0.27471923828125, -0.0106201171875, 0.25347900390625, 0.517578125, 0.78167724609375, 1.0457763671875, 1.30987548828125, 1.573974609375, 1.83807373046875, 2.1021728515625, 2.36627197265625, 2.63037109375, 2.89447021484375, 3.1585693359375, 3.42266845703125, 3.686767578125, 3.95086669921875, 4.2149658203125, 4.47906494140625, 4.7431640625, 5.00726318359375, 5.2713623046875, 5.53546142578125, 5.799560546875, 6.06365966796875, 6.3277587890625, 6.59185791015625, 6.85595703125, 7.12005615234375, 7.3841552734375, 7.64825439453125, 7.912353515625, 8.17645263671875, 8.4405517578125, 8.70465087890625, 8.96875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 8.0, 10.0, 20.0, 19.0, 37.0, 50.0, 70.0, 117.0, 129.0, 185.0, 298.0, 420.0, 599.0, 887.0, 1266.0, 1957.0, 2879.0, 4414.0, 6854.0, 10501.0, 16281.0, 25677.0, 41776.0, 70845.0, 127435.0, 1368514.0, 180427.0, 92417.0, 53208.0, 32373.0, 20258.0, 12887.0, 8187.0, 5439.0, 3502.0, 2344.0, 1500.0, 1032.0, 717.0, 502.0, 330.0, 216.0, 157.0, 132.0, 74.0, 58.0, 44.0, 24.0, 15.0, 10.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.525390625, -3.417694091796875, -3.30999755859375, -3.202301025390625, -3.0946044921875, -2.986907958984375, -2.87921142578125, -2.771514892578125, -2.663818359375, -2.556121826171875, -2.44842529296875, -2.340728759765625, -2.2330322265625, -2.125335693359375, -2.01763916015625, -1.909942626953125, -1.80224609375, -1.694549560546875, -1.58685302734375, -1.479156494140625, -1.3714599609375, -1.263763427734375, -1.15606689453125, -1.048370361328125, -0.940673828125, -0.832977294921875, -0.72528076171875, -0.617584228515625, -0.5098876953125, -0.402191162109375, -0.29449462890625, -0.186798095703125, -0.0791015625, 0.028594970703125, 0.13629150390625, 0.243988037109375, 0.3516845703125, 0.459381103515625, 0.56707763671875, 0.674774169921875, 0.782470703125, 0.890167236328125, 0.99786376953125, 1.105560302734375, 1.2132568359375, 1.320953369140625, 1.42864990234375, 1.536346435546875, 1.64404296875, 1.751739501953125, 1.85943603515625, 1.967132568359375, 2.0748291015625, 2.182525634765625, 2.29022216796875, 2.397918701171875, 2.505615234375, 2.613311767578125, 2.72100830078125, 2.828704833984375, 2.9364013671875, 3.044097900390625, 3.15179443359375, 3.259490966796875, 3.3671875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 11.0, 13.0, 19.0, 31.0, 32.0, 50.0, 68.0, 86.0, 115.0, 129.0, 97.0, 92.0, 68.0, 44.0, 40.0, 20.0, 18.0, 12.0, 8.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00383758544921875, -0.0037261545658111572, -0.0036147236824035645, -0.0035032927989959717, -0.003391861915588379, -0.003280431032180786, -0.0031690001487731934, -0.0030575692653656006, -0.002946138381958008, -0.002834707498550415, -0.0027232766151428223, -0.0026118457317352295, -0.0025004148483276367, -0.002388983964920044, -0.002277553081512451, -0.0021661221981048584, -0.0020546913146972656, -0.0019432604312896729, -0.00183182954788208, -0.0017203986644744873, -0.0016089677810668945, -0.0014975368976593018, -0.001386106014251709, -0.0012746751308441162, -0.0011632442474365234, -0.0010518133640289307, -0.0009403824806213379, -0.0008289515972137451, -0.0007175207138061523, -0.0006060898303985596, -0.0004946589469909668, -0.000383228063583374, -0.00027179718017578125, -0.00016036629676818848, -4.89354133605957e-05, 6.249547004699707e-05, 0.00017392635345458984, 0.0002853572368621826, 0.0003967881202697754, 0.0005082190036773682, 0.0006196498870849609, 0.0007310807704925537, 0.0008425116539001465, 0.0009539425373077393, 0.001065373420715332, 0.0011768043041229248, 0.0012882351875305176, 0.0013996660709381104, 0.0015110969543457031, 0.001622527837753296, 0.0017339587211608887, 0.0018453896045684814, 0.0019568204879760742, 0.002068251371383667, 0.0021796822547912598, 0.0022911131381988525, 0.0024025440216064453, 0.002513974905014038, 0.002625405788421631, 0.0027368366718292236, 0.0028482675552368164, 0.002959698438644409, 0.003071129322052002, 0.0031825602054595947, 0.0032939910888671875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 10.0, 10.0, 14.0, 20.0, 22.0, 39.0, 66.0, 109.0, 317.0, 1411.0, 1044648.0, 1275.0, 281.0, 109.0, 56.0, 35.0, 40.0, 18.0, 14.0, 10.0, 4.0, 6.0, 12.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07765674591064453, -0.07493019104003906, -0.0722036361694336, -0.06947708129882812, -0.06675052642822266, -0.06402397155761719, -0.06129741668701172, -0.05857086181640625, -0.05584430694580078, -0.05311775207519531, -0.050391197204589844, -0.047664642333984375, -0.044938087463378906, -0.04221153259277344, -0.03948497772216797, -0.0367584228515625, -0.03403186798095703, -0.03130531311035156, -0.028578758239746094, -0.025852203369140625, -0.023125648498535156, -0.020399093627929688, -0.01767253875732422, -0.01494598388671875, -0.012219429016113281, -0.009492874145507812, -0.006766319274902344, -0.004039764404296875, -0.0013132095336914062, 0.0014133453369140625, 0.004139900207519531, 0.006866455078125, 0.009593009948730469, 0.012319564819335938, 0.015046119689941406, 0.017772674560546875, 0.020499229431152344, 0.023225784301757812, 0.02595233917236328, 0.02867889404296875, 0.03140544891357422, 0.03413200378417969, 0.036858558654785156, 0.039585113525390625, 0.042311668395996094, 0.04503822326660156, 0.04776477813720703, 0.0504913330078125, 0.05321788787841797, 0.05594444274902344, 0.058670997619628906, 0.061397552490234375, 0.06412410736083984, 0.06685066223144531, 0.06957721710205078, 0.07230377197265625, 0.07503032684326172, 0.07775688171386719, 0.08048343658447266, 0.08320999145507812, 0.0859365463256836, 0.08866310119628906, 0.09138965606689453, 0.0941162109375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 574.0, 437.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.02189924195408821, -0.021527711302042007, -0.021156180649995804, -0.0207846499979496, -0.020413117483258247, -0.020041586831212044, -0.01967005617916584, -0.019298525527119637, -0.018926994875073433, -0.01855546422302723, -0.018183933570981026, -0.017812401056289673, -0.01744087040424347, -0.017069339752197266, -0.016697809100151062, -0.01632627844810486, -0.015954745933413506, -0.015583215281367302, -0.015211683697998524, -0.01484015304595232, -0.014468622393906116, -0.014097090810537338, -0.013725560158491135, -0.013354029506444931, -0.012982498854398727, -0.012610968202352524, -0.012239436618983746, -0.011867905966937542, -0.011496375314891338, -0.01112484373152256, -0.010753313079476357, -0.010381782427430153, -0.0100102499127388, -0.009638719260692596, -0.009267187677323818, -0.008895657025277615, -0.008524126373231411, -0.008152594789862633, -0.007781064137816429, -0.007409533020108938, -0.007038002368062735, -0.006666471250355244, -0.00629494059830904, -0.005923409480601549, -0.005551878362894058, -0.005180347710847855, -0.004808816593140364, -0.004437285475432873, -0.004065754357725382, -0.0036942234728485346, -0.0033226923551410437, -0.0029511614702641964, -0.0025796303525567055, -0.002208099467679858, -0.001836568582803011, -0.00146503746509552, -0.0010935066966339946, -0.0007219756953418255, -0.0003504447522573173, 2.1086190827190876e-05, 0.00039261719211935997, 0.0007641481934115291, 0.0011356790782883763, 0.0015072101959958673, 0.0018787410808727145]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 6.0, 3.0, 7.0, 8.0, 9.0, 9.0, 14.0, 19.0, 17.0, 30.0, 17.0, 13.0, 24.0, 41.0, 37.0, 33.0, 31.0, 37.0, 31.0, 33.0, 26.0, 43.0, 43.0, 31.0, 37.0, 36.0, 31.0, 36.0, 32.0, 34.0, 21.0, 27.0, 33.0, 12.0, 19.0, 10.0, 15.0, 18.0, 14.0, 5.0, 12.0, 12.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.001175224781036377, -0.0011422708630561829, -0.0011093169450759888, -0.0010763630270957947, -0.0010434091091156006, -0.0010104551911354065, -0.0009775012731552124, -0.0009445473551750183, -0.0009115934371948242, -0.0008786395192146301, -0.000845685601234436, -0.0008127316832542419, -0.0007797777652740479, -0.0007468238472938538, -0.0007138699293136597, -0.0006809160113334656, -0.0006479620933532715, -0.0006150081753730774, -0.0005820542573928833, -0.0005491003394126892, -0.0005161464214324951, -0.000483192503452301, -0.00045023858547210693, -0.00041728466749191284, -0.00038433074951171875, -0.00035137683153152466, -0.00031842291355133057, -0.0002854689955711365, -0.0002525150775909424, -0.0002195611596107483, -0.0001866072416305542, -0.0001536533236503601, -0.00012069940567016602, -8.774548768997192e-05, -5.479156970977783e-05, -2.183765172958374e-05, 1.1116266250610352e-05, 4.407018423080444e-05, 7.702410221099854e-05, 0.00010997802019119263, 0.00014293193817138672, 0.0001758858561515808, 0.0002088397741317749, 0.000241793692111969, 0.0002747476100921631, 0.0003077015280723572, 0.00034065544605255127, 0.00037360936403274536, 0.00040656328201293945, 0.00043951719999313354, 0.00047247111797332764, 0.0005054250359535217, 0.0005383789539337158, 0.0005713328719139099, 0.000604286789894104, 0.0006372407078742981, 0.0006701946258544922, 0.0007031485438346863, 0.0007361024618148804, 0.0007690563797950745, 0.0008020102977752686, 0.0008349642157554626, 0.0008679181337356567, 0.0009008720517158508, 0.0009338259696960449]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 14.0, 4.0, 11.0, 12.0, 15.0, 18.0, 21.0, 25.0, 19.0, 35.0, 38.0, 39.0, 35.0, 40.0, 32.0, 40.0, 58.0, 51.0, 41.0, 35.0, 42.0, 43.0, 24.0, 33.0, 34.0, 27.0, 27.0, 23.0, 21.0, 20.0, 19.0, 16.0, 14.0, 9.0, 9.0, 6.0, 10.0, 3.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.05712890625, -13.5986328125, -13.14013671875, -12.681640625, -12.22314453125, -11.7646484375, -11.30615234375, -10.84765625, -10.38916015625, -9.9306640625, -9.47216796875, -9.013671875, -8.55517578125, -8.0966796875, -7.63818359375, -7.1796875, -6.72119140625, -6.2626953125, -5.80419921875, -5.345703125, -4.88720703125, -4.4287109375, -3.97021484375, -3.51171875, -3.05322265625, -2.5947265625, -2.13623046875, -1.677734375, -1.21923828125, -0.7607421875, -0.30224609375, 0.15625, 0.61474609375, 1.0732421875, 1.53173828125, 1.990234375, 2.44873046875, 2.9072265625, 3.36572265625, 3.82421875, 4.28271484375, 4.7412109375, 5.19970703125, 5.658203125, 6.11669921875, 6.5751953125, 7.03369140625, 7.4921875, 7.95068359375, 8.4091796875, 8.86767578125, 9.326171875, 9.78466796875, 10.2431640625, 10.70166015625, 11.16015625, 11.61865234375, 12.0771484375, 12.53564453125, 12.994140625, 13.45263671875, 13.9111328125, 14.36962890625, 14.828125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 8.0, 17.0, 21.0, 32.0, 36.0, 47.0, 80.0, 102.0, 188.0, 327.0, 551.0, 1054.0, 2270.0, 4741.0, 11038.0, 28624.0, 88217.0, 336323.0, 407385.0, 109531.0, 34239.0, 13017.0, 5447.0, 2434.0, 1206.0, 659.0, 324.0, 207.0, 118.0, 69.0, 65.0, 55.0, 24.0, 17.0, 16.0, 12.0, 6.0, 6.0, 7.0, 4.0, 4.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4296875, -11.084228515625, -10.73876953125, -10.393310546875, -10.0478515625, -9.702392578125, -9.35693359375, -9.011474609375, -8.666015625, -8.320556640625, -7.97509765625, -7.629638671875, -7.2841796875, -6.938720703125, -6.59326171875, -6.247802734375, -5.90234375, -5.556884765625, -5.21142578125, -4.865966796875, -4.5205078125, -4.175048828125, -3.82958984375, -3.484130859375, -3.138671875, -2.793212890625, -2.44775390625, -2.102294921875, -1.7568359375, -1.411376953125, -1.06591796875, -0.720458984375, -0.375, -0.029541015625, 0.31591796875, 0.661376953125, 1.0068359375, 1.352294921875, 1.69775390625, 2.043212890625, 2.388671875, 2.734130859375, 3.07958984375, 3.425048828125, 3.7705078125, 4.115966796875, 4.46142578125, 4.806884765625, 5.15234375, 5.497802734375, 5.84326171875, 6.188720703125, 6.5341796875, 6.879638671875, 7.22509765625, 7.570556640625, 7.916015625, 8.261474609375, 8.60693359375, 8.952392578125, 9.2978515625, 9.643310546875, 9.98876953125, 10.334228515625, 10.6796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 5.0, 7.0, 12.0, 4.0, 10.0, 9.0, 12.0, 22.0, 22.0, 31.0, 26.0, 24.0, 28.0, 31.0, 38.0, 34.0, 42.0, 65.0, 73.0, 187.0, 1673.0, 192.0, 73.0, 37.0, 41.0, 34.0, 39.0, 52.0, 21.0, 25.0, 24.0, 24.0, 13.0, 15.0, 14.0, 18.0, 10.0, 13.0, 10.0, 7.0, 9.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.21875, -45.76318359375, -44.3076171875, -42.85205078125, -41.396484375, -39.94091796875, -38.4853515625, -37.02978515625, -35.57421875, -34.11865234375, -32.6630859375, -31.20751953125, -29.751953125, -28.29638671875, -26.8408203125, -25.38525390625, -23.9296875, -22.47412109375, -21.0185546875, -19.56298828125, -18.107421875, -16.65185546875, -15.1962890625, -13.74072265625, -12.28515625, -10.82958984375, -9.3740234375, -7.91845703125, -6.462890625, -5.00732421875, -3.5517578125, -2.09619140625, -0.640625, 0.81494140625, 2.2705078125, 3.72607421875, 5.181640625, 6.63720703125, 8.0927734375, 9.54833984375, 11.00390625, 12.45947265625, 13.9150390625, 15.37060546875, 16.826171875, 18.28173828125, 19.7373046875, 21.19287109375, 22.6484375, 24.10400390625, 25.5595703125, 27.01513671875, 28.470703125, 29.92626953125, 31.3818359375, 32.83740234375, 34.29296875, 35.74853515625, 37.2041015625, 38.65966796875, 40.115234375, 41.57080078125, 43.0263671875, 44.48193359375, 45.9375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 10.0, 13.0, 11.0, 13.0, 18.0, 20.0, 24.0, 26.0, 39.0, 52.0, 71.0, 104.0, 129.0, 139.0, 217.0, 342.0, 844.0, 4898.0, 2599825.0, 533489.0, 3536.0, 698.0, 287.0, 210.0, 165.0, 106.0, 86.0, 56.0, 45.0, 40.0, 40.0, 31.0, 24.0, 12.0, 9.0, 9.0, 8.0, 11.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-95.25, -92.2666015625, -89.283203125, -86.2998046875, -83.31640625, -80.3330078125, -77.349609375, -74.3662109375, -71.3828125, -68.3994140625, -65.416015625, -62.4326171875, -59.44921875, -56.4658203125, -53.482421875, -50.4990234375, -47.515625, -44.5322265625, -41.548828125, -38.5654296875, -35.58203125, -32.5986328125, -29.615234375, -26.6318359375, -23.6484375, -20.6650390625, -17.681640625, -14.6982421875, -11.71484375, -8.7314453125, -5.748046875, -2.7646484375, 0.21875, 3.2021484375, 6.185546875, 9.1689453125, 12.15234375, 15.1357421875, 18.119140625, 21.1025390625, 24.0859375, 27.0693359375, 30.052734375, 33.0361328125, 36.01953125, 39.0029296875, 41.986328125, 44.9697265625, 47.953125, 50.9365234375, 53.919921875, 56.9033203125, 59.88671875, 62.8701171875, 65.853515625, 68.8369140625, 71.8203125, 74.8037109375, 77.787109375, 80.7705078125, 83.75390625, 86.7373046875, 89.720703125, 92.7041015625, 95.6875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 20.0, 71.0, 203.0, 304.0, 240.0, 120.0, 37.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.35346984863281, -74.33320617675781, -71.31294250488281, -68.29267120361328, -65.27240753173828, -62.25214385986328, -59.231876373291016, -56.21160888671875, -53.19134521484375, -50.17108154296875, -47.150814056396484, -44.13054656982422, -41.11028289794922, -38.09001922607422, -35.06975173950195, -32.04948425292969, -29.029220581054688, -26.008955001831055, -22.988689422607422, -19.96842384338379, -16.948158264160156, -13.927892684936523, -10.90762710571289, -7.887361526489258, -4.867095947265625, -1.8468303680419922, 1.1734352111816406, 4.193700790405273, 7.213966369628906, 10.234231948852539, 13.254497528076172, 16.274763107299805, 19.29503631591797, 22.3153018951416, 25.335567474365234, 28.355833053588867, 31.3760986328125, 34.3963623046875, 37.416629791259766, 40.43689727783203, 43.45716094970703, 46.47742462158203, 49.4976921081543, 52.51795959472656, 55.53822326660156, 58.55848693847656, 61.57875442504883, 64.5990219116211, 67.6192855834961, 70.6395492553711, 73.65982055664062, 76.68008422851562, 79.70034790039062, 82.72061157226562, 85.74087524414062, 88.76114654541016, 91.78141021728516, 94.80167388916016, 97.82194519042969, 100.84220886230469, 103.86247253417969, 106.88273620605469, 109.90299987792969, 112.92327117919922, 115.94353485107422]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 2.0, 10.0, 9.0, 17.0, 14.0, 20.0, 18.0, 20.0, 26.0, 25.0, 33.0, 37.0, 29.0, 39.0, 36.0, 31.0, 39.0, 39.0, 50.0, 40.0, 46.0, 52.0, 36.0, 33.0, 31.0, 28.0, 24.0, 29.0, 24.0, 22.0, 17.0, 20.0, 17.0, 15.0, 11.0, 11.0, 11.0, 1.0, 10.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-114.98191833496094, -111.24540710449219, -107.50889587402344, -103.77238464355469, -100.03587341308594, -96.29936218261719, -92.56285095214844, -88.82634735107422, -85.08983612060547, -81.35332489013672, -77.61681365966797, -73.88030242919922, -70.14379119873047, -66.40728759765625, -62.670772552490234, -58.93426513671875, -55.197750091552734, -51.461238861083984, -47.724727630615234, -43.98822021484375, -40.251708984375, -36.51519775390625, -32.7786865234375, -29.042177200317383, -25.305665969848633, -21.569154739379883, -17.832645416259766, -14.096134185791016, -10.359623908996582, -6.623113632202148, -2.8866024017333984, 0.8499069213867188, 4.586418151855469, 8.322928428649902, 12.059438705444336, 15.795949935913086, 19.532459259033203, 23.268970489501953, 27.005481719970703, 30.74199104309082, 34.47850036621094, 38.21501159667969, 41.95152282714844, 45.68803405761719, 49.42454147338867, 53.16105270385742, 56.89756393432617, 60.634071350097656, 64.37059020996094, 68.10710144042969, 71.84361267089844, 75.58012390136719, 79.31663513183594, 83.05314636230469, 86.78965759277344, 90.52616119384766, 94.2626724243164, 97.99918365478516, 101.7356948852539, 105.47220611572266, 109.2087173461914, 112.94522094726562, 116.68173217773438, 120.41824340820312, 124.15475463867188]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 5.0, 13.0, 10.0, 5.0, 11.0, 19.0, 17.0, 16.0, 24.0, 25.0, 27.0, 36.0, 38.0, 42.0, 40.0, 41.0, 37.0, 48.0, 54.0, 45.0, 35.0, 51.0, 35.0, 31.0, 40.0, 26.0, 31.0, 30.0, 24.0, 18.0, 19.0, 24.0, 18.0, 7.0, 8.0, 12.0, 8.0, 4.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3359375, -14.85546875, -14.375, -13.89453125, -13.4140625, -12.93359375, -12.453125, -11.97265625, -11.4921875, -11.01171875, -10.53125, -10.05078125, -9.5703125, -9.08984375, -8.609375, -8.12890625, -7.6484375, -7.16796875, -6.6875, -6.20703125, -5.7265625, -5.24609375, -4.765625, -4.28515625, -3.8046875, -3.32421875, -2.84375, -2.36328125, -1.8828125, -1.40234375, -0.921875, -0.44140625, 0.0390625, 0.51953125, 1.0, 1.48046875, 1.9609375, 2.44140625, 2.921875, 3.40234375, 3.8828125, 4.36328125, 4.84375, 5.32421875, 5.8046875, 6.28515625, 6.765625, 7.24609375, 7.7265625, 8.20703125, 8.6875, 9.16796875, 9.6484375, 10.12890625, 10.609375, 11.08984375, 11.5703125, 12.05078125, 12.53125, 13.01171875, 13.4921875, 13.97265625, 14.453125, 14.93359375, 15.4140625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 11.0, 8.0, 8.0, 10.0, 12.0, 21.0, 15.0, 21.0, 17.0, 29.0, 40.0, 38.0, 63.0, 74.0, 123.0, 238.0, 862.0, 64593.0, 4062932.0, 63543.0, 888.0, 236.0, 112.0, 75.0, 66.0, 33.0, 35.0, 20.0, 20.0, 25.0, 17.0, 17.0, 17.0, 7.0, 8.0, 10.0, 6.0, 7.0, 4.0, 1.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.375, -88.5634765625, -85.751953125, -82.9404296875, -80.12890625, -77.3173828125, -74.505859375, -71.6943359375, -68.8828125, -66.0712890625, -63.259765625, -60.4482421875, -57.63671875, -54.8251953125, -52.013671875, -49.2021484375, -46.390625, -43.5791015625, -40.767578125, -37.9560546875, -35.14453125, -32.3330078125, -29.521484375, -26.7099609375, -23.8984375, -21.0869140625, -18.275390625, -15.4638671875, -12.65234375, -9.8408203125, -7.029296875, -4.2177734375, -1.40625, 1.4052734375, 4.216796875, 7.0283203125, 9.83984375, 12.6513671875, 15.462890625, 18.2744140625, 21.0859375, 23.8974609375, 26.708984375, 29.5205078125, 32.33203125, 35.1435546875, 37.955078125, 40.7666015625, 43.578125, 46.3896484375, 49.201171875, 52.0126953125, 54.82421875, 57.6357421875, 60.447265625, 63.2587890625, 66.0703125, 68.8818359375, 71.693359375, 74.5048828125, 77.31640625, 80.1279296875, 82.939453125, 85.7509765625, 88.5625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 7.0, 14.0, 17.0, 23.0, 22.0, 21.0, 52.0, 42.0, 49.0, 79.0, 81.0, 119.0, 155.0, 222.0, 251.0, 340.0, 407.0, 412.0, 373.0, 296.0, 250.0, 174.0, 150.0, 122.0, 73.0, 53.0, 50.0, 41.0, 36.0, 30.0, 15.0, 10.0, 13.0, 14.0, 10.0, 8.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.359375, -27.481689453125, -26.60400390625, -25.726318359375, -24.8486328125, -23.970947265625, -23.09326171875, -22.215576171875, -21.337890625, -20.460205078125, -19.58251953125, -18.704833984375, -17.8271484375, -16.949462890625, -16.07177734375, -15.194091796875, -14.31640625, -13.438720703125, -12.56103515625, -11.683349609375, -10.8056640625, -9.927978515625, -9.05029296875, -8.172607421875, -7.294921875, -6.417236328125, -5.53955078125, -4.661865234375, -3.7841796875, -2.906494140625, -2.02880859375, -1.151123046875, -0.2734375, 0.604248046875, 1.48193359375, 2.359619140625, 3.2373046875, 4.114990234375, 4.99267578125, 5.870361328125, 6.748046875, 7.625732421875, 8.50341796875, 9.381103515625, 10.2587890625, 11.136474609375, 12.01416015625, 12.891845703125, 13.76953125, 14.647216796875, 15.52490234375, 16.402587890625, 17.2802734375, 18.157958984375, 19.03564453125, 19.913330078125, 20.791015625, 21.668701171875, 22.54638671875, 23.424072265625, 24.3017578125, 25.179443359375, 26.05712890625, 26.934814453125, 27.8125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 10.0, 14.0, 19.0, 19.0, 19.0, 37.0, 46.0, 63.0, 76.0, 92.0, 112.0, 157.0, 224.0, 490.0, 919.0, 14319.0, 4160819.0, 14426.0, 915.0, 474.0, 271.0, 173.0, 133.0, 117.0, 74.0, 58.0, 50.0, 35.0, 32.0, 24.0, 14.0, 8.0, 8.0, 6.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-185.625, -179.732421875, -173.83984375, -167.947265625, -162.0546875, -156.162109375, -150.26953125, -144.376953125, -138.484375, -132.591796875, -126.69921875, -120.806640625, -114.9140625, -109.021484375, -103.12890625, -97.236328125, -91.34375, -85.451171875, -79.55859375, -73.666015625, -67.7734375, -61.880859375, -55.98828125, -50.095703125, -44.203125, -38.310546875, -32.41796875, -26.525390625, -20.6328125, -14.740234375, -8.84765625, -2.955078125, 2.9375, 8.830078125, 14.72265625, 20.615234375, 26.5078125, 32.400390625, 38.29296875, 44.185546875, 50.078125, 55.970703125, 61.86328125, 67.755859375, 73.6484375, 79.541015625, 85.43359375, 91.326171875, 97.21875, 103.111328125, 109.00390625, 114.896484375, 120.7890625, 126.681640625, 132.57421875, 138.466796875, 144.359375, 150.251953125, 156.14453125, 162.037109375, 167.9296875, 173.822265625, 179.71484375, 185.607421875, 191.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 16.0, 64.0, 149.0, 221.0, 266.0, 169.0, 71.0, 40.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.3545227050781, -318.79656982421875, -311.2386169433594, -303.6806335449219, -296.1226806640625, -288.5647277832031, -281.00677490234375, -273.4488220214844, -265.890869140625, -258.3329162597656, -250.7749481201172, -243.2169952392578, -235.65902709960938, -228.10107421875, -220.54312133789062, -212.98516845703125, -205.42718505859375, -197.86923217773438, -190.31126403808594, -182.75331115722656, -175.19534301757812, -167.63739013671875, -160.07943725585938, -152.521484375, -144.96351623535156, -137.4055633544922, -129.84759521484375, -122.28964233398438, -114.73168182373047, -107.17372131347656, -99.61576843261719, -92.05780792236328, -84.49983215332031, -76.9418716430664, -69.3839111328125, -61.825958251953125, -54.26799774169922, -46.71003723144531, -39.15208053588867, -31.59412384033203, -24.036163330078125, -16.47820472717285, -8.920246124267578, -1.3622875213623047, 6.195671081542969, 13.753631591796875, 21.311588287353516, 28.869544982910156, 36.42750549316406, 43.98546600341797, 51.54342269897461, 59.10137939453125, 66.65933990478516, 74.21730041503906, 81.77525329589844, 89.33321380615234, 96.89117431640625, 104.44913482666016, 112.00709533691406, 119.56504821777344, 127.12300872802734, 134.68096923828125, 142.23892211914062, 149.796875, 157.35484313964844]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 8.0, 4.0, 9.0, 5.0, 8.0, 15.0, 17.0, 20.0, 18.0, 17.0, 17.0, 33.0, 35.0, 30.0, 40.0, 38.0, 33.0, 36.0, 58.0, 27.0, 42.0, 52.0, 49.0, 38.0, 40.0, 39.0, 31.0, 31.0, 31.0, 32.0, 30.0, 16.0, 21.0, 14.0, 15.0, 11.0, 8.0, 5.0, 8.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0], "bins": [-135.011474609375, -131.31752014160156, -127.62358093261719, -123.92963409423828, -120.23568725585938, -116.54173278808594, -112.84778594970703, -109.15383911132812, -105.45989227294922, -101.76594543457031, -98.0719985961914, -94.3780517578125, -90.68409729003906, -86.99015808105469, -83.29620361328125, -79.60225677490234, -75.90830993652344, -72.21436309814453, -68.52041625976562, -64.82646942138672, -61.13251876831055, -57.43857192993164, -53.74462127685547, -50.05067443847656, -46.356727600097656, -42.66278076171875, -38.968833923339844, -35.27488327026367, -31.580936431884766, -27.88698959350586, -24.19304084777832, -20.49909210205078, -16.805145263671875, -13.111197471618652, -9.41724967956543, -5.723301887512207, -2.0293540954589844, 1.6645927429199219, 5.358541488647461, 9.052490234375, 12.746437072753906, 16.440383911132812, 20.13433265686035, 23.82828140258789, 27.522228240966797, 31.216175079345703, 34.910125732421875, 38.60407257080078, 42.29801940917969, 45.991966247558594, 49.6859130859375, 53.37986373901367, 57.07381057739258, 60.767757415771484, 64.46170806884766, 68.15565490722656, 71.84960174560547, 75.54354858398438, 79.23749542236328, 82.93144226074219, 86.62539672851562, 90.3193359375, 94.01329040527344, 97.70723724365234, 101.40118408203125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 9.0, 10.0, 16.0, 11.0, 11.0, 13.0, 15.0, 30.0, 27.0, 35.0, 34.0, 47.0, 31.0, 35.0, 38.0, 64.0, 52.0, 48.0, 46.0, 35.0, 40.0, 53.0, 31.0, 25.0, 38.0, 29.0, 30.0, 21.0, 16.0, 26.0, 11.0, 10.0, 9.0, 13.0, 8.0, 2.0, 5.0, 2.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.78125, -16.2791748046875, -15.777099609375, -15.2750244140625, -14.77294921875, -14.2708740234375, -13.768798828125, -13.2667236328125, -12.7646484375, -12.2625732421875, -11.760498046875, -11.2584228515625, -10.75634765625, -10.2542724609375, -9.752197265625, -9.2501220703125, -8.748046875, -8.2459716796875, -7.743896484375, -7.2418212890625, -6.73974609375, -6.2376708984375, -5.735595703125, -5.2335205078125, -4.7314453125, -4.2293701171875, -3.727294921875, -3.2252197265625, -2.72314453125, -2.2210693359375, -1.718994140625, -1.2169189453125, -0.71484375, -0.2127685546875, 0.289306640625, 0.7913818359375, 1.29345703125, 1.7955322265625, 2.297607421875, 2.7996826171875, 3.3017578125, 3.8038330078125, 4.305908203125, 4.8079833984375, 5.31005859375, 5.8121337890625, 6.314208984375, 6.8162841796875, 7.318359375, 7.8204345703125, 8.322509765625, 8.8245849609375, 9.32666015625, 9.8287353515625, 10.330810546875, 10.8328857421875, 11.3349609375, 11.8370361328125, 12.339111328125, 12.8411865234375, 13.34326171875, 13.8453369140625, 14.347412109375, 14.8494873046875, 15.3515625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 13.0, 16.0, 17.0, 25.0, 50.0, 60.0, 86.0, 146.0, 195.0, 297.0, 400.0, 585.0, 856.0, 1319.0, 1883.0, 2887.0, 4333.0, 6742.0, 10666.0, 16468.0, 26306.0, 43472.0, 73503.0, 138267.0, 337098.0, 168659.0, 83069.0, 49254.0, 29787.0, 18441.0, 11651.0, 7514.0, 4884.0, 3074.0, 2193.0, 1297.0, 984.0, 660.0, 428.0, 285.0, 210.0, 125.0, 97.0, 74.0, 55.0, 41.0, 29.0, 19.0, 7.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0], "bins": [-4.12109375, -3.998504638671875, -3.87591552734375, -3.753326416015625, -3.6307373046875, -3.508148193359375, -3.38555908203125, -3.262969970703125, -3.140380859375, -3.017791748046875, -2.89520263671875, -2.772613525390625, -2.6500244140625, -2.527435302734375, -2.40484619140625, -2.282257080078125, -2.15966796875, -2.037078857421875, -1.91448974609375, -1.791900634765625, -1.6693115234375, -1.546722412109375, -1.42413330078125, -1.301544189453125, -1.178955078125, -1.056365966796875, -0.93377685546875, -0.811187744140625, -0.6885986328125, -0.566009521484375, -0.44342041015625, -0.320831298828125, -0.1982421875, -0.075653076171875, 0.04693603515625, 0.169525146484375, 0.2921142578125, 0.414703369140625, 0.53729248046875, 0.659881591796875, 0.782470703125, 0.905059814453125, 1.02764892578125, 1.150238037109375, 1.2728271484375, 1.395416259765625, 1.51800537109375, 1.640594482421875, 1.76318359375, 1.885772705078125, 2.00836181640625, 2.130950927734375, 2.2535400390625, 2.376129150390625, 2.49871826171875, 2.621307373046875, 2.743896484375, 2.866485595703125, 2.98907470703125, 3.111663818359375, 3.2342529296875, 3.356842041015625, 3.47943115234375, 3.602020263671875, 3.724609375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 9.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 12.0, 16.0, 14.0, 22.0, 25.0, 23.0, 19.0, 33.0, 25.0, 48.0, 40.0, 36.0, 46.0, 54.0, 1063.0, 47.0, 48.0, 60.0, 45.0, 41.0, 45.0, 33.0, 39.0, 31.0, 35.0, 14.0, 21.0, 16.0, 5.0, 15.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.402099609375, -9.06201171875, -8.721923828125, -8.3818359375, -8.041748046875, -7.70166015625, -7.361572265625, -7.021484375, -6.681396484375, -6.34130859375, -6.001220703125, -5.6611328125, -5.321044921875, -4.98095703125, -4.640869140625, -4.30078125, -3.960693359375, -3.62060546875, -3.280517578125, -2.9404296875, -2.600341796875, -2.26025390625, -1.920166015625, -1.580078125, -1.239990234375, -0.89990234375, -0.559814453125, -0.2197265625, 0.120361328125, 0.46044921875, 0.800537109375, 1.140625, 1.480712890625, 1.82080078125, 2.160888671875, 2.5009765625, 2.841064453125, 3.18115234375, 3.521240234375, 3.861328125, 4.201416015625, 4.54150390625, 4.881591796875, 5.2216796875, 5.561767578125, 5.90185546875, 6.241943359375, 6.58203125, 6.922119140625, 7.26220703125, 7.602294921875, 7.9423828125, 8.282470703125, 8.62255859375, 8.962646484375, 9.302734375, 9.642822265625, 9.98291015625, 10.322998046875, 10.6630859375, 11.003173828125, 11.34326171875, 11.683349609375, 12.0234375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 10.0, 11.0, 23.0, 26.0, 39.0, 44.0, 72.0, 119.0, 159.0, 271.0, 360.0, 536.0, 927.0, 1519.0, 2354.0, 3796.0, 6538.0, 11395.0, 19938.0, 36346.0, 67318.0, 137690.0, 1424705.0, 191938.0, 86240.0, 45633.0, 24862.0, 13912.0, 8001.0, 4623.0, 2779.0, 1798.0, 1089.0, 701.0, 428.0, 309.0, 208.0, 131.0, 94.0, 53.0, 47.0, 21.0, 26.0, 14.0, 13.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.7265625, -4.58197021484375, -4.4373779296875, -4.29278564453125, -4.148193359375, -4.00360107421875, -3.8590087890625, -3.71441650390625, -3.56982421875, -3.42523193359375, -3.2806396484375, -3.13604736328125, -2.991455078125, -2.84686279296875, -2.7022705078125, -2.55767822265625, -2.4130859375, -2.26849365234375, -2.1239013671875, -1.97930908203125, -1.834716796875, -1.69012451171875, -1.5455322265625, -1.40093994140625, -1.25634765625, -1.11175537109375, -0.9671630859375, -0.82257080078125, -0.677978515625, -0.53338623046875, -0.3887939453125, -0.24420166015625, -0.099609375, 0.04498291015625, 0.1895751953125, 0.33416748046875, 0.478759765625, 0.62335205078125, 0.7679443359375, 0.91253662109375, 1.05712890625, 1.20172119140625, 1.3463134765625, 1.49090576171875, 1.635498046875, 1.78009033203125, 1.9246826171875, 2.06927490234375, 2.2138671875, 2.35845947265625, 2.5030517578125, 2.64764404296875, 2.792236328125, 2.93682861328125, 3.0814208984375, 3.22601318359375, 3.37060546875, 3.51519775390625, 3.6597900390625, 3.80438232421875, 3.948974609375, 4.09356689453125, 4.2381591796875, 4.38275146484375, 4.52734375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 6.0, 1.0, 6.0, 4.0, 8.0, 8.0, 12.0, 15.0, 15.0, 21.0, 18.0, 35.0, 61.0, 68.0, 80.0, 98.0, 118.0, 99.0, 75.0, 63.0, 48.0, 27.0, 24.0, 16.0, 13.0, 18.0, 17.0, 5.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.002727508544921875, -0.0026548057794570923, -0.0025821030139923096, -0.002509400248527527, -0.002436697483062744, -0.0023639947175979614, -0.0022912919521331787, -0.002218589186668396, -0.0021458864212036133, -0.0020731836557388306, -0.002000480890274048, -0.0019277781248092651, -0.0018550753593444824, -0.0017823725938796997, -0.001709669828414917, -0.0016369670629501343, -0.0015642642974853516, -0.0014915615320205688, -0.0014188587665557861, -0.0013461560010910034, -0.0012734532356262207, -0.001200750470161438, -0.0011280477046966553, -0.0010553449392318726, -0.0009826421737670898, -0.0009099394083023071, -0.0008372366428375244, -0.0007645338773727417, -0.000691831111907959, -0.0006191283464431763, -0.0005464255809783936, -0.00047372281551361084, -0.0004010200500488281, -0.0003283172845840454, -0.0002556145191192627, -0.00018291175365447998, -0.00011020898818969727, -3.750622272491455e-05, 3.5196542739868164e-05, 0.00010789930820465088, 0.0001806020736694336, 0.0002533048391342163, 0.000326007604598999, 0.00039871037006378174, 0.00047141313552856445, 0.0005441159009933472, 0.0006168186664581299, 0.0006895214319229126, 0.0007622241973876953, 0.000834926962852478, 0.0009076297283172607, 0.0009803324937820435, 0.0010530352592468262, 0.0011257380247116089, 0.0011984407901763916, 0.0012711435556411743, 0.001343846321105957, 0.0014165490865707397, 0.0014892518520355225, 0.0015619546175003052, 0.0016346573829650879, 0.0017073601484298706, 0.0017800629138946533, 0.001852765679359436, 0.0019254684448242188]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 9.0, 16.0, 9.0, 27.0, 20.0, 28.0, 24.0, 36.0, 66.0, 114.0, 238.0, 467.0, 4702.0, 1036799.0, 4785.0, 523.0, 233.0, 121.0, 75.0, 47.0, 44.0, 21.0, 31.0, 20.0, 14.0, 6.0, 11.0, 6.0, 6.0, 1.0, 10.0, 7.0, 2.0, 0.0, 2.0, 0.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.042388916015625, -0.04078960418701172, -0.03919029235839844, -0.037590980529785156, -0.035991668701171875, -0.034392356872558594, -0.03279304504394531, -0.03119373321533203, -0.02959442138671875, -0.02799510955810547, -0.026395797729492188, -0.024796485900878906, -0.023197174072265625, -0.021597862243652344, -0.019998550415039062, -0.01839923858642578, -0.0167999267578125, -0.015200614929199219, -0.013601303100585938, -0.012001991271972656, -0.010402679443359375, -0.008803367614746094, -0.0072040557861328125, -0.005604743957519531, -0.00400543212890625, -0.0024061203002929688, -0.0008068084716796875, 0.0007925033569335938, 0.002391815185546875, 0.003991127014160156, 0.0055904388427734375, 0.007189750671386719, 0.0087890625, 0.010388374328613281, 0.011987686157226562, 0.013586997985839844, 0.015186309814453125, 0.016785621643066406, 0.018384933471679688, 0.01998424530029297, 0.02158355712890625, 0.02318286895751953, 0.024782180786132812, 0.026381492614746094, 0.027980804443359375, 0.029580116271972656, 0.031179428100585938, 0.03277873992919922, 0.0343780517578125, 0.03597736358642578, 0.03757667541503906, 0.039175987243652344, 0.040775299072265625, 0.042374610900878906, 0.04397392272949219, 0.04557323455810547, 0.04717254638671875, 0.04877185821533203, 0.05037117004394531, 0.051970481872558594, 0.053569793701171875, 0.055169105529785156, 0.05676841735839844, 0.05836772918701172, 0.059967041015625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 11.0, 33.0, 29.0, 61.0, 90.0, 102.0, 129.0, 116.0, 102.0, 102.0, 71.0, 53.0, 37.0, 15.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005632064421661198, -0.0005305611412040889, -0.000497915840242058, -0.0004652705101761967, -0.0004326252092141658, -0.0003999799082521349, -0.0003673345781862736, -0.0003346892772242427, -0.0003020439762622118, -0.0002693986753001809, -0.0002367533597862348, -0.00020410804427228868, -0.0001714627433102578, -0.0001388174423482269, -0.00010617212683428079, -7.352681132033467e-05, -4.0881510358303785e-05, -8.236202120315284e-06, 2.4409106117673218e-05, 5.705441435566172e-05, 8.969972259365022e-05, 0.0001223450235556811, 0.00015499033906962723, 0.00018763565458357334, 0.00022028095554560423, 0.0002529262565076351, 0.000285571557469666, 0.00031821688753552735, 0.00035086218849755824, 0.0003835074894595891, 0.00041615281952545047, 0.00044879812048748136, 0.00048144336324185133, 0.0005140886642038822, 0.0005467339651659131, 0.000579379266127944, 0.0006120245670899749, 0.0006446698680520058, 0.0006773152272216976, 0.0007099605281837285, 0.0007426058291457593, 0.0007752511301077902, 0.0008078964310698211, 0.000840541732031852, 0.0008731870912015438, 0.0009058323921635747, 0.0009384776931256056, 0.0009711229940876365, 0.0010037682950496674, 0.0010364135960116982, 0.0010690588969737291, 0.00110170419793576, 0.001134349498897791, 0.0011669947998598218, 0.0011996401008218527, 0.0012322855181992054, 0.0012649307027459145, 0.0012975760037079453, 0.0013302213046699762, 0.0013628666056320071, 0.001395511906594038, 0.001428157207556069, 0.0014608025085180998, 0.0014934479258954525, 0.0015260932268574834]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 9.0, 7.0, 5.0, 4.0, 9.0, 13.0, 6.0, 15.0, 29.0, 17.0, 28.0, 25.0, 19.0, 33.0, 43.0, 40.0, 32.0, 40.0, 41.0, 52.0, 31.0, 44.0, 33.0, 34.0, 37.0, 36.0, 33.0, 30.0, 34.0, 33.0, 28.0, 14.0, 24.0, 18.0, 19.0, 18.0, 12.0, 11.0, 8.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0010229945182800293, -0.0009929127991199493, -0.0009628310799598694, -0.0009327493607997894, -0.0009026676416397095, -0.0008725859224796295, -0.0008425042033195496, -0.0008124224841594696, -0.0007823407649993896, -0.0007522590458393097, -0.0007221773266792297, -0.0006920956075191498, -0.0006620138883590698, -0.0006319321691989899, -0.0006018504500389099, -0.00057176873087883, -0.00054168701171875, -0.00051160529255867, -0.0004815235733985901, -0.00045144185423851013, -0.0004213601350784302, -0.0003912784159183502, -0.00036119669675827026, -0.0003311149775981903, -0.00030103325843811035, -0.0002709515392780304, -0.00024086982011795044, -0.00021078810095787048, -0.00018070638179779053, -0.00015062466263771057, -0.00012054294347763062, -9.046122431755066e-05, -6.03795051574707e-05, -3.0297785997390747e-05, -2.1606683731079102e-07, 2.9865652322769165e-05, 5.994737148284912e-05, 9.002909064292908e-05, 0.00012011080980300903, 0.000150192528963089, 0.00018027424812316895, 0.0002103559672832489, 0.00024043768644332886, 0.0002705194056034088, 0.00030060112476348877, 0.0003306828439235687, 0.0003607645630836487, 0.00039084628224372864, 0.0004209280014038086, 0.00045100972056388855, 0.0004810914397239685, 0.0005111731588840485, 0.0005412548780441284, 0.0005713365972042084, 0.0006014183163642883, 0.0006315000355243683, 0.0006615817546844482, 0.0006916634738445282, 0.0007217451930046082, 0.0007518269121646881, 0.0007819086313247681, 0.000811990350484848, 0.000842072069644928, 0.0008721537888050079, 0.0009022355079650879]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 9.0, 10.0, 16.0, 11.0, 11.0, 13.0, 15.0, 30.0, 27.0, 35.0, 34.0, 47.0, 31.0, 35.0, 38.0, 64.0, 52.0, 48.0, 46.0, 35.0, 40.0, 53.0, 31.0, 25.0, 38.0, 29.0, 30.0, 21.0, 16.0, 26.0, 11.0, 10.0, 9.0, 13.0, 8.0, 2.0, 5.0, 2.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.78125, -16.2791748046875, -15.777099609375, -15.2750244140625, -14.77294921875, -14.2708740234375, -13.768798828125, -13.2667236328125, -12.7646484375, -12.2625732421875, -11.760498046875, -11.2584228515625, -10.75634765625, -10.2542724609375, -9.752197265625, -9.2501220703125, -8.748046875, -8.2459716796875, -7.743896484375, -7.2418212890625, -6.73974609375, -6.2376708984375, -5.735595703125, -5.2335205078125, -4.7314453125, -4.2293701171875, -3.727294921875, -3.2252197265625, -2.72314453125, -2.2210693359375, -1.718994140625, -1.2169189453125, -0.71484375, -0.2127685546875, 0.289306640625, 0.7913818359375, 1.29345703125, 1.7955322265625, 2.297607421875, 2.7996826171875, 3.3017578125, 3.8038330078125, 4.305908203125, 4.8079833984375, 5.31005859375, 5.8121337890625, 6.314208984375, 6.8162841796875, 7.318359375, 7.8204345703125, 8.322509765625, 8.8245849609375, 9.32666015625, 9.8287353515625, 10.330810546875, 10.8328857421875, 11.3349609375, 11.8370361328125, 12.339111328125, 12.8411865234375, 13.34326171875, 13.8453369140625, 14.347412109375, 14.8494873046875, 15.3515625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 10.0, 17.0, 18.0, 25.0, 53.0, 79.0, 124.0, 173.0, 321.0, 462.0, 678.0, 1016.0, 1549.0, 2511.0, 4037.0, 6703.0, 11925.0, 21273.0, 41509.0, 88424.0, 211200.0, 359736.0, 153924.0, 67898.0, 32921.0, 17307.0, 9680.0, 5508.0, 3395.0, 2097.0, 1344.0, 865.0, 610.0, 403.0, 280.0, 163.0, 110.0, 75.0, 40.0, 23.0, 25.0, 14.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.4443359375, -6.224609375, -6.0048828125, -5.78515625, -5.5654296875, -5.345703125, -5.1259765625, -4.90625, -4.6865234375, -4.466796875, -4.2470703125, -4.02734375, -3.8076171875, -3.587890625, -3.3681640625, -3.1484375, -2.9287109375, -2.708984375, -2.4892578125, -2.26953125, -2.0498046875, -1.830078125, -1.6103515625, -1.390625, -1.1708984375, -0.951171875, -0.7314453125, -0.51171875, -0.2919921875, -0.072265625, 0.1474609375, 0.3671875, 0.5869140625, 0.806640625, 1.0263671875, 1.24609375, 1.4658203125, 1.685546875, 1.9052734375, 2.125, 2.3447265625, 2.564453125, 2.7841796875, 3.00390625, 3.2236328125, 3.443359375, 3.6630859375, 3.8828125, 4.1025390625, 4.322265625, 4.5419921875, 4.76171875, 4.9814453125, 5.201171875, 5.4208984375, 5.640625, 5.8603515625, 6.080078125, 6.2998046875, 6.51953125, 6.7392578125, 6.958984375, 7.1787109375, 7.3984375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 4.0, 8.0, 7.0, 7.0, 6.0, 10.0, 13.0, 16.0, 14.0, 28.0, 29.0, 22.0, 39.0, 25.0, 32.0, 44.0, 43.0, 45.0, 47.0, 164.0, 1715.0, 209.0, 83.0, 55.0, 47.0, 41.0, 35.0, 39.0, 39.0, 23.0, 22.0, 14.0, 25.0, 19.0, 17.0, 11.0, 8.0, 8.0, 5.0, 9.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.71875, -45.98876953125, -44.2587890625, -42.52880859375, -40.798828125, -39.06884765625, -37.3388671875, -35.60888671875, -33.87890625, -32.14892578125, -30.4189453125, -28.68896484375, -26.958984375, -25.22900390625, -23.4990234375, -21.76904296875, -20.0390625, -18.30908203125, -16.5791015625, -14.84912109375, -13.119140625, -11.38916015625, -9.6591796875, -7.92919921875, -6.19921875, -4.46923828125, -2.7392578125, -1.00927734375, 0.720703125, 2.45068359375, 4.1806640625, 5.91064453125, 7.640625, 9.37060546875, 11.1005859375, 12.83056640625, 14.560546875, 16.29052734375, 18.0205078125, 19.75048828125, 21.48046875, 23.21044921875, 24.9404296875, 26.67041015625, 28.400390625, 30.13037109375, 31.8603515625, 33.59033203125, 35.3203125, 37.05029296875, 38.7802734375, 40.51025390625, 42.240234375, 43.97021484375, 45.7001953125, 47.43017578125, 49.16015625, 50.89013671875, 52.6201171875, 54.35009765625, 56.080078125, 57.81005859375, 59.5400390625, 61.27001953125, 63.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 7.0, 11.0, 15.0, 14.0, 21.0, 33.0, 39.0, 70.0, 83.0, 114.0, 188.0, 290.0, 519.0, 1959.0, 2593134.0, 546301.0, 1569.0, 509.0, 277.0, 172.0, 117.0, 75.0, 58.0, 38.0, 22.0, 18.0, 13.0, 12.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.5, -127.759765625, -123.01953125, -118.279296875, -113.5390625, -108.798828125, -104.05859375, -99.318359375, -94.578125, -89.837890625, -85.09765625, -80.357421875, -75.6171875, -70.876953125, -66.13671875, -61.396484375, -56.65625, -51.916015625, -47.17578125, -42.435546875, -37.6953125, -32.955078125, -28.21484375, -23.474609375, -18.734375, -13.994140625, -9.25390625, -4.513671875, 0.2265625, 4.966796875, 9.70703125, 14.447265625, 19.1875, 23.927734375, 28.66796875, 33.408203125, 38.1484375, 42.888671875, 47.62890625, 52.369140625, 57.109375, 61.849609375, 66.58984375, 71.330078125, 76.0703125, 80.810546875, 85.55078125, 90.291015625, 95.03125, 99.771484375, 104.51171875, 109.251953125, 113.9921875, 118.732421875, 123.47265625, 128.212890625, 132.953125, 137.693359375, 142.43359375, 147.173828125, 151.9140625, 156.654296875, 161.39453125, 166.134765625, 170.875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 32.0, 253.0, 578.0, 139.0, 13.0, 5.0], "bins": [-497.0633544921875, -488.82061767578125, -480.5779113769531, -472.335205078125, -464.09246826171875, -455.8497314453125, -447.6070251464844, -439.36431884765625, -431.12158203125, -422.87884521484375, -414.6361389160156, -406.3934326171875, -398.15069580078125, -389.907958984375, -381.6652526855469, -373.42254638671875, -365.1798095703125, -356.93707275390625, -348.6943664550781, -340.45166015625, -332.20892333984375, -323.9661865234375, -315.7234802246094, -307.48077392578125, -299.238037109375, -290.99530029296875, -282.7525939941406, -274.5098876953125, -266.26715087890625, -258.0244140625, -249.78170776367188, -241.5389862060547, -233.29623413085938, -225.0535125732422, -216.810791015625, -208.5680694580078, -200.32534790039062, -192.08262634277344, -183.83990478515625, -175.59718322753906, -167.35446166992188, -159.1117401123047, -150.8690185546875, -142.6262969970703, -134.38357543945312, -126.14085388183594, -117.89813232421875, -109.65541076660156, -101.4126968383789, -93.16997528076172, -84.92725372314453, -76.68453216552734, -68.44181060791016, -60.19908905029297, -51.95636749267578, -43.713645935058594, -35.470924377441406, -27.22820281982422, -18.98548126220703, -10.742759704589844, -2.5000381469726562, 5.742683410644531, 13.985404968261719, 22.228126525878906, 30.470849990844727]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 3.0, 8.0, 12.0, 9.0, 12.0, 7.0, 16.0, 13.0, 16.0, 17.0, 28.0, 22.0, 22.0, 29.0, 46.0, 36.0, 36.0, 37.0, 49.0, 36.0, 41.0, 40.0, 36.0, 36.0, 42.0, 32.0, 37.0, 34.0, 38.0, 26.0, 21.0, 26.0, 19.0, 25.0, 23.0, 8.0, 5.0, 11.0, 10.0, 7.0, 9.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-162.701904296875, -157.92788696289062, -153.1538543701172, -148.3798370361328, -143.60581970214844, -138.831787109375, -134.05776977539062, -129.28375244140625, -124.50972747802734, -119.73570251464844, -114.96168518066406, -110.18766021728516, -105.41363525390625, -100.63961791992188, -95.86559295654297, -91.09156799316406, -86.31755065917969, -81.54352569580078, -76.7695083618164, -71.9954833984375, -67.22146606445312, -62.44744110107422, -57.67341613769531, -52.89939498901367, -48.12537384033203, -43.35135269165039, -38.57733154296875, -33.803306579589844, -29.029285430908203, -24.255264282226562, -19.48124122619629, -14.707218170166016, -9.933197021484375, -5.159174919128418, -0.38515281677246094, 4.388869285583496, 9.162891387939453, 13.936912536621094, 18.710935592651367, 23.48495864868164, 28.25897979736328, 33.03300094604492, 37.80702209472656, 42.58104705810547, 47.35506820678711, 52.12908935546875, 56.903114318847656, 61.6771354675293, 66.45115661621094, 71.22518157958984, 75.99919891357422, 80.77322387695312, 85.5472412109375, 90.3212661743164, 95.09529113769531, 99.86930847167969, 104.6433334350586, 109.4173583984375, 114.19137573242188, 118.96540069580078, 123.73942565917969, 128.51344299316406, 133.28746032714844, 138.06149291992188, 142.83551025390625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 7.0, 18.0, 13.0, 12.0, 13.0, 15.0, 26.0, 19.0, 39.0, 34.0, 32.0, 41.0, 38.0, 40.0, 39.0, 48.0, 36.0, 47.0, 52.0, 44.0, 36.0, 34.0, 37.0, 36.0, 27.0, 29.0, 23.0, 25.0, 18.0, 17.0, 13.0, 10.0, 10.0, 9.0, 10.0, 8.0, 4.0, 4.0, 5.0, 0.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.6171875, -15.1290283203125, -14.640869140625, -14.1527099609375, -13.66455078125, -13.1763916015625, -12.688232421875, -12.2000732421875, -11.7119140625, -11.2237548828125, -10.735595703125, -10.2474365234375, -9.75927734375, -9.2711181640625, -8.782958984375, -8.2947998046875, -7.806640625, -7.3184814453125, -6.830322265625, -6.3421630859375, -5.85400390625, -5.3658447265625, -4.877685546875, -4.3895263671875, -3.9013671875, -3.4132080078125, -2.925048828125, -2.4368896484375, -1.94873046875, -1.4605712890625, -0.972412109375, -0.4842529296875, 0.00390625, 0.4920654296875, 0.980224609375, 1.4683837890625, 1.95654296875, 2.4447021484375, 2.932861328125, 3.4210205078125, 3.9091796875, 4.3973388671875, 4.885498046875, 5.3736572265625, 5.86181640625, 6.3499755859375, 6.838134765625, 7.3262939453125, 7.814453125, 8.3026123046875, 8.790771484375, 9.2789306640625, 9.76708984375, 10.2552490234375, 10.743408203125, 11.2315673828125, 11.7197265625, 12.2078857421875, 12.696044921875, 13.1842041015625, 13.67236328125, 14.1605224609375, 14.648681640625, 15.1368408203125, 15.625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 12.0, 7.0, 11.0, 7.0, 15.0, 25.0, 28.0, 35.0, 48.0, 58.0, 91.0, 124.0, 202.0, 282.0, 485.0, 964.0, 2206.0, 5982.0, 21980.0, 100787.0, 469569.0, 1485570.0, 1495671.0, 481042.0, 97269.0, 21208.0, 5968.0, 2237.0, 985.0, 481.0, 278.0, 185.0, 125.0, 93.0, 65.0, 45.0, 39.0, 23.0, 23.0, 17.0, 10.0, 9.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703125, -16.127197265625, -15.55126953125, -14.975341796875, -14.3994140625, -13.823486328125, -13.24755859375, -12.671630859375, -12.095703125, -11.519775390625, -10.94384765625, -10.367919921875, -9.7919921875, -9.216064453125, -8.64013671875, -8.064208984375, -7.48828125, -6.912353515625, -6.33642578125, -5.760498046875, -5.1845703125, -4.608642578125, -4.03271484375, -3.456787109375, -2.880859375, -2.304931640625, -1.72900390625, -1.153076171875, -0.5771484375, -0.001220703125, 0.57470703125, 1.150634765625, 1.7265625, 2.302490234375, 2.87841796875, 3.454345703125, 4.0302734375, 4.606201171875, 5.18212890625, 5.758056640625, 6.333984375, 6.909912109375, 7.48583984375, 8.061767578125, 8.6376953125, 9.213623046875, 9.78955078125, 10.365478515625, 10.94140625, 11.517333984375, 12.09326171875, 12.669189453125, 13.2451171875, 13.821044921875, 14.39697265625, 14.972900390625, 15.548828125, 16.124755859375, 16.70068359375, 17.276611328125, 17.8525390625, 18.428466796875, 19.00439453125, 19.580322265625, 20.15625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 12.0, 18.0, 39.0, 68.0, 117.0, 189.0, 313.0, 560.0, 808.0, 817.0, 491.0, 284.0, 155.0, 86.0, 65.0, 26.0, 14.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.65625, -59.66162109375, -57.6669921875, -55.67236328125, -53.677734375, -51.68310546875, -49.6884765625, -47.69384765625, -45.69921875, -43.70458984375, -41.7099609375, -39.71533203125, -37.720703125, -35.72607421875, -33.7314453125, -31.73681640625, -29.7421875, -27.74755859375, -25.7529296875, -23.75830078125, -21.763671875, -19.76904296875, -17.7744140625, -15.77978515625, -13.78515625, -11.79052734375, -9.7958984375, -7.80126953125, -5.806640625, -3.81201171875, -1.8173828125, 0.17724609375, 2.171875, 4.16650390625, 6.1611328125, 8.15576171875, 10.150390625, 12.14501953125, 14.1396484375, 16.13427734375, 18.12890625, 20.12353515625, 22.1181640625, 24.11279296875, 26.107421875, 28.10205078125, 30.0966796875, 32.09130859375, 34.0859375, 36.08056640625, 38.0751953125, 40.06982421875, 42.064453125, 44.05908203125, 46.0537109375, 48.04833984375, 50.04296875, 52.03759765625, 54.0322265625, 56.02685546875, 58.021484375, 60.01611328125, 62.0107421875, 64.00537109375, 66.0]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 13.0, 11.0, 19.0, 32.0, 36.0, 54.0, 52.0, 58.0, 103.0, 146.0, 245.0, 411.0, 945.0, 13148.0, 4165412.0, 11367.0, 904.0, 432.0, 231.0, 172.0, 103.0, 82.0, 51.0, 64.0, 38.0, 27.0, 22.0, 14.0, 15.0, 14.0, 9.0, 11.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-178.5, -172.447265625, -166.39453125, -160.341796875, -154.2890625, -148.236328125, -142.18359375, -136.130859375, -130.078125, -124.025390625, -117.97265625, -111.919921875, -105.8671875, -99.814453125, -93.76171875, -87.708984375, -81.65625, -75.603515625, -69.55078125, -63.498046875, -57.4453125, -51.392578125, -45.33984375, -39.287109375, -33.234375, -27.181640625, -21.12890625, -15.076171875, -9.0234375, -2.970703125, 3.08203125, 9.134765625, 15.1875, 21.240234375, 27.29296875, 33.345703125, 39.3984375, 45.451171875, 51.50390625, 57.556640625, 63.609375, 69.662109375, 75.71484375, 81.767578125, 87.8203125, 93.873046875, 99.92578125, 105.978515625, 112.03125, 118.083984375, 124.13671875, 130.189453125, 136.2421875, 142.294921875, 148.34765625, 154.400390625, 160.453125, 166.505859375, 172.55859375, 178.611328125, 184.6640625, 190.716796875, 196.76953125, 202.822265625, 208.875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 13.0, 37.0, 44.0, 78.0, 98.0, 131.0, 138.0, 128.0, 107.0, 97.0, 61.0, 36.0, 16.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.12973022460938, -164.7701873779297, -160.41064453125, -156.05111694335938, -151.6915740966797, -147.33203125, -142.9724884033203, -138.61294555664062, -134.25341796875, -129.8938751220703, -125.53433990478516, -121.17479705810547, -116.81526184082031, -112.45571899414062, -108.09617614746094, -103.73663330078125, -99.37709045410156, -95.01754760742188, -90.65801239013672, -86.29846954345703, -81.93893432617188, -77.57939147949219, -73.2198486328125, -68.86030578613281, -64.50077056884766, -60.141231536865234, -55.78169250488281, -51.422149658203125, -47.0626106262207, -42.70307159423828, -38.343528747558594, -33.98398971557617, -29.62445068359375, -25.264911651611328, -20.905370712280273, -16.54582977294922, -12.186290740966797, -7.826751708984375, -3.4672107696533203, 0.8923301696777344, 5.251869201660156, 9.611409187316895, 13.970949172973633, 18.330490112304688, 22.69002914428711, 27.04956817626953, 31.409109115600586, 35.76865005493164, 40.12818908691406, 44.487728118896484, 48.847267150878906, 53.206809997558594, 57.566349029541016, 61.92588806152344, 66.28543090820312, 70.64497375488281, 75.00450897216797, 79.36405181884766, 83.72358703613281, 88.0831298828125, 92.44267272949219, 96.80220794677734, 101.16175079345703, 105.52128601074219, 109.88082885742188]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 10.0, 16.0, 16.0, 10.0, 12.0, 25.0, 16.0, 24.0, 32.0, 32.0, 31.0, 25.0, 30.0, 26.0, 41.0, 47.0, 39.0, 35.0, 36.0, 53.0, 40.0, 28.0, 46.0, 28.0, 37.0, 22.0, 30.0, 26.0, 27.0, 13.0, 25.0, 13.0, 10.0, 16.0, 16.0, 14.0, 15.0, 3.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-128.8302001953125, -125.22200012207031, -121.61380767822266, -118.005615234375, -114.39741516113281, -110.78921508789062, -107.18102264404297, -103.57283020019531, -99.96463012695312, -96.35643005371094, -92.74823760986328, -89.14004516601562, -85.53184509277344, -81.92364501953125, -78.3154525756836, -74.70726013183594, -71.09906005859375, -67.49085998535156, -63.882667541503906, -60.274471282958984, -56.66627502441406, -53.05807876586914, -49.44988250732422, -45.8416862487793, -42.233489990234375, -38.62529373168945, -35.01709747314453, -31.40890121459961, -27.800704956054688, -24.192508697509766, -20.584312438964844, -16.976116180419922, -13.367919921875, -9.759723663330078, -6.151527404785156, -2.5433311462402344, 1.0648651123046875, 4.673061370849609, 8.281257629394531, 11.889453887939453, 15.497650146484375, 19.105846405029297, 22.71404266357422, 26.32223892211914, 29.930435180664062, 33.538631439208984, 37.146827697753906, 40.75502395629883, 44.36322021484375, 47.97141647338867, 51.579612731933594, 55.187808990478516, 58.79600524902344, 62.40420150756836, 66.01239776611328, 69.62059020996094, 73.22879028320312, 76.83699035644531, 80.44518280029297, 84.05337524414062, 87.66157531738281, 91.269775390625, 94.87796783447266, 98.48616027832031, 102.0943603515625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 15.0, 9.0, 9.0, 10.0, 12.0, 17.0, 15.0, 19.0, 23.0, 31.0, 26.0, 43.0, 28.0, 38.0, 43.0, 39.0, 45.0, 46.0, 51.0, 48.0, 42.0, 38.0, 45.0, 23.0, 33.0, 33.0, 35.0, 22.0, 29.0, 21.0, 15.0, 11.0, 16.0, 9.0, 8.0, 14.0, 9.0, 6.0, 4.0, 0.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.90625, -14.418212890625, -13.93017578125, -13.442138671875, -12.9541015625, -12.466064453125, -11.97802734375, -11.489990234375, -11.001953125, -10.513916015625, -10.02587890625, -9.537841796875, -9.0498046875, -8.561767578125, -8.07373046875, -7.585693359375, -7.09765625, -6.609619140625, -6.12158203125, -5.633544921875, -5.1455078125, -4.657470703125, -4.16943359375, -3.681396484375, -3.193359375, -2.705322265625, -2.21728515625, -1.729248046875, -1.2412109375, -0.753173828125, -0.26513671875, 0.222900390625, 0.7109375, 1.198974609375, 1.68701171875, 2.175048828125, 2.6630859375, 3.151123046875, 3.63916015625, 4.127197265625, 4.615234375, 5.103271484375, 5.59130859375, 6.079345703125, 6.5673828125, 7.055419921875, 7.54345703125, 8.031494140625, 8.51953125, 9.007568359375, 9.49560546875, 9.983642578125, 10.4716796875, 10.959716796875, 11.44775390625, 11.935791015625, 12.423828125, 12.911865234375, 13.39990234375, 13.887939453125, 14.3759765625, 14.864013671875, 15.35205078125, 15.840087890625, 16.328125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 8.0, 13.0, 16.0, 22.0, 50.0, 59.0, 80.0, 122.0, 195.0, 254.0, 400.0, 642.0, 946.0, 1415.0, 2165.0, 3300.0, 5105.0, 7973.0, 12129.0, 19429.0, 31392.0, 51927.0, 89843.0, 198465.0, 339095.0, 116622.0, 63746.0, 38341.0, 23488.0, 14581.0, 9348.0, 6064.0, 3878.0, 2506.0, 1663.0, 1100.0, 726.0, 504.0, 304.0, 197.0, 147.0, 103.0, 72.0, 33.0, 32.0, 20.0, 15.0, 12.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-4.2265625, -4.0992431640625, -3.971923828125, -3.8446044921875, -3.71728515625, -3.5899658203125, -3.462646484375, -3.3353271484375, -3.2080078125, -3.0806884765625, -2.953369140625, -2.8260498046875, -2.69873046875, -2.5714111328125, -2.444091796875, -2.3167724609375, -2.189453125, -2.0621337890625, -1.934814453125, -1.8074951171875, -1.68017578125, -1.5528564453125, -1.425537109375, -1.2982177734375, -1.1708984375, -1.0435791015625, -0.916259765625, -0.7889404296875, -0.66162109375, -0.5343017578125, -0.406982421875, -0.2796630859375, -0.15234375, -0.0250244140625, 0.102294921875, 0.2296142578125, 0.35693359375, 0.4842529296875, 0.611572265625, 0.7388916015625, 0.8662109375, 0.9935302734375, 1.120849609375, 1.2481689453125, 1.37548828125, 1.5028076171875, 1.630126953125, 1.7574462890625, 1.884765625, 2.0120849609375, 2.139404296875, 2.2667236328125, 2.39404296875, 2.5213623046875, 2.648681640625, 2.7760009765625, 2.9033203125, 3.0306396484375, 3.157958984375, 3.2852783203125, 3.41259765625, 3.5399169921875, 3.667236328125, 3.7945556640625, 3.921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 3.0, 7.0, 6.0, 11.0, 18.0, 25.0, 18.0, 30.0, 34.0, 30.0, 31.0, 30.0, 34.0, 39.0, 38.0, 46.0, 54.0, 47.0, 1065.0, 51.0, 43.0, 30.0, 42.0, 35.0, 31.0, 36.0, 28.0, 26.0, 25.0, 15.0, 13.0, 18.0, 12.0, 14.0, 13.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.4447021484375, -9.108154296875, -8.7716064453125, -8.43505859375, -8.0985107421875, -7.761962890625, -7.4254150390625, -7.0888671875, -6.7523193359375, -6.415771484375, -6.0792236328125, -5.74267578125, -5.4061279296875, -5.069580078125, -4.7330322265625, -4.396484375, -4.0599365234375, -3.723388671875, -3.3868408203125, -3.05029296875, -2.7137451171875, -2.377197265625, -2.0406494140625, -1.7041015625, -1.3675537109375, -1.031005859375, -0.6944580078125, -0.35791015625, -0.0213623046875, 0.315185546875, 0.6517333984375, 0.98828125, 1.3248291015625, 1.661376953125, 1.9979248046875, 2.33447265625, 2.6710205078125, 3.007568359375, 3.3441162109375, 3.6806640625, 4.0172119140625, 4.353759765625, 4.6903076171875, 5.02685546875, 5.3634033203125, 5.699951171875, 6.0364990234375, 6.373046875, 6.7095947265625, 7.046142578125, 7.3826904296875, 7.71923828125, 8.0557861328125, 8.392333984375, 8.7288818359375, 9.0654296875, 9.4019775390625, 9.738525390625, 10.0750732421875, 10.41162109375, 10.7481689453125, 11.084716796875, 11.4212646484375, 11.7578125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 15.0, 10.0, 22.0, 31.0, 47.0, 63.0, 89.0, 141.0, 189.0, 292.0, 462.0, 711.0, 1107.0, 1759.0, 2871.0, 4554.0, 7655.0, 13142.0, 23020.0, 39891.0, 70284.0, 135541.0, 1416211.0, 178609.0, 85807.0, 47583.0, 27498.0, 15706.0, 9398.0, 5488.0, 3235.0, 1977.0, 1264.0, 841.0, 542.0, 335.0, 249.0, 149.0, 109.0, 71.0, 43.0, 32.0, 20.0, 21.0, 15.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.62890625, -4.4871826171875, -4.345458984375, -4.2037353515625, -4.06201171875, -3.9202880859375, -3.778564453125, -3.6368408203125, -3.4951171875, -3.3533935546875, -3.211669921875, -3.0699462890625, -2.92822265625, -2.7864990234375, -2.644775390625, -2.5030517578125, -2.361328125, -2.2196044921875, -2.077880859375, -1.9361572265625, -1.79443359375, -1.6527099609375, -1.510986328125, -1.3692626953125, -1.2275390625, -1.0858154296875, -0.944091796875, -0.8023681640625, -0.66064453125, -0.5189208984375, -0.377197265625, -0.2354736328125, -0.09375, 0.0479736328125, 0.189697265625, 0.3314208984375, 0.47314453125, 0.6148681640625, 0.756591796875, 0.8983154296875, 1.0400390625, 1.1817626953125, 1.323486328125, 1.4652099609375, 1.60693359375, 1.7486572265625, 1.890380859375, 2.0321044921875, 2.173828125, 2.3155517578125, 2.457275390625, 2.5989990234375, 2.74072265625, 2.8824462890625, 3.024169921875, 3.1658935546875, 3.3076171875, 3.4493408203125, 3.591064453125, 3.7327880859375, 3.87451171875, 4.0162353515625, 4.157958984375, 4.2996826171875, 4.44140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 7.0, 4.0, 7.0, 5.0, 14.0, 9.0, 13.0, 26.0, 26.0, 37.0, 62.0, 68.0, 82.0, 95.0, 98.0, 94.0, 84.0, 71.0, 47.0, 30.0, 25.0, 23.0, 15.0, 12.0, 9.0, 5.0, 7.0, 3.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004192352294921875, -0.004073500633239746, -0.003954648971557617, -0.0038357973098754883, -0.0037169456481933594, -0.0035980939865112305, -0.0034792423248291016, -0.0033603906631469727, -0.0032415390014648438, -0.003122687339782715, -0.003003835678100586, -0.002884984016418457, -0.002766132354736328, -0.0026472806930541992, -0.0025284290313720703, -0.0024095773696899414, -0.0022907257080078125, -0.0021718740463256836, -0.0020530223846435547, -0.0019341707229614258, -0.0018153190612792969, -0.001696467399597168, -0.001577615737915039, -0.0014587640762329102, -0.0013399124145507812, -0.0012210607528686523, -0.0011022090911865234, -0.0009833574295043945, -0.0008645057678222656, -0.0007456541061401367, -0.0006268024444580078, -0.0005079507827758789, -0.00038909912109375, -0.0002702474594116211, -0.0001513957977294922, -3.254413604736328e-05, 8.630752563476562e-05, 0.00020515918731689453, 0.00032401084899902344, 0.00044286251068115234, 0.0005617141723632812, 0.0006805658340454102, 0.0007994174957275391, 0.000918269157409668, 0.0010371208190917969, 0.0011559724807739258, 0.0012748241424560547, 0.0013936758041381836, 0.0015125274658203125, 0.0016313791275024414, 0.0017502307891845703, 0.0018690824508666992, 0.001987934112548828, 0.002106785774230957, 0.002225637435913086, 0.002344489097595215, 0.0024633407592773438, 0.0025821924209594727, 0.0027010440826416016, 0.0028198957443237305, 0.0029387474060058594, 0.0030575990676879883, 0.003176450729370117, 0.003295302391052246, 0.003414154052734375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 4.0, 7.0, 5.0, 6.0, 7.0, 9.0, 16.0, 11.0, 33.0, 24.0, 53.0, 79.0, 144.0, 384.0, 15334.0, 1031234.0, 698.0, 198.0, 98.0, 72.0, 27.0, 24.0, 12.0, 19.0, 13.0, 7.0, 8.0, 3.0, 4.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0911865234375, -0.08806228637695312, -0.08493804931640625, -0.08181381225585938, -0.0786895751953125, -0.07556533813476562, -0.07244110107421875, -0.06931686401367188, -0.066192626953125, -0.06306838989257812, -0.05994415283203125, -0.056819915771484375, -0.0536956787109375, -0.050571441650390625, -0.04744720458984375, -0.044322967529296875, -0.04119873046875, -0.038074493408203125, -0.03495025634765625, -0.031826019287109375, -0.0287017822265625, -0.025577545166015625, -0.02245330810546875, -0.019329071044921875, -0.016204833984375, -0.013080596923828125, -0.00995635986328125, -0.006832122802734375, -0.0037078857421875, -0.000583648681640625, 0.00254058837890625, 0.005664825439453125, 0.0087890625, 0.011913299560546875, 0.01503753662109375, 0.018161773681640625, 0.0212860107421875, 0.024410247802734375, 0.02753448486328125, 0.030658721923828125, 0.033782958984375, 0.036907196044921875, 0.04003143310546875, 0.043155670166015625, 0.0462799072265625, 0.049404144287109375, 0.05252838134765625, 0.055652618408203125, 0.05877685546875, 0.061901092529296875, 0.06502532958984375, 0.06814956665039062, 0.0712738037109375, 0.07439804077148438, 0.07752227783203125, 0.08064651489257812, 0.083770751953125, 0.08689498901367188, 0.09001922607421875, 0.09314346313476562, 0.0962677001953125, 0.09939193725585938, 0.10251617431640625, 0.10564041137695312, 0.1087646484375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 15.0, 44.0, 150.0, 290.0, 283.0, 152.0, 57.0, 14.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014886975986883044, -0.00138950499240309, -0.0012903125025331974, -0.001191119896247983, -0.0010919272899627686, -0.0009927346836775541, -0.0008935421356000006, -0.0007943495875224471, -0.0006951569812372327, -0.0005959643749520183, -0.0004967718268744648, -0.0003975792496930808, -0.0002983866725116968, -0.0001991940662264824, -0.00010000151814892888, -8.0897007137537e-07, 9.838363621383905e-05, 0.00019757621339522302, 0.000296768790576607, 0.00039596136775799096, 0.0004951539449393749, 0.0005943465512245893, 0.0006935390993021429, 0.0007927316473796964, 0.0008919242536649108, 0.0009911168599501252, 0.0010903093498200178, 0.0011895019561052322, 0.0012886945623904467, 0.001387887168675661, 0.0014870797749608755, 0.001586272264830768, 0.0016854647547006607, 0.0017846573609858751, 0.0018838499672710896, 0.001983042573556304, 0.0020822351798415184, 0.002181427553296089, 0.0022806201595813036, 0.002379812765866518, 0.0024790053721517324, 0.002578197978436947, 0.0026773905847221613, 0.0027765831910073757, 0.0028757755644619465, 0.0029749684035778046, 0.0030741607770323753, 0.0031733533833175898, 0.003272545989602804, 0.0033717385958880186, 0.003470931202173233, 0.0035701238084584475, 0.003669316414743662, 0.0037685087881982327, 0.003867701394483447, 0.0039668940007686615, 0.004066086374223232, 0.004165278747677803, 0.004264471586793661, 0.004363663960248232, 0.00446285679936409, 0.004562049172818661, 0.004661242011934519, 0.00476043438538909, 0.004859627224504948]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 9.0, 7.0, 4.0, 10.0, 17.0, 17.0, 18.0, 17.0, 20.0, 28.0, 24.0, 32.0, 44.0, 42.0, 52.0, 48.0, 56.0, 53.0, 53.0, 34.0, 50.0, 37.0, 34.0, 35.0, 38.0, 40.0, 31.0, 27.0, 32.0, 24.0, 17.0, 10.0, 12.0, 8.0, 10.0, 4.0, 4.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002004861831665039, -0.0019477512687444687, -0.0018906407058238983, -0.001833530142903328, -0.0017764195799827576, -0.0017193090170621872, -0.0016621984541416168, -0.0016050878912210464, -0.001547977328300476, -0.0014908667653799057, -0.0014337562024593353, -0.001376645639538765, -0.0013195350766181946, -0.0012624245136976242, -0.0012053139507770538, -0.0011482033878564835, -0.001091092824935913, -0.0010339822620153427, -0.0009768716990947723, -0.000919761136174202, -0.0008626505732536316, -0.0008055400103330612, -0.0007484294474124908, -0.0006913188844919205, -0.0006342083215713501, -0.0005770977586507797, -0.0005199871957302094, -0.000462876632809639, -0.0004057660698890686, -0.00034865550696849823, -0.00029154494404792786, -0.00023443438112735748, -0.0001773238182067871, -0.00012021325528621674, -6.310269236564636e-05, -5.992129445075989e-06, 5.1118433475494385e-05, 0.00010822899639606476, 0.00016533955931663513, 0.0002224501222372055, 0.0002795606851577759, 0.00033667124807834625, 0.0003937818109989166, 0.000450892373919487, 0.0005080029368400574, 0.0005651134997606277, 0.0006222240626811981, 0.0006793346256017685, 0.0007364451885223389, 0.0007935557514429092, 0.0008506663143634796, 0.00090777687728405, 0.0009648874402046204, 0.0010219980031251907, 0.001079108566045761, 0.0011362191289663315, 0.0011933296918869019, 0.0012504402548074722, 0.0013075508177280426, 0.001364661380648613, 0.0014217719435691833, 0.0014788825064897537, 0.001535993069410324, 0.0015931036323308945, 0.0016502141952514648]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 15.0, 9.0, 9.0, 10.0, 12.0, 17.0, 15.0, 19.0, 23.0, 31.0, 26.0, 44.0, 28.0, 37.0, 43.0, 39.0, 45.0, 46.0, 51.0, 48.0, 42.0, 38.0, 45.0, 23.0, 33.0, 33.0, 35.0, 22.0, 29.0, 21.0, 15.0, 11.0, 16.0, 9.0, 8.0, 14.0, 9.0, 6.0, 4.0, 0.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.90625, -14.418212890625, -13.93017578125, -13.442138671875, -12.9541015625, -12.466064453125, -11.97802734375, -11.489990234375, -11.001953125, -10.513916015625, -10.02587890625, -9.537841796875, -9.0498046875, -8.561767578125, -8.07373046875, -7.585693359375, -7.09765625, -6.609619140625, -6.12158203125, -5.633544921875, -5.1455078125, -4.657470703125, -4.16943359375, -3.681396484375, -3.193359375, -2.705322265625, -2.21728515625, -1.729248046875, -1.2412109375, -0.753173828125, -0.26513671875, 0.222900390625, 0.7109375, 1.198974609375, 1.68701171875, 2.175048828125, 2.6630859375, 3.151123046875, 3.63916015625, 4.127197265625, 4.615234375, 5.103271484375, 5.59130859375, 6.079345703125, 6.5673828125, 7.055419921875, 7.54345703125, 8.031494140625, 8.51953125, 9.007568359375, 9.49560546875, 9.983642578125, 10.4716796875, 10.959716796875, 11.44775390625, 11.935791015625, 12.423828125, 12.911865234375, 13.39990234375, 13.887939453125, 14.3759765625, 14.864013671875, 15.35205078125, 15.840087890625, 16.328125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 7.0, 4.0, 13.0, 8.0, 16.0, 26.0, 29.0, 31.0, 53.0, 49.0, 82.0, 103.0, 167.0, 240.0, 329.0, 545.0, 874.0, 1595.0, 3206.0, 6429.0, 14336.0, 32704.0, 78675.0, 206743.0, 381966.0, 190225.0, 73252.0, 30206.0, 13580.0, 6192.0, 2920.0, 1522.0, 842.0, 484.0, 319.0, 191.0, 161.0, 99.0, 77.0, 63.0, 46.0, 48.0, 23.0, 22.0, 14.0, 14.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-9.40625, -9.116455078125, -8.82666015625, -8.536865234375, -8.2470703125, -7.957275390625, -7.66748046875, -7.377685546875, -7.087890625, -6.798095703125, -6.50830078125, -6.218505859375, -5.9287109375, -5.638916015625, -5.34912109375, -5.059326171875, -4.76953125, -4.479736328125, -4.18994140625, -3.900146484375, -3.6103515625, -3.320556640625, -3.03076171875, -2.740966796875, -2.451171875, -2.161376953125, -1.87158203125, -1.581787109375, -1.2919921875, -1.002197265625, -0.71240234375, -0.422607421875, -0.1328125, 0.156982421875, 0.44677734375, 0.736572265625, 1.0263671875, 1.316162109375, 1.60595703125, 1.895751953125, 2.185546875, 2.475341796875, 2.76513671875, 3.054931640625, 3.3447265625, 3.634521484375, 3.92431640625, 4.214111328125, 4.50390625, 4.793701171875, 5.08349609375, 5.373291015625, 5.6630859375, 5.952880859375, 6.24267578125, 6.532470703125, 6.822265625, 7.112060546875, 7.40185546875, 7.691650390625, 7.9814453125, 8.271240234375, 8.56103515625, 8.850830078125, 9.140625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 11.0, 4.0, 5.0, 8.0, 8.0, 14.0, 9.0, 15.0, 21.0, 21.0, 16.0, 25.0, 26.0, 43.0, 30.0, 52.0, 47.0, 71.0, 169.0, 1834.0, 168.0, 68.0, 60.0, 49.0, 41.0, 42.0, 29.0, 30.0, 25.0, 22.0, 16.0, 19.0, 8.0, 11.0, 9.0, 4.0, 11.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-69.3125, -67.30224609375, -65.2919921875, -63.28173828125, -61.271484375, -59.26123046875, -57.2509765625, -55.24072265625, -53.23046875, -51.22021484375, -49.2099609375, -47.19970703125, -45.189453125, -43.17919921875, -41.1689453125, -39.15869140625, -37.1484375, -35.13818359375, -33.1279296875, -31.11767578125, -29.107421875, -27.09716796875, -25.0869140625, -23.07666015625, -21.06640625, -19.05615234375, -17.0458984375, -15.03564453125, -13.025390625, -11.01513671875, -9.0048828125, -6.99462890625, -4.984375, -2.97412109375, -0.9638671875, 1.04638671875, 3.056640625, 5.06689453125, 7.0771484375, 9.08740234375, 11.09765625, 13.10791015625, 15.1181640625, 17.12841796875, 19.138671875, 21.14892578125, 23.1591796875, 25.16943359375, 27.1796875, 29.18994140625, 31.2001953125, 33.21044921875, 35.220703125, 37.23095703125, 39.2412109375, 41.25146484375, 43.26171875, 45.27197265625, 47.2822265625, 49.29248046875, 51.302734375, 53.31298828125, 55.3232421875, 57.33349609375, 59.34375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 8.0, 6.0, 9.0, 15.0, 10.0, 24.0, 21.0, 34.0, 50.0, 67.0, 72.0, 124.0, 149.0, 223.0, 343.0, 763.0, 6555.0, 3124616.0, 10632.0, 825.0, 316.0, 234.0, 135.0, 124.0, 84.0, 52.0, 43.0, 53.0, 28.0, 16.0, 15.0, 12.0, 10.0, 5.0, 7.0, 7.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.0, -129.46484375, -124.9296875, -120.39453125, -115.859375, -111.32421875, -106.7890625, -102.25390625, -97.71875, -93.18359375, -88.6484375, -84.11328125, -79.578125, -75.04296875, -70.5078125, -65.97265625, -61.4375, -56.90234375, -52.3671875, -47.83203125, -43.296875, -38.76171875, -34.2265625, -29.69140625, -25.15625, -20.62109375, -16.0859375, -11.55078125, -7.015625, -2.48046875, 2.0546875, 6.58984375, 11.125, 15.66015625, 20.1953125, 24.73046875, 29.265625, 33.80078125, 38.3359375, 42.87109375, 47.40625, 51.94140625, 56.4765625, 61.01171875, 65.546875, 70.08203125, 74.6171875, 79.15234375, 83.6875, 88.22265625, 92.7578125, 97.29296875, 101.828125, 106.36328125, 110.8984375, 115.43359375, 119.96875, 124.50390625, 129.0390625, 133.57421875, 138.109375, 142.64453125, 147.1796875, 151.71484375, 156.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 70.0, 627.0, 306.0, 13.0], "bins": [-517.095458984375, -508.717041015625, -500.3386535644531, -491.9602355957031, -483.58184814453125, -475.20343017578125, -466.82501220703125, -458.4466247558594, -450.0682067871094, -441.6897888183594, -433.3114013671875, -424.9329833984375, -416.5545959472656, -408.1761779785156, -399.79779052734375, -391.41937255859375, -383.04095458984375, -374.66253662109375, -366.2841491699219, -357.9057312011719, -349.52734375, -341.14892578125, -332.7705078125, -324.3921203613281, -316.01373291015625, -307.63531494140625, -299.2569274902344, -290.8785095214844, -282.5001220703125, -274.1217041015625, -265.7432861328125, -257.3648986816406, -248.98648071289062, -240.6080780029297, -232.22967529296875, -223.85125732421875, -215.4728546142578, -207.09445190429688, -198.71604919433594, -190.337646484375, -181.95924377441406, -173.58084106445312, -165.2024383544922, -156.82403564453125, -148.44561767578125, -140.0672149658203, -131.68881225585938, -123.31040954589844, -114.93199920654297, -106.55359649658203, -98.17518615722656, -89.79678344726562, -81.41838073730469, -73.03997039794922, -64.66156768798828, -56.28316116333008, -47.904754638671875, -39.52634811401367, -31.1479434967041, -22.76953887939453, -14.391132354736328, -6.012725830078125, 2.3656768798828125, 10.744083404541016, 19.12249183654785]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 10.0, 5.0, 8.0, 13.0, 23.0, 18.0, 23.0, 24.0, 19.0, 35.0, 39.0, 35.0, 41.0, 33.0, 38.0, 36.0, 41.0, 45.0, 46.0, 51.0, 39.0, 36.0, 35.0, 38.0, 35.0, 31.0, 26.0, 22.0, 26.0, 25.0, 25.0, 12.0, 10.0, 7.0, 6.0, 9.0, 5.0, 5.0, 4.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-132.5778045654297, -128.24562072753906, -123.91343688964844, -119.58125305175781, -115.24906921386719, -110.91688537597656, -106.58470916748047, -102.25252532958984, -97.92034149169922, -93.5881576538086, -89.25597381591797, -84.92378997802734, -80.59161376953125, -76.25942993164062, -71.92724609375, -67.59506225585938, -63.26287841796875, -58.930694580078125, -54.5985107421875, -50.26633071899414, -45.934146881103516, -41.60196304321289, -37.26978302001953, -32.937599182128906, -28.60541534423828, -24.273231506347656, -19.941049575805664, -15.608866691589355, -11.276683807373047, -6.944499969482422, -2.6123180389404297, 1.7198638916015625, 6.05206298828125, 10.384245872497559, 14.716428756713867, 19.04861068725586, 23.380794525146484, 27.71297836303711, 32.04515838623047, 36.377342224121094, 40.70952606201172, 45.041709899902344, 49.37389373779297, 53.70607376098633, 58.03825759887695, 62.37044143676758, 66.70262145996094, 71.03480529785156, 75.36698913574219, 79.69917297363281, 84.03135681152344, 88.36354064941406, 92.69572448730469, 97.02790832519531, 101.3600845336914, 105.69226837158203, 110.02445220947266, 114.35663604736328, 118.6888198852539, 123.02100372314453, 127.35317993164062, 131.68536376953125, 136.01754760742188, 140.3497314453125, 144.68191528320312]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 10.0, 9.0, 12.0, 14.0, 15.0, 12.0, 24.0, 19.0, 19.0, 25.0, 36.0, 48.0, 30.0, 37.0, 39.0, 47.0, 52.0, 44.0, 45.0, 51.0, 43.0, 36.0, 29.0, 25.0, 37.0, 29.0, 41.0, 25.0, 21.0, 15.0, 12.0, 13.0, 17.0, 7.0, 10.0, 6.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.9453125, -14.4464111328125, -13.947509765625, -13.4486083984375, -12.94970703125, -12.4508056640625, -11.951904296875, -11.4530029296875, -10.9541015625, -10.4552001953125, -9.956298828125, -9.4573974609375, -8.95849609375, -8.4595947265625, -7.960693359375, -7.4617919921875, -6.962890625, -6.4639892578125, -5.965087890625, -5.4661865234375, -4.96728515625, -4.4683837890625, -3.969482421875, -3.4705810546875, -2.9716796875, -2.4727783203125, -1.973876953125, -1.4749755859375, -0.97607421875, -0.4771728515625, 0.021728515625, 0.5206298828125, 1.01953125, 1.5184326171875, 2.017333984375, 2.5162353515625, 3.01513671875, 3.5140380859375, 4.012939453125, 4.5118408203125, 5.0107421875, 5.5096435546875, 6.008544921875, 6.5074462890625, 7.00634765625, 7.5052490234375, 8.004150390625, 8.5030517578125, 9.001953125, 9.5008544921875, 9.999755859375, 10.4986572265625, 10.99755859375, 11.4964599609375, 11.995361328125, 12.4942626953125, 12.9931640625, 13.4920654296875, 13.990966796875, 14.4898681640625, 14.98876953125, 15.4876708984375, 15.986572265625, 16.4854736328125, 16.984375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 13.0, 8.0, 7.0, 19.0, 11.0, 23.0, 18.0, 25.0, 41.0, 47.0, 68.0, 96.0, 119.0, 215.0, 406.0, 1984.0, 45676.0, 2981823.0, 1150101.0, 11590.0, 1040.0, 297.0, 173.0, 104.0, 93.0, 69.0, 32.0, 30.0, 29.0, 19.0, 13.0, 16.0, 16.0, 16.0, 5.0, 6.0, 5.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.125, -58.236328125, -56.34765625, -54.458984375, -52.5703125, -50.681640625, -48.79296875, -46.904296875, -45.015625, -43.126953125, -41.23828125, -39.349609375, -37.4609375, -35.572265625, -33.68359375, -31.794921875, -29.90625, -28.017578125, -26.12890625, -24.240234375, -22.3515625, -20.462890625, -18.57421875, -16.685546875, -14.796875, -12.908203125, -11.01953125, -9.130859375, -7.2421875, -5.353515625, -3.46484375, -1.576171875, 0.3125, 2.201171875, 4.08984375, 5.978515625, 7.8671875, 9.755859375, 11.64453125, 13.533203125, 15.421875, 17.310546875, 19.19921875, 21.087890625, 22.9765625, 24.865234375, 26.75390625, 28.642578125, 30.53125, 32.419921875, 34.30859375, 36.197265625, 38.0859375, 39.974609375, 41.86328125, 43.751953125, 45.640625, 47.529296875, 49.41796875, 51.306640625, 53.1953125, 55.083984375, 56.97265625, 58.861328125, 60.75]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 12.0, 14.0, 22.0, 33.0, 36.0, 65.0, 72.0, 155.0, 211.0, 351.0, 522.0, 713.0, 642.0, 423.0, 299.0, 182.0, 92.0, 89.0, 50.0, 41.0, 15.0, 17.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-65.0, -63.513671875, -62.02734375, -60.541015625, -59.0546875, -57.568359375, -56.08203125, -54.595703125, -53.109375, -51.623046875, -50.13671875, -48.650390625, -47.1640625, -45.677734375, -44.19140625, -42.705078125, -41.21875, -39.732421875, -38.24609375, -36.759765625, -35.2734375, -33.787109375, -32.30078125, -30.814453125, -29.328125, -27.841796875, -26.35546875, -24.869140625, -23.3828125, -21.896484375, -20.41015625, -18.923828125, -17.4375, -15.951171875, -14.46484375, -12.978515625, -11.4921875, -10.005859375, -8.51953125, -7.033203125, -5.546875, -4.060546875, -2.57421875, -1.087890625, 0.3984375, 1.884765625, 3.37109375, 4.857421875, 6.34375, 7.830078125, 9.31640625, 10.802734375, 12.2890625, 13.775390625, 15.26171875, 16.748046875, 18.234375, 19.720703125, 21.20703125, 22.693359375, 24.1796875, 25.666015625, 27.15234375, 28.638671875, 30.125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 14.0, 17.0, 19.0, 24.0, 35.0, 54.0, 58.0, 106.0, 116.0, 173.0, 333.0, 572.0, 2030.0, 3920979.0, 267178.0, 1218.0, 467.0, 233.0, 164.0, 110.0, 81.0, 64.0, 49.0, 33.0, 32.0, 25.0, 11.0, 11.0, 6.0, 15.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 3.0], "bins": [-279.0, -272.171875, -265.34375, -258.515625, -251.6875, -244.859375, -238.03125, -231.203125, -224.375, -217.546875, -210.71875, -203.890625, -197.0625, -190.234375, -183.40625, -176.578125, -169.75, -162.921875, -156.09375, -149.265625, -142.4375, -135.609375, -128.78125, -121.953125, -115.125, -108.296875, -101.46875, -94.640625, -87.8125, -80.984375, -74.15625, -67.328125, -60.5, -53.671875, -46.84375, -40.015625, -33.1875, -26.359375, -19.53125, -12.703125, -5.875, 0.953125, 7.78125, 14.609375, 21.4375, 28.265625, 35.09375, 41.921875, 48.75, 55.578125, 62.40625, 69.234375, 76.0625, 82.890625, 89.71875, 96.546875, 103.375, 110.203125, 117.03125, 123.859375, 130.6875, 137.515625, 144.34375, 151.171875, 158.0]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 31.0, 199.0, 419.0, 288.0, 58.0, 11.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-489.2817687988281, -476.271240234375, -463.2607421875, -450.250244140625, -437.2397155761719, -424.22918701171875, -411.21868896484375, -398.20819091796875, -385.1976623535156, -372.1871337890625, -359.1766357421875, -346.1661376953125, -333.1556091308594, -320.14508056640625, -307.13458251953125, -294.12408447265625, -281.1135559082031, -268.10302734375, -255.092529296875, -242.08201599121094, -229.07150268554688, -216.0609893798828, -203.05047607421875, -190.0399627685547, -177.02944946289062, -164.01893615722656, -151.0084228515625, -137.99790954589844, -124.98739624023438, -111.97688293457031, -98.96636962890625, -85.95585632324219, -72.94534301757812, -59.93482971191406, -46.92431640625, -33.91380310058594, -20.903289794921875, -7.8927764892578125, 5.11773681640625, 18.128250122070312, 31.138763427734375, 44.14927673339844, 57.1597900390625, 70.17030334472656, 83.18081665039062, 96.19132995605469, 109.20184326171875, 122.21235656738281, 135.22286987304688, 148.23338317871094, 161.243896484375, 174.25440979003906, 187.26492309570312, 200.2754364013672, 213.28594970703125, 226.2964630126953, 239.30697631835938, 252.31748962402344, 265.3280029296875, 278.3385009765625, 291.3490295410156, 304.35955810546875, 317.37005615234375, 330.38055419921875, 343.3910827636719]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 12.0, 18.0, 15.0, 21.0, 27.0, 29.0, 21.0, 28.0, 32.0, 27.0, 35.0, 33.0, 38.0, 43.0, 46.0, 29.0, 47.0, 47.0, 38.0, 37.0, 45.0, 45.0, 39.0, 36.0, 35.0, 26.0, 23.0, 12.0, 11.0, 18.0, 17.0, 13.0, 7.0, 6.0, 9.0, 9.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.12477111816406, -88.68219757080078, -85.2396240234375, -81.79704284667969, -78.3544692993164, -74.91189575195312, -71.46932220458984, -68.02674865722656, -64.58416748046875, -61.14159393310547, -57.69901657104492, -54.25644302368164, -50.813865661621094, -47.37129211425781, -43.92871856689453, -40.486141204833984, -37.0435676574707, -33.60099411010742, -30.158416748046875, -26.715843200683594, -23.273265838623047, -19.830692291259766, -16.38811683654785, -12.945541381835938, -9.502965927124023, -6.060390472412109, -2.6178154945373535, 0.8247594833374023, 4.267334938049316, 7.709909439086914, 11.152484893798828, 14.595060348510742, 18.037635803222656, 21.48021125793457, 24.922786712646484, 28.365360260009766, 31.807937622070312, 35.250511169433594, 38.693084716796875, 42.13566207885742, 45.57823944091797, 49.02081298828125, 52.4633903503418, 55.90596389770508, 59.348541259765625, 62.791114807128906, 66.23368835449219, 69.67626953125, 73.11883544921875, 76.56140899658203, 80.00398254394531, 83.44656372070312, 86.8891372680664, 90.33171081542969, 93.77428436279297, 97.21685791015625, 100.65943908691406, 104.10201263427734, 107.54458618164062, 110.98716735839844, 114.42974090576172, 117.872314453125, 121.31488800048828, 124.75746154785156, 128.20004272460938]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 9.0, 8.0, 14.0, 15.0, 23.0, 18.0, 33.0, 26.0, 28.0, 24.0, 36.0, 40.0, 40.0, 37.0, 53.0, 53.0, 36.0, 43.0, 50.0, 46.0, 42.0, 39.0, 28.0, 32.0, 30.0, 26.0, 23.0, 17.0, 20.0, 21.0, 11.0, 13.0, 15.0, 7.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8515625, -15.3348388671875, -14.818115234375, -14.3013916015625, -13.78466796875, -13.2679443359375, -12.751220703125, -12.2344970703125, -11.7177734375, -11.2010498046875, -10.684326171875, -10.1676025390625, -9.65087890625, -9.1341552734375, -8.617431640625, -8.1007080078125, -7.583984375, -7.0672607421875, -6.550537109375, -6.0338134765625, -5.51708984375, -5.0003662109375, -4.483642578125, -3.9669189453125, -3.4501953125, -2.9334716796875, -2.416748046875, -1.9000244140625, -1.38330078125, -0.8665771484375, -0.349853515625, 0.1668701171875, 0.68359375, 1.2003173828125, 1.717041015625, 2.2337646484375, 2.75048828125, 3.2672119140625, 3.783935546875, 4.3006591796875, 4.8173828125, 5.3341064453125, 5.850830078125, 6.3675537109375, 6.88427734375, 7.4010009765625, 7.917724609375, 8.4344482421875, 8.951171875, 9.4678955078125, 9.984619140625, 10.5013427734375, 11.01806640625, 11.5347900390625, 12.051513671875, 12.5682373046875, 13.0849609375, 13.6016845703125, 14.118408203125, 14.6351318359375, 15.15185546875, 15.6685791015625, 16.185302734375, 16.7020263671875, 17.21875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 9.0, 13.0, 13.0, 32.0, 43.0, 62.0, 95.0, 146.0, 214.0, 288.0, 479.0, 744.0, 1129.0, 1672.0, 2691.0, 4318.0, 6871.0, 10942.0, 17784.0, 28606.0, 47689.0, 84211.0, 180722.0, 344264.0, 138925.0, 69838.0, 40948.0, 24735.0, 15200.0, 9537.0, 5882.0, 3719.0, 2367.0, 1526.0, 931.0, 680.0, 416.0, 251.0, 173.0, 132.0, 86.0, 59.0, 34.0, 23.0, 14.0, 13.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3984375, -4.26654052734375, -4.1346435546875, -4.00274658203125, -3.870849609375, -3.73895263671875, -3.6070556640625, -3.47515869140625, -3.34326171875, -3.21136474609375, -3.0794677734375, -2.94757080078125, -2.815673828125, -2.68377685546875, -2.5518798828125, -2.41998291015625, -2.2880859375, -2.15618896484375, -2.0242919921875, -1.89239501953125, -1.760498046875, -1.62860107421875, -1.4967041015625, -1.36480712890625, -1.23291015625, -1.10101318359375, -0.9691162109375, -0.83721923828125, -0.705322265625, -0.57342529296875, -0.4415283203125, -0.30963134765625, -0.177734375, -0.04583740234375, 0.0860595703125, 0.21795654296875, 0.349853515625, 0.48175048828125, 0.6136474609375, 0.74554443359375, 0.87744140625, 1.00933837890625, 1.1412353515625, 1.27313232421875, 1.405029296875, 1.53692626953125, 1.6688232421875, 1.80072021484375, 1.9326171875, 2.06451416015625, 2.1964111328125, 2.32830810546875, 2.460205078125, 2.59210205078125, 2.7239990234375, 2.85589599609375, 2.98779296875, 3.11968994140625, 3.2515869140625, 3.38348388671875, 3.515380859375, 3.64727783203125, 3.7791748046875, 3.91107177734375, 4.04296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 11.0, 10.0, 14.0, 7.0, 9.0, 19.0, 15.0, 31.0, 23.0, 20.0, 30.0, 40.0, 42.0, 45.0, 37.0, 40.0, 47.0, 49.0, 1066.0, 56.0, 38.0, 40.0, 40.0, 33.0, 37.0, 30.0, 17.0, 21.0, 20.0, 29.0, 20.0, 16.0, 9.0, 7.0, 16.0, 8.0, 6.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-11.078125, -10.7464599609375, -10.414794921875, -10.0831298828125, -9.75146484375, -9.4197998046875, -9.088134765625, -8.7564697265625, -8.4248046875, -8.0931396484375, -7.761474609375, -7.4298095703125, -7.09814453125, -6.7664794921875, -6.434814453125, -6.1031494140625, -5.771484375, -5.4398193359375, -5.108154296875, -4.7764892578125, -4.44482421875, -4.1131591796875, -3.781494140625, -3.4498291015625, -3.1181640625, -2.7864990234375, -2.454833984375, -2.1231689453125, -1.79150390625, -1.4598388671875, -1.128173828125, -0.7965087890625, -0.46484375, -0.1331787109375, 0.198486328125, 0.5301513671875, 0.86181640625, 1.1934814453125, 1.525146484375, 1.8568115234375, 2.1884765625, 2.5201416015625, 2.851806640625, 3.1834716796875, 3.51513671875, 3.8468017578125, 4.178466796875, 4.5101318359375, 4.841796875, 5.1734619140625, 5.505126953125, 5.8367919921875, 6.16845703125, 6.5001220703125, 6.831787109375, 7.1634521484375, 7.4951171875, 7.8267822265625, 8.158447265625, 8.4901123046875, 8.82177734375, 9.1534423828125, 9.485107421875, 9.8167724609375, 10.1484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 14.0, 9.0, 17.0, 30.0, 36.0, 61.0, 64.0, 133.0, 167.0, 249.0, 347.0, 514.0, 750.0, 1208.0, 1710.0, 2711.0, 4382.0, 6835.0, 10828.0, 17618.0, 28566.0, 48447.0, 86724.0, 179335.0, 1403240.0, 130883.0, 68922.0, 39309.0, 23889.0, 14794.0, 9037.0, 5829.0, 3658.0, 2244.0, 1537.0, 1005.0, 659.0, 428.0, 294.0, 218.0, 129.0, 87.0, 65.0, 48.0, 42.0, 13.0, 18.0, 11.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.16796875, -4.03485107421875, -3.9017333984375, -3.76861572265625, -3.635498046875, -3.50238037109375, -3.3692626953125, -3.23614501953125, -3.10302734375, -2.96990966796875, -2.8367919921875, -2.70367431640625, -2.570556640625, -2.43743896484375, -2.3043212890625, -2.17120361328125, -2.0380859375, -1.90496826171875, -1.7718505859375, -1.63873291015625, -1.505615234375, -1.37249755859375, -1.2393798828125, -1.10626220703125, -0.97314453125, -0.84002685546875, -0.7069091796875, -0.57379150390625, -0.440673828125, -0.30755615234375, -0.1744384765625, -0.04132080078125, 0.091796875, 0.22491455078125, 0.3580322265625, 0.49114990234375, 0.624267578125, 0.75738525390625, 0.8905029296875, 1.02362060546875, 1.15673828125, 1.28985595703125, 1.4229736328125, 1.55609130859375, 1.689208984375, 1.82232666015625, 1.9554443359375, 2.08856201171875, 2.2216796875, 2.35479736328125, 2.4879150390625, 2.62103271484375, 2.754150390625, 2.88726806640625, 3.0203857421875, 3.15350341796875, 3.28662109375, 3.41973876953125, 3.5528564453125, 3.68597412109375, 3.819091796875, 3.95220947265625, 4.0853271484375, 4.21844482421875, 4.3515625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 19.0, 13.0, 10.0, 22.0, 29.0, 52.0, 49.0, 77.0, 94.0, 116.0, 130.0, 89.0, 73.0, 62.0, 38.0, 27.0, 18.0, 18.0, 11.0, 7.0, 10.0, 8.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004779815673828125, -0.004643619060516357, -0.00450742244720459, -0.004371225833892822, -0.004235029220581055, -0.004098832607269287, -0.0039626359939575195, -0.003826439380645752, -0.0036902427673339844, -0.003554046154022217, -0.0034178495407104492, -0.0032816529273986816, -0.003145456314086914, -0.0030092597007751465, -0.002873063087463379, -0.0027368664741516113, -0.0026006698608398438, -0.002464473247528076, -0.0023282766342163086, -0.002192080020904541, -0.0020558834075927734, -0.0019196867942810059, -0.0017834901809692383, -0.0016472935676574707, -0.0015110969543457031, -0.0013749003410339355, -0.001238703727722168, -0.0011025071144104004, -0.0009663105010986328, -0.0008301138877868652, -0.0006939172744750977, -0.0005577206611633301, -0.0004215240478515625, -0.0002853274345397949, -0.00014913082122802734, -1.2934207916259766e-05, 0.0001232624053955078, 0.0002594590187072754, 0.00039565563201904297, 0.0005318522453308105, 0.0006680488586425781, 0.0008042454719543457, 0.0009404420852661133, 0.0010766386985778809, 0.0012128353118896484, 0.001349031925201416, 0.0014852285385131836, 0.0016214251518249512, 0.0017576217651367188, 0.0018938183784484863, 0.002030014991760254, 0.0021662116050720215, 0.002302408218383789, 0.0024386048316955566, 0.0025748014450073242, 0.002710998058319092, 0.0028471946716308594, 0.002983391284942627, 0.0031195878982543945, 0.003255784511566162, 0.0033919811248779297, 0.0035281777381896973, 0.003664374351501465, 0.0038005709648132324, 0.003936767578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 4.0, 3.0, 8.0, 11.0, 18.0, 17.0, 20.0, 31.0, 43.0, 89.0, 157.0, 531.0, 14029.0, 1031960.0, 1036.0, 263.0, 103.0, 66.0, 45.0, 28.0, 14.0, 17.0, 16.0, 11.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.09177780151367188, -0.08852386474609375, -0.08526992797851562, -0.0820159912109375, -0.07876205444335938, -0.07550811767578125, -0.07225418090820312, -0.069000244140625, -0.06574630737304688, -0.06249237060546875, -0.059238433837890625, -0.0559844970703125, -0.052730560302734375, -0.04947662353515625, -0.046222686767578125, -0.04296875, -0.039714813232421875, -0.03646087646484375, -0.033206939697265625, -0.0299530029296875, -0.026699066162109375, -0.02344512939453125, -0.020191192626953125, -0.016937255859375, -0.013683319091796875, -0.01042938232421875, -0.007175445556640625, -0.0039215087890625, -0.000667572021484375, 0.00258636474609375, 0.005840301513671875, 0.00909423828125, 0.012348175048828125, 0.01560211181640625, 0.018856048583984375, 0.0221099853515625, 0.025363922119140625, 0.02861785888671875, 0.031871795654296875, 0.035125732421875, 0.038379669189453125, 0.04163360595703125, 0.044887542724609375, 0.0481414794921875, 0.051395416259765625, 0.05464935302734375, 0.057903289794921875, 0.0611572265625, 0.06441116333007812, 0.06766510009765625, 0.07091903686523438, 0.0741729736328125, 0.07742691040039062, 0.08068084716796875, 0.08393478393554688, 0.087188720703125, 0.09044265747070312, 0.09369659423828125, 0.09695053100585938, 0.1002044677734375, 0.10345840454101562, 0.10671234130859375, 0.10996627807617188, 0.11322021484375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 73.0, 520.0, 370.0, 40.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011303099803626537, -0.011080803349614143, -0.010858507826924324, -0.01063621137291193, -0.010413914918899536, -0.010191619396209717, -0.009969322942197323, -0.009747026488184929, -0.009524730034172535, -0.009302433580160141, -0.009080138057470322, -0.008857841603457928, -0.008635545149445534, -0.008413249626755714, -0.00819095317274332, -0.007968656718730927, -0.007746361196041107, -0.0075240652076900005, -0.007301768753677607, -0.0070794727653265, -0.006857176311314106, -0.006634880322962999, -0.006412584334611893, -0.006190287880599499, -0.005967991426587105, -0.005745695438235998, -0.005523398984223604, -0.0053011029958724976, -0.005078806541860104, -0.004856510553508997, -0.00463421456515789, -0.004411918111145496, -0.00418962212279439, -0.003967326134443283, -0.003745029680430889, -0.0035227336920797825, -0.003300437470898032, -0.003078141249716282, -0.0028558450285345316, -0.0026335488073527813, -0.0024112528190016747, -0.0021889565978199244, -0.001966660376638174, -0.0017443642718717456, -0.0015220681671053171, -0.0012997719459235668, -0.0010774757247418165, -0.000855179619975388, -0.0006328832823783159, -0.00041058711940422654, -0.0001882909273263067, 3.400526475161314e-05, 0.0002563014277257025, 0.0004785975906997919, 0.0007008938118815422, 0.0009231899166479707, 0.001145486137829721, 0.0013677823590114713, 0.0015900784637778997, 0.00181237468495965, 0.0020346709061414003, 0.0022569671273231506, 0.0024792631156742573, 0.0027015593368560076, 0.002923855558037758]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 11.0, 11.0, 13.0, 11.0, 26.0, 19.0, 19.0, 23.0, 25.0, 27.0, 37.0, 41.0, 28.0, 35.0, 39.0, 44.0, 33.0, 45.0, 28.0, 30.0, 41.0, 47.0, 36.0, 36.0, 25.0, 35.0, 37.0, 28.0, 28.0, 18.0, 7.0, 18.0, 12.0, 11.0, 16.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.001584470272064209, -0.0015379618853330612, -0.0014914534986019135, -0.0014449451118707657, -0.001398436725139618, -0.0013519283384084702, -0.0013054199516773224, -0.0012589115649461746, -0.0012124031782150269, -0.001165894791483879, -0.0011193864047527313, -0.0010728780180215836, -0.0010263696312904358, -0.000979861244559288, -0.0009333528578281403, -0.0008868444710969925, -0.0008403360843658447, -0.000793827697634697, -0.0007473193109035492, -0.0007008109241724014, -0.0006543025374412537, -0.0006077941507101059, -0.0005612857639789581, -0.0005147773772478104, -0.0004682689905166626, -0.00042176060378551483, -0.00037525221705436707, -0.0003287438303232193, -0.00028223544359207153, -0.00023572705686092377, -0.000189218670129776, -0.00014271028339862823, -9.620189666748047e-05, -4.96935099363327e-05, -3.1851232051849365e-06, 4.332326352596283e-05, 8.98316502571106e-05, 0.00013634003698825836, 0.00018284842371940613, 0.0002293568104505539, 0.00027586519718170166, 0.0003223735839128494, 0.0003688819706439972, 0.00041539035737514496, 0.0004618987441062927, 0.0005084071308374405, 0.0005549155175685883, 0.000601423904299736, 0.0006479322910308838, 0.0006944406777620316, 0.0007409490644931793, 0.0007874574512243271, 0.0008339658379554749, 0.0008804742246866226, 0.0009269826114177704, 0.0009734909981489182, 0.001019999384880066, 0.0010665077716112137, 0.0011130161583423615, 0.0011595245450735092, 0.001206032931804657, 0.0012525413185358047, 0.0012990497052669525, 0.0013455580919981003, 0.001392066478729248]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 9.0, 8.0, 14.0, 15.0, 23.0, 18.0, 33.0, 26.0, 28.0, 24.0, 36.0, 40.0, 40.0, 37.0, 53.0, 53.0, 36.0, 43.0, 50.0, 46.0, 42.0, 39.0, 28.0, 32.0, 30.0, 26.0, 23.0, 17.0, 20.0, 21.0, 11.0, 13.0, 15.0, 7.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8515625, -15.3348388671875, -14.818115234375, -14.3013916015625, -13.78466796875, -13.2679443359375, -12.751220703125, -12.2344970703125, -11.7177734375, -11.2010498046875, -10.684326171875, -10.1676025390625, -9.65087890625, -9.1341552734375, -8.617431640625, -8.1007080078125, -7.583984375, -7.0672607421875, -6.550537109375, -6.0338134765625, -5.51708984375, -5.0003662109375, -4.483642578125, -3.9669189453125, -3.4501953125, -2.9334716796875, -2.416748046875, -1.9000244140625, -1.38330078125, -0.8665771484375, -0.349853515625, 0.1668701171875, 0.68359375, 1.2003173828125, 1.717041015625, 2.2337646484375, 2.75048828125, 3.2672119140625, 3.783935546875, 4.3006591796875, 4.8173828125, 5.3341064453125, 5.850830078125, 6.3675537109375, 6.88427734375, 7.4010009765625, 7.917724609375, 8.4344482421875, 8.951171875, 9.4678955078125, 9.984619140625, 10.5013427734375, 11.01806640625, 11.5347900390625, 12.051513671875, 12.5682373046875, 13.0849609375, 13.6016845703125, 14.118408203125, 14.6351318359375, 15.15185546875, 15.6685791015625, 16.185302734375, 16.7020263671875, 17.21875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 5.0, 16.0, 9.0, 15.0, 24.0, 25.0, 31.0, 39.0, 53.0, 99.0, 77.0, 122.0, 139.0, 205.0, 301.0, 423.0, 514.0, 861.0, 1222.0, 2130.0, 4097.0, 10464.0, 38078.0, 180315.0, 608176.0, 149570.0, 32554.0, 9265.0, 3708.0, 2055.0, 1173.0, 759.0, 501.0, 362.0, 267.0, 230.0, 152.0, 115.0, 88.0, 73.0, 65.0, 40.0, 33.0, 29.0, 19.0, 17.0, 8.0, 13.0, 4.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0], "bins": [-18.296875, -17.73291015625, -17.1689453125, -16.60498046875, -16.041015625, -15.47705078125, -14.9130859375, -14.34912109375, -13.78515625, -13.22119140625, -12.6572265625, -12.09326171875, -11.529296875, -10.96533203125, -10.4013671875, -9.83740234375, -9.2734375, -8.70947265625, -8.1455078125, -7.58154296875, -7.017578125, -6.45361328125, -5.8896484375, -5.32568359375, -4.76171875, -4.19775390625, -3.6337890625, -3.06982421875, -2.505859375, -1.94189453125, -1.3779296875, -0.81396484375, -0.25, 0.31396484375, 0.8779296875, 1.44189453125, 2.005859375, 2.56982421875, 3.1337890625, 3.69775390625, 4.26171875, 4.82568359375, 5.3896484375, 5.95361328125, 6.517578125, 7.08154296875, 7.6455078125, 8.20947265625, 8.7734375, 9.33740234375, 9.9013671875, 10.46533203125, 11.029296875, 11.59326171875, 12.1572265625, 12.72119140625, 13.28515625, 13.84912109375, 14.4130859375, 14.97705078125, 15.541015625, 16.10498046875, 16.6689453125, 17.23291015625, 17.796875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 16.0, 11.0, 13.0, 9.0, 18.0, 13.0, 23.0, 21.0, 48.0, 30.0, 47.0, 48.0, 40.0, 65.0, 81.0, 295.0, 1695.0, 110.0, 75.0, 48.0, 47.0, 41.0, 42.0, 40.0, 28.0, 27.0, 17.0, 18.0, 16.0, 7.0, 10.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-58.40625, -56.5908203125, -54.775390625, -52.9599609375, -51.14453125, -49.3291015625, -47.513671875, -45.6982421875, -43.8828125, -42.0673828125, -40.251953125, -38.4365234375, -36.62109375, -34.8056640625, -32.990234375, -31.1748046875, -29.359375, -27.5439453125, -25.728515625, -23.9130859375, -22.09765625, -20.2822265625, -18.466796875, -16.6513671875, -14.8359375, -13.0205078125, -11.205078125, -9.3896484375, -7.57421875, -5.7587890625, -3.943359375, -2.1279296875, -0.3125, 1.5029296875, 3.318359375, 5.1337890625, 6.94921875, 8.7646484375, 10.580078125, 12.3955078125, 14.2109375, 16.0263671875, 17.841796875, 19.6572265625, 21.47265625, 23.2880859375, 25.103515625, 26.9189453125, 28.734375, 30.5498046875, 32.365234375, 34.1806640625, 35.99609375, 37.8115234375, 39.626953125, 41.4423828125, 43.2578125, 45.0732421875, 46.888671875, 48.7041015625, 50.51953125, 52.3349609375, 54.150390625, 55.9658203125, 57.78125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 7.0, 10.0, 6.0, 18.0, 17.0, 22.0, 33.0, 39.0, 45.0, 74.0, 112.0, 148.0, 234.0, 295.0, 573.0, 3732.0, 3027274.0, 110263.0, 1397.0, 468.0, 271.0, 167.0, 125.0, 105.0, 58.0, 44.0, 44.0, 32.0, 19.0, 22.0, 11.0, 11.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.0, -126.453125, -121.90625, -117.359375, -112.8125, -108.265625, -103.71875, -99.171875, -94.625, -90.078125, -85.53125, -80.984375, -76.4375, -71.890625, -67.34375, -62.796875, -58.25, -53.703125, -49.15625, -44.609375, -40.0625, -35.515625, -30.96875, -26.421875, -21.875, -17.328125, -12.78125, -8.234375, -3.6875, 0.859375, 5.40625, 9.953125, 14.5, 19.046875, 23.59375, 28.140625, 32.6875, 37.234375, 41.78125, 46.328125, 50.875, 55.421875, 59.96875, 64.515625, 69.0625, 73.609375, 78.15625, 82.703125, 87.25, 91.796875, 96.34375, 100.890625, 105.4375, 109.984375, 114.53125, 119.078125, 123.625, 128.171875, 132.71875, 137.265625, 141.8125, 146.359375, 150.90625, 155.453125, 160.0]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 398.0, 613.0, 6.0, 0.0, 0.0, 1.0], "bins": [-1236.9010009765625, -1215.95068359375, -1195.000244140625, -1174.0499267578125, -1153.0994873046875, -1132.149169921875, -1111.19873046875, -1090.2484130859375, -1069.298095703125, -1048.3477783203125, -1027.3973388671875, -1006.4469604492188, -985.49658203125, -964.5462646484375, -943.5958862304688, -922.6455078125, -901.695068359375, -880.7446899414062, -859.7943115234375, -838.8439331054688, -817.8935546875, -796.9432373046875, -775.9928588867188, -755.04248046875, -734.0921020507812, -713.1417236328125, -692.1913452148438, -671.240966796875, -650.2906494140625, -629.3402709960938, -608.389892578125, -587.4395141601562, -566.4891357421875, -545.5387573242188, -524.58837890625, -503.6380310058594, -482.6876525878906, -461.7372741699219, -440.78692626953125, -419.8365478515625, -398.88616943359375, -377.935791015625, -356.98541259765625, -336.0350646972656, -315.0846862792969, -294.1343078613281, -273.1839599609375, -252.23358154296875, -231.283203125, -210.33282470703125, -189.38246154785156, -168.43209838867188, -147.48171997070312, -126.5313491821289, -105.58097839355469, -84.630615234375, -63.68024444580078, -42.72987365722656, -21.779502868652344, -0.829132080078125, 20.121238708496094, 41.07160949707031, 62.02198028564453, 82.97234344482422, 103.92272186279297]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 9.0, 9.0, 5.0, 9.0, 9.0, 9.0, 10.0, 22.0, 14.0, 14.0, 16.0, 34.0, 34.0, 26.0, 26.0, 32.0, 27.0, 39.0, 42.0, 27.0, 38.0, 47.0, 50.0, 42.0, 47.0, 41.0, 39.0, 31.0, 31.0, 25.0, 33.0, 26.0, 19.0, 21.0, 13.0, 11.0, 15.0, 11.0, 7.0, 8.0, 8.0, 8.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.30242919921875, -123.76303100585938, -119.2236328125, -114.68423461914062, -110.14483642578125, -105.60543823242188, -101.06603240966797, -96.5266342163086, -91.98723602294922, -87.44783782958984, -82.90843963623047, -78.3690414428711, -73.82963562011719, -69.29023742675781, -64.75083923339844, -60.21144104003906, -55.67204284667969, -51.13264465332031, -46.59324645996094, -42.0538444519043, -37.51444625854492, -32.97504806518555, -28.43564796447754, -23.89624786376953, -19.356849670410156, -14.817450523376465, -10.278051376342773, -5.738652229309082, -1.1992530822753906, 3.3401451110839844, 7.879545211791992, 12.4189453125, 16.958343505859375, 21.49774169921875, 26.037141799926758, 30.576541900634766, 35.11594009399414, 39.655338287353516, 44.194740295410156, 48.73413848876953, 53.273536682128906, 57.81293487548828, 62.352333068847656, 66.89173126220703, 71.43113708496094, 75.97053527832031, 80.50993347167969, 85.04933166503906, 89.58872985839844, 94.12812805175781, 98.66752624511719, 103.20692443847656, 107.74632263183594, 112.28572082519531, 116.82512664794922, 121.3645248413086, 125.90392303466797, 130.44332885742188, 134.98272705078125, 139.52212524414062, 144.0615234375, 148.60092163085938, 153.14031982421875, 157.67971801757812, 162.2191162109375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 11.0, 14.0, 21.0, 16.0, 22.0, 39.0, 19.0, 30.0, 23.0, 36.0, 36.0, 44.0, 51.0, 50.0, 53.0, 43.0, 43.0, 52.0, 46.0, 33.0, 33.0, 34.0, 33.0, 23.0, 31.0, 18.0, 13.0, 20.0, 24.0, 8.0, 10.0, 9.0, 11.0, 7.0, 5.0, 5.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.427490234375, -16.87060546875, -16.313720703125, -15.7568359375, -15.199951171875, -14.64306640625, -14.086181640625, -13.529296875, -12.972412109375, -12.41552734375, -11.858642578125, -11.3017578125, -10.744873046875, -10.18798828125, -9.631103515625, -9.07421875, -8.517333984375, -7.96044921875, -7.403564453125, -6.8466796875, -6.289794921875, -5.73291015625, -5.176025390625, -4.619140625, -4.062255859375, -3.50537109375, -2.948486328125, -2.3916015625, -1.834716796875, -1.27783203125, -0.720947265625, -0.1640625, 0.392822265625, 0.94970703125, 1.506591796875, 2.0634765625, 2.620361328125, 3.17724609375, 3.734130859375, 4.291015625, 4.847900390625, 5.40478515625, 5.961669921875, 6.5185546875, 7.075439453125, 7.63232421875, 8.189208984375, 8.74609375, 9.302978515625, 9.85986328125, 10.416748046875, 10.9736328125, 11.530517578125, 12.08740234375, 12.644287109375, 13.201171875, 13.758056640625, 14.31494140625, 14.871826171875, 15.4287109375, 15.985595703125, 16.54248046875, 17.099365234375, 17.65625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 5.0, 4.0, 11.0, 13.0, 9.0, 13.0, 21.0, 28.0, 16.0, 26.0, 35.0, 30.0, 45.0, 71.0, 150.0, 437.0, 1722.0, 44159.0, 3235107.0, 903832.0, 7037.0, 833.0, 260.0, 93.0, 53.0, 37.0, 32.0, 25.0, 25.0, 24.0, 30.0, 11.0, 15.0, 13.0, 6.0, 8.0, 11.0, 11.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.8125, -62.7734375, -60.734375, -58.6953125, -56.65625, -54.6171875, -52.578125, -50.5390625, -48.5, -46.4609375, -44.421875, -42.3828125, -40.34375, -38.3046875, -36.265625, -34.2265625, -32.1875, -30.1484375, -28.109375, -26.0703125, -24.03125, -21.9921875, -19.953125, -17.9140625, -15.875, -13.8359375, -11.796875, -9.7578125, -7.71875, -5.6796875, -3.640625, -1.6015625, 0.4375, 2.4765625, 4.515625, 6.5546875, 8.59375, 10.6328125, 12.671875, 14.7109375, 16.75, 18.7890625, 20.828125, 22.8671875, 24.90625, 26.9453125, 28.984375, 31.0234375, 33.0625, 35.1015625, 37.140625, 39.1796875, 41.21875, 43.2578125, 45.296875, 47.3359375, 49.375, 51.4140625, 53.453125, 55.4921875, 57.53125, 59.5703125, 61.609375, 63.6484375, 65.6875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 12.0, 8.0, 19.0, 20.0, 18.0, 27.0, 42.0, 52.0, 70.0, 96.0, 105.0, 148.0, 185.0, 253.0, 336.0, 471.0, 461.0, 424.0, 342.0, 253.0, 197.0, 111.0, 108.0, 70.0, 46.0, 52.0, 39.0, 29.0, 20.0, 8.0, 7.0, 5.0, 5.0, 6.0, 0.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.6875, -34.70751953125, -33.7275390625, -32.74755859375, -31.767578125, -30.78759765625, -29.8076171875, -28.82763671875, -27.84765625, -26.86767578125, -25.8876953125, -24.90771484375, -23.927734375, -22.94775390625, -21.9677734375, -20.98779296875, -20.0078125, -19.02783203125, -18.0478515625, -17.06787109375, -16.087890625, -15.10791015625, -14.1279296875, -13.14794921875, -12.16796875, -11.18798828125, -10.2080078125, -9.22802734375, -8.248046875, -7.26806640625, -6.2880859375, -5.30810546875, -4.328125, -3.34814453125, -2.3681640625, -1.38818359375, -0.408203125, 0.57177734375, 1.5517578125, 2.53173828125, 3.51171875, 4.49169921875, 5.4716796875, 6.45166015625, 7.431640625, 8.41162109375, 9.3916015625, 10.37158203125, 11.3515625, 12.33154296875, 13.3115234375, 14.29150390625, 15.271484375, 16.25146484375, 17.2314453125, 18.21142578125, 19.19140625, 20.17138671875, 21.1513671875, 22.13134765625, 23.111328125, 24.09130859375, 25.0712890625, 26.05126953125, 27.03125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 7.0, 8.0, 6.0, 8.0, 12.0, 9.0, 19.0, 18.0, 37.0, 25.0, 58.0, 61.0, 68.0, 95.0, 136.0, 163.0, 234.0, 346.0, 654.0, 3251.0, 3983905.0, 202040.0, 1245.0, 530.0, 308.0, 222.0, 171.0, 123.0, 104.0, 75.0, 71.0, 69.0, 35.0, 39.0, 23.0, 23.0, 16.0, 15.0, 12.0, 13.0, 8.0, 5.0, 6.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.25, -171.677734375, -166.10546875, -160.533203125, -154.9609375, -149.388671875, -143.81640625, -138.244140625, -132.671875, -127.099609375, -121.52734375, -115.955078125, -110.3828125, -104.810546875, -99.23828125, -93.666015625, -88.09375, -82.521484375, -76.94921875, -71.376953125, -65.8046875, -60.232421875, -54.66015625, -49.087890625, -43.515625, -37.943359375, -32.37109375, -26.798828125, -21.2265625, -15.654296875, -10.08203125, -4.509765625, 1.0625, 6.634765625, 12.20703125, 17.779296875, 23.3515625, 28.923828125, 34.49609375, 40.068359375, 45.640625, 51.212890625, 56.78515625, 62.357421875, 67.9296875, 73.501953125, 79.07421875, 84.646484375, 90.21875, 95.791015625, 101.36328125, 106.935546875, 112.5078125, 118.080078125, 123.65234375, 129.224609375, 134.796875, 140.369140625, 145.94140625, 151.513671875, 157.0859375, 162.658203125, 168.23046875, 173.802734375, 179.375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 51.0, 221.0, 416.0, 259.0, 53.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-536.2328491210938, -523.927001953125, -511.62115478515625, -499.3153076171875, -487.00946044921875, -474.70361328125, -462.39776611328125, -450.0919189453125, -437.78607177734375, -425.480224609375, -413.17437744140625, -400.8685302734375, -388.56268310546875, -376.2568359375, -363.95098876953125, -351.6451416015625, -339.3392639160156, -327.0334167480469, -314.7275695800781, -302.4217224121094, -290.1158752441406, -277.8100280761719, -265.504150390625, -253.1983184814453, -240.89247131347656, -228.5866241455078, -216.28077697753906, -203.97491455078125, -191.6690673828125, -179.36322021484375, -167.057373046875, -154.75152587890625, -142.44569396972656, -130.1398468017578, -117.83399963378906, -105.52814483642578, -93.22229766845703, -80.91645050048828, -68.610595703125, -56.30474853515625, -43.9989013671875, -31.693052291870117, -19.387203216552734, -7.081352233886719, 5.224494934082031, 17.53034210205078, 29.836196899414062, 42.14204406738281, 54.44789123535156, 66.75373840332031, 79.05958557128906, 91.36544036865234, 103.6712875366211, 115.97713470458984, 128.28298950195312, 140.58883666992188, 152.89468383789062, 165.20053100585938, 177.50637817382812, 189.81222534179688, 202.11807250976562, 214.42391967773438, 226.7297821044922, 239.03562927246094, 251.3414764404297]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 8.0, 11.0, 5.0, 12.0, 6.0, 20.0, 21.0, 22.0, 17.0, 26.0, 23.0, 27.0, 29.0, 35.0, 27.0, 38.0, 44.0, 45.0, 38.0, 34.0, 41.0, 42.0, 39.0, 49.0, 32.0, 31.0, 30.0, 28.0, 17.0, 24.0, 22.0, 20.0, 20.0, 20.0, 16.0, 13.0, 14.0, 14.0, 6.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.926025390625, -97.48374938964844, -94.04146575927734, -90.59918212890625, -87.15690612792969, -83.71463012695312, -80.27234649658203, -76.83006286621094, -73.38778686523438, -69.94551086425781, -66.50322723388672, -63.06094741821289, -59.61866760253906, -56.176387786865234, -52.734107971191406, -49.29182815551758, -45.84954833984375, -42.40726852416992, -38.964988708496094, -35.522708892822266, -32.08042907714844, -28.63814926147461, -25.19586944580078, -21.753589630126953, -18.311309814453125, -14.869029998779297, -11.426750183105469, -7.984470367431641, -4.5421905517578125, -1.0999107360839844, 2.3423690795898438, 5.784648895263672, 9.2269287109375, 12.669208526611328, 16.111488342285156, 19.553768157958984, 22.996047973632812, 26.43832778930664, 29.88060760498047, 33.3228874206543, 36.765167236328125, 40.20744705200195, 43.64972686767578, 47.09200668334961, 50.53428649902344, 53.976566314697266, 57.418846130371094, 60.86112594604492, 64.30340576171875, 67.74568176269531, 71.1879653930664, 74.6302490234375, 78.07252502441406, 81.51480102539062, 84.95708465576172, 88.39936828613281, 91.84164428710938, 95.28392028808594, 98.72620391845703, 102.16848754882812, 105.61076354980469, 109.05303955078125, 112.49532318115234, 115.93760681152344, 119.3798828125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 2.0, 8.0, 6.0, 12.0, 9.0, 16.0, 18.0, 24.0, 29.0, 27.0, 21.0, 40.0, 36.0, 37.0, 44.0, 46.0, 42.0, 49.0, 46.0, 61.0, 41.0, 49.0, 43.0, 44.0, 36.0, 31.0, 25.0, 25.0, 14.0, 20.0, 20.0, 16.0, 12.0, 9.0, 9.0, 13.0, 8.0, 3.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -16.973388671875, -16.39990234375, -15.826416015625, -15.2529296875, -14.679443359375, -14.10595703125, -13.532470703125, -12.958984375, -12.385498046875, -11.81201171875, -11.238525390625, -10.6650390625, -10.091552734375, -9.51806640625, -8.944580078125, -8.37109375, -7.797607421875, -7.22412109375, -6.650634765625, -6.0771484375, -5.503662109375, -4.93017578125, -4.356689453125, -3.783203125, -3.209716796875, -2.63623046875, -2.062744140625, -1.4892578125, -0.915771484375, -0.34228515625, 0.231201171875, 0.8046875, 1.378173828125, 1.95166015625, 2.525146484375, 3.0986328125, 3.672119140625, 4.24560546875, 4.819091796875, 5.392578125, 5.966064453125, 6.53955078125, 7.113037109375, 7.6865234375, 8.260009765625, 8.83349609375, 9.406982421875, 9.98046875, 10.553955078125, 11.12744140625, 11.700927734375, 12.2744140625, 12.847900390625, 13.42138671875, 13.994873046875, 14.568359375, 15.141845703125, 15.71533203125, 16.288818359375, 16.8623046875, 17.435791015625, 18.00927734375, 18.582763671875, 19.15625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 12.0, 7.0, 20.0, 40.0, 42.0, 64.0, 91.0, 115.0, 204.0, 306.0, 472.0, 789.0, 1185.0, 1781.0, 2784.0, 4402.0, 7007.0, 11102.0, 17870.0, 29197.0, 49149.0, 89515.0, 192983.0, 346503.0, 127581.0, 66668.0, 37803.0, 22685.0, 13696.0, 8781.0, 5653.0, 3530.0, 2235.0, 1519.0, 925.0, 642.0, 401.0, 276.0, 169.0, 102.0, 81.0, 45.0, 42.0, 34.0, 24.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.68359375, -4.53839111328125, -4.3931884765625, -4.24798583984375, -4.102783203125, -3.95758056640625, -3.8123779296875, -3.66717529296875, -3.52197265625, -3.37677001953125, -3.2315673828125, -3.08636474609375, -2.941162109375, -2.79595947265625, -2.6507568359375, -2.50555419921875, -2.3603515625, -2.21514892578125, -2.0699462890625, -1.92474365234375, -1.779541015625, -1.63433837890625, -1.4891357421875, -1.34393310546875, -1.19873046875, -1.05352783203125, -0.9083251953125, -0.76312255859375, -0.617919921875, -0.47271728515625, -0.3275146484375, -0.18231201171875, -0.037109375, 0.10809326171875, 0.2532958984375, 0.39849853515625, 0.543701171875, 0.68890380859375, 0.8341064453125, 0.97930908203125, 1.12451171875, 1.26971435546875, 1.4149169921875, 1.56011962890625, 1.705322265625, 1.85052490234375, 1.9957275390625, 2.14093017578125, 2.2861328125, 2.43133544921875, 2.5765380859375, 2.72174072265625, 2.866943359375, 3.01214599609375, 3.1573486328125, 3.30255126953125, 3.44775390625, 3.59295654296875, 3.7381591796875, 3.88336181640625, 4.028564453125, 4.17376708984375, 4.3189697265625, 4.46417236328125, 4.609375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 8.0, 7.0, 7.0, 13.0, 10.0, 17.0, 18.0, 23.0, 21.0, 18.0, 28.0, 32.0, 25.0, 25.0, 26.0, 31.0, 37.0, 43.0, 33.0, 49.0, 1060.0, 41.0, 45.0, 55.0, 36.0, 32.0, 26.0, 27.0, 28.0, 36.0, 27.0, 21.0, 26.0, 18.0, 19.0, 13.0, 10.0, 8.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.697509765625, -8.37939453125, -8.061279296875, -7.7431640625, -7.425048828125, -7.10693359375, -6.788818359375, -6.470703125, -6.152587890625, -5.83447265625, -5.516357421875, -5.1982421875, -4.880126953125, -4.56201171875, -4.243896484375, -3.92578125, -3.607666015625, -3.28955078125, -2.971435546875, -2.6533203125, -2.335205078125, -2.01708984375, -1.698974609375, -1.380859375, -1.062744140625, -0.74462890625, -0.426513671875, -0.1083984375, 0.209716796875, 0.52783203125, 0.845947265625, 1.1640625, 1.482177734375, 1.80029296875, 2.118408203125, 2.4365234375, 2.754638671875, 3.07275390625, 3.390869140625, 3.708984375, 4.027099609375, 4.34521484375, 4.663330078125, 4.9814453125, 5.299560546875, 5.61767578125, 5.935791015625, 6.25390625, 6.572021484375, 6.89013671875, 7.208251953125, 7.5263671875, 7.844482421875, 8.16259765625, 8.480712890625, 8.798828125, 9.116943359375, 9.43505859375, 9.753173828125, 10.0712890625, 10.389404296875, 10.70751953125, 11.025634765625, 11.34375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 8.0, 13.0, 23.0, 30.0, 45.0, 81.0, 94.0, 161.0, 225.0, 342.0, 572.0, 831.0, 1298.0, 2067.0, 3418.0, 5564.0, 9153.0, 15357.0, 25215.0, 41814.0, 69509.0, 131420.0, 1397967.0, 178091.0, 85801.0, 50273.0, 30616.0, 18366.0, 11010.0, 6600.0, 4123.0, 2518.0, 1610.0, 998.0, 667.0, 395.0, 289.0, 185.0, 143.0, 83.0, 47.0, 32.0, 26.0, 15.0, 14.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.46875, -4.33203125, -4.1953125, -4.05859375, -3.921875, -3.78515625, -3.6484375, -3.51171875, -3.375, -3.23828125, -3.1015625, -2.96484375, -2.828125, -2.69140625, -2.5546875, -2.41796875, -2.28125, -2.14453125, -2.0078125, -1.87109375, -1.734375, -1.59765625, -1.4609375, -1.32421875, -1.1875, -1.05078125, -0.9140625, -0.77734375, -0.640625, -0.50390625, -0.3671875, -0.23046875, -0.09375, 0.04296875, 0.1796875, 0.31640625, 0.453125, 0.58984375, 0.7265625, 0.86328125, 1.0, 1.13671875, 1.2734375, 1.41015625, 1.546875, 1.68359375, 1.8203125, 1.95703125, 2.09375, 2.23046875, 2.3671875, 2.50390625, 2.640625, 2.77734375, 2.9140625, 3.05078125, 3.1875, 3.32421875, 3.4609375, 3.59765625, 3.734375, 3.87109375, 4.0078125, 4.14453125, 4.28125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 11.0, 4.0, 6.0, 4.0, 15.0, 13.0, 15.0, 20.0, 22.0, 23.0, 17.0, 40.0, 55.0, 66.0, 93.0, 89.0, 81.0, 79.0, 72.0, 53.0, 36.0, 36.0, 25.0, 21.0, 14.0, 10.0, 6.0, 13.0, 8.0, 5.0, 8.0, 1.0, 3.0, 5.0, 0.0, 2.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00283050537109375, -0.002736300230026245, -0.0026420950889587402, -0.0025478899478912354, -0.0024536848068237305, -0.0023594796657562256, -0.0022652745246887207, -0.002171069383621216, -0.002076864242553711, -0.001982659101486206, -0.0018884539604187012, -0.0017942488193511963, -0.0017000436782836914, -0.0016058385372161865, -0.0015116333961486816, -0.0014174282550811768, -0.0013232231140136719, -0.001229017972946167, -0.0011348128318786621, -0.0010406076908111572, -0.0009464025497436523, -0.0008521974086761475, -0.0007579922676086426, -0.0006637871265411377, -0.0005695819854736328, -0.00047537684440612793, -0.00038117170333862305, -0.00028696656227111816, -0.00019276142120361328, -9.85562801361084e-05, -4.351139068603516e-06, 8.985400199890137e-05, 0.00018405914306640625, 0.00027826428413391113, 0.000372469425201416, 0.0004666745662689209, 0.0005608797073364258, 0.0006550848484039307, 0.0007492899894714355, 0.0008434951305389404, 0.0009377002716064453, 0.0010319054126739502, 0.001126110553741455, 0.00122031569480896, 0.0013145208358764648, 0.0014087259769439697, 0.0015029311180114746, 0.0015971362590789795, 0.0016913414001464844, 0.0017855465412139893, 0.0018797516822814941, 0.001973956823348999, 0.002068161964416504, 0.002162367105484009, 0.0022565722465515137, 0.0023507773876190186, 0.0024449825286865234, 0.0025391876697540283, 0.002633392810821533, 0.002727597951889038, 0.002821803092956543, 0.002916008234024048, 0.0030102133750915527, 0.0031044185161590576, 0.0031986236572265625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 7.0, 12.0, 12.0, 12.0, 22.0, 32.0, 36.0, 52.0, 90.0, 125.0, 381.0, 2025.0, 1042534.0, 2284.0, 430.0, 156.0, 81.0, 41.0, 31.0, 35.0, 20.0, 28.0, 12.0, 12.0, 8.0, 6.0, 7.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08148193359375, -0.07889652252197266, -0.07631111145019531, -0.07372570037841797, -0.07114028930664062, -0.06855487823486328, -0.06596946716308594, -0.0633840560913086, -0.06079864501953125, -0.058213233947753906, -0.05562782287597656, -0.05304241180419922, -0.050457000732421875, -0.04787158966064453, -0.04528617858886719, -0.042700767517089844, -0.0401153564453125, -0.037529945373535156, -0.03494453430175781, -0.03235912322998047, -0.029773712158203125, -0.02718830108642578, -0.024602890014648438, -0.022017478942871094, -0.01943206787109375, -0.016846656799316406, -0.014261245727539062, -0.011675834655761719, -0.009090423583984375, -0.006505012512207031, -0.0039196014404296875, -0.0013341903686523438, 0.001251220703125, 0.0038366317749023438, 0.0064220428466796875, 0.009007453918457031, 0.011592864990234375, 0.014178276062011719, 0.016763687133789062, 0.019349098205566406, 0.02193450927734375, 0.024519920349121094, 0.027105331420898438, 0.02969074249267578, 0.032276153564453125, 0.03486156463623047, 0.03744697570800781, 0.040032386779785156, 0.0426177978515625, 0.045203208923339844, 0.04778861999511719, 0.05037403106689453, 0.052959442138671875, 0.05554485321044922, 0.05813026428222656, 0.060715675354003906, 0.06330108642578125, 0.0658864974975586, 0.06847190856933594, 0.07105731964111328, 0.07364273071289062, 0.07622814178466797, 0.07881355285644531, 0.08139896392822266, 0.083984375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 29.0, 131.0, 334.0, 358.0, 124.0, 24.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029893768951296806, -0.0028646867722272873, -0.0027399964164942503, -0.002615306293591857, -0.0024906161706894636, -0.0023659258149564266, -0.0022412356920540333, -0.00211654556915164, -0.0019918554462492466, -0.0018671652069315314, -0.001742475084029138, -0.001617784844711423, -0.0014930947218090296, -0.0013684044824913144, -0.0012437142431735992, -0.001119024120271206, -0.000994333764538169, -0.0008696435834281147, -0.0007449534023180604, -0.0006202631630003452, -0.000495572981890291, -0.0003708828007802367, -0.00024619256146252155, -0.0001215023803524673, 3.187800757586956e-06, 0.00012787799641955644, 0.0002525681920815259, 0.00037725840229541063, 0.0005019485834054649, 0.0006266387645155191, 0.0007513290038332343, 0.0008760191849432886, 0.0010007093660533428, 0.001125399605371058, 0.0012500897282734513, 0.0013747799675911665, 0.0014994700904935598, 0.001624160329811275, 0.0017488505691289902, 0.0018735406920313835, 0.001998230814933777, 0.00212292093783617, 0.002247611293569207, 0.0023723014164716005, 0.002496991539373994, 0.002621681895107031, 0.002746372018009424, 0.0028710621409118176, 0.0029957524966448545, 0.003120442619547248, 0.003245132975280285, 0.0033698230981826782, 0.0034945132210850716, 0.003619203343987465, 0.003743893699720502, 0.0038685838226228952, 0.003993274178355932, 0.004117964301258326, 0.004242654424160719, 0.0043673450127244, 0.004492035135626793, 0.004616725258529186, 0.00474141538143158, 0.004866105504333973, 0.004990795627236366]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 1.0, 13.0, 6.0, 10.0, 10.0, 13.0, 21.0, 19.0, 22.0, 21.0, 33.0, 31.0, 23.0, 28.0, 28.0, 31.0, 45.0, 41.0, 31.0, 43.0, 47.0, 40.0, 40.0, 34.0, 40.0, 32.0, 34.0, 35.0, 29.0, 18.0, 24.0, 22.0, 21.0, 13.0, 17.0, 10.0, 9.0, 9.0, 10.0, 6.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0015862584114074707, -0.0015399018302559853, -0.0014935452491044998, -0.0014471886679530144, -0.001400832086801529, -0.0013544755056500435, -0.001308118924498558, -0.0012617623433470726, -0.0012154057621955872, -0.0011690491810441017, -0.0011226925998926163, -0.0010763360187411308, -0.0010299794375896454, -0.00098362285643816, -0.0009372662752866745, -0.0008909096941351891, -0.0008445531129837036, -0.0007981965318322182, -0.0007518399506807327, -0.0007054833695292473, -0.0006591267883777618, -0.0006127702072262764, -0.000566413626074791, -0.0005200570449233055, -0.00047370046377182007, -0.0004273438826203346, -0.0003809873014688492, -0.00033463072031736374, -0.0002882741391658783, -0.00024191755801439285, -0.0001955609768629074, -0.00014920439571142197, -0.00010284781455993652, -5.649123340845108e-05, -1.0134652256965637e-05, 3.6221928894519806e-05, 8.257851004600525e-05, 0.0001289350911974907, 0.00017529167234897614, 0.00022164825350046158, 0.000268004834651947, 0.00031436141580343246, 0.0003607179969549179, 0.00040707457810640335, 0.0004534311592578888, 0.0004997877404093742, 0.0005461443215608597, 0.0005925009027123451, 0.0006388574838638306, 0.000685214065015316, 0.0007315706461668015, 0.0007779272273182869, 0.0008242838084697723, 0.0008706403896212578, 0.0009169969707727432, 0.0009633535519242287, 0.0010097101330757141, 0.0010560667142271996, 0.001102423295378685, 0.0011487798765301704, 0.0011951364576816559, 0.0012414930388331413, 0.0012878496199846268, 0.0013342062011361122, 0.0013805627822875977]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 2.0, 8.0, 6.0, 12.0, 9.0, 16.0, 18.0, 24.0, 29.0, 27.0, 21.0, 40.0, 36.0, 37.0, 44.0, 46.0, 42.0, 49.0, 46.0, 61.0, 41.0, 49.0, 43.0, 44.0, 36.0, 31.0, 25.0, 25.0, 14.0, 20.0, 20.0, 16.0, 12.0, 9.0, 9.0, 13.0, 8.0, 3.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -16.973388671875, -16.39990234375, -15.826416015625, -15.2529296875, -14.679443359375, -14.10595703125, -13.532470703125, -12.958984375, -12.385498046875, -11.81201171875, -11.238525390625, -10.6650390625, -10.091552734375, -9.51806640625, -8.944580078125, -8.37109375, -7.797607421875, -7.22412109375, -6.650634765625, -6.0771484375, -5.503662109375, -4.93017578125, -4.356689453125, -3.783203125, -3.209716796875, -2.63623046875, -2.062744140625, -1.4892578125, -0.915771484375, -0.34228515625, 0.231201171875, 0.8046875, 1.378173828125, 1.95166015625, 2.525146484375, 3.0986328125, 3.672119140625, 4.24560546875, 4.819091796875, 5.392578125, 5.966064453125, 6.53955078125, 7.113037109375, 7.6865234375, 8.260009765625, 8.83349609375, 9.406982421875, 9.98046875, 10.553955078125, 11.12744140625, 11.700927734375, 12.2744140625, 12.847900390625, 13.42138671875, 13.994873046875, 14.568359375, 15.141845703125, 15.71533203125, 16.288818359375, 16.8623046875, 17.435791015625, 18.00927734375, 18.582763671875, 19.15625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 9.0, 8.0, 24.0, 22.0, 29.0, 43.0, 51.0, 67.0, 90.0, 129.0, 168.0, 247.0, 381.0, 515.0, 742.0, 1339.0, 2364.0, 4584.0, 9586.0, 22312.0, 59092.0, 183248.0, 451185.0, 202045.0, 64470.0, 24181.0, 10365.0, 4748.0, 2485.0, 1352.0, 790.0, 569.0, 385.0, 232.0, 185.0, 144.0, 78.0, 86.0, 57.0, 34.0, 30.0, 17.0, 19.0, 9.0, 8.0, 5.0, 4.0, 2.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.015625, -10.6663818359375, -10.317138671875, -9.9678955078125, -9.61865234375, -9.2694091796875, -8.920166015625, -8.5709228515625, -8.2216796875, -7.8724365234375, -7.523193359375, -7.1739501953125, -6.82470703125, -6.4754638671875, -6.126220703125, -5.7769775390625, -5.427734375, -5.0784912109375, -4.729248046875, -4.3800048828125, -4.03076171875, -3.6815185546875, -3.332275390625, -2.9830322265625, -2.6337890625, -2.2845458984375, -1.935302734375, -1.5860595703125, -1.23681640625, -0.8875732421875, -0.538330078125, -0.1890869140625, 0.16015625, 0.5093994140625, 0.858642578125, 1.2078857421875, 1.55712890625, 1.9063720703125, 2.255615234375, 2.6048583984375, 2.9541015625, 3.3033447265625, 3.652587890625, 4.0018310546875, 4.35107421875, 4.7003173828125, 5.049560546875, 5.3988037109375, 5.748046875, 6.0972900390625, 6.446533203125, 6.7957763671875, 7.14501953125, 7.4942626953125, 7.843505859375, 8.1927490234375, 8.5419921875, 8.8912353515625, 9.240478515625, 9.5897216796875, 9.93896484375, 10.2882080078125, 10.637451171875, 10.9866943359375, 11.3359375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 4.0, 10.0, 10.0, 15.0, 11.0, 22.0, 31.0, 29.0, 39.0, 46.0, 38.0, 42.0, 45.0, 57.0, 122.0, 1783.0, 260.0, 69.0, 53.0, 37.0, 47.0, 52.0, 38.0, 31.0, 26.0, 30.0, 20.0, 12.0, 8.0, 14.0, 12.0, 8.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.125, -71.134765625, -69.14453125, -67.154296875, -65.1640625, -63.173828125, -61.18359375, -59.193359375, -57.203125, -55.212890625, -53.22265625, -51.232421875, -49.2421875, -47.251953125, -45.26171875, -43.271484375, -41.28125, -39.291015625, -37.30078125, -35.310546875, -33.3203125, -31.330078125, -29.33984375, -27.349609375, -25.359375, -23.369140625, -21.37890625, -19.388671875, -17.3984375, -15.408203125, -13.41796875, -11.427734375, -9.4375, -7.447265625, -5.45703125, -3.466796875, -1.4765625, 0.513671875, 2.50390625, 4.494140625, 6.484375, 8.474609375, 10.46484375, 12.455078125, 14.4453125, 16.435546875, 18.42578125, 20.416015625, 22.40625, 24.396484375, 26.38671875, 28.376953125, 30.3671875, 32.357421875, 34.34765625, 36.337890625, 38.328125, 40.318359375, 42.30859375, 44.298828125, 46.2890625, 48.279296875, 50.26953125, 52.259765625, 54.25]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 11.0, 17.0, 26.0, 24.0, 34.0, 36.0, 66.0, 68.0, 95.0, 109.0, 180.0, 224.0, 272.0, 494.0, 1649.0, 638044.0, 2500486.0, 2143.0, 504.0, 270.0, 230.0, 160.0, 136.0, 100.0, 65.0, 50.0, 40.0, 28.0, 29.0, 18.0, 19.0, 10.0, 6.0, 12.0, 5.0, 4.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.75, -103.765625, -99.78125, -95.796875, -91.8125, -87.828125, -83.84375, -79.859375, -75.875, -71.890625, -67.90625, -63.921875, -59.9375, -55.953125, -51.96875, -47.984375, -44.0, -40.015625, -36.03125, -32.046875, -28.0625, -24.078125, -20.09375, -16.109375, -12.125, -8.140625, -4.15625, -0.171875, 3.8125, 7.796875, 11.78125, 15.765625, 19.75, 23.734375, 27.71875, 31.703125, 35.6875, 39.671875, 43.65625, 47.640625, 51.625, 55.609375, 59.59375, 63.578125, 67.5625, 71.546875, 75.53125, 79.515625, 83.5, 87.484375, 91.46875, 95.453125, 99.4375, 103.421875, 107.40625, 111.390625, 115.375, 119.359375, 123.34375, 127.328125, 131.3125, 135.296875, 139.28125, 143.265625, 147.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 106.0, 873.0, 37.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.04001998901367, -48.020973205566406, -34.001930236816406, -19.98288345336914, -5.963836669921875, 8.05521011352539, 22.07425308227539, 36.09330368041992, 50.11234664916992, 64.13139343261719, 78.15043640136719, 92.16947937011719, 106.18852996826172, 120.20758056640625, 134.22662353515625, 148.24566650390625, 162.26470947265625, 176.28375244140625, 190.30279541015625, 204.32183837890625, 218.3408966064453, 232.3599395751953, 246.3789825439453, 260.3980407714844, 274.4170837402344, 288.4361267089844, 302.4551696777344, 316.4742126464844, 330.4932556152344, 344.5123291015625, 358.5313720703125, 372.5504150390625, 386.5694274902344, 400.5884704589844, 414.6075134277344, 428.6265563964844, 442.6455993652344, 456.6646728515625, 470.6837158203125, 484.7027587890625, 498.7218017578125, 512.7408447265625, 526.7598876953125, 540.7789306640625, 554.7979736328125, 568.8170166015625, 582.8360595703125, 596.8551025390625, 610.8741455078125, 624.8931884765625, 638.9122314453125, 652.9312744140625, 666.9503173828125, 680.9693603515625, 694.9884033203125, 709.0074462890625, 723.0265502929688, 737.0455932617188, 751.0646362304688, 765.0836791992188, 779.1027221679688, 793.1217651367188, 807.1408081054688, 821.1598510742188, 835.1788940429688]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 6.0, 11.0, 10.0, 13.0, 12.0, 15.0, 16.0, 14.0, 24.0, 11.0, 29.0, 23.0, 21.0, 33.0, 26.0, 46.0, 45.0, 43.0, 36.0, 38.0, 27.0, 45.0, 38.0, 38.0, 41.0, 30.0, 34.0, 32.0, 16.0, 29.0, 22.0, 23.0, 15.0, 15.0, 20.0, 12.0, 16.0, 12.0, 11.0, 9.0, 12.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.94898986816406, -119.81915283203125, -115.68931579589844, -111.55948638916016, -107.42964935302734, -103.29981231689453, -99.16998291015625, -95.04014587402344, -90.91030883789062, -86.78047180175781, -82.650634765625, -78.52080535888672, -74.3909683227539, -70.2611312866211, -66.13130187988281, -62.00146484375, -57.87162780761719, -53.741790771484375, -49.61195755004883, -45.48212432861328, -41.35228729248047, -37.222450256347656, -33.09261703491211, -28.96278190612793, -24.83294677734375, -20.70311164855957, -16.57327651977539, -12.443441390991211, -8.313606262207031, -4.183771133422852, -0.053936004638671875, 4.075899124145508, 8.205718994140625, 12.335554122924805, 16.465389251708984, 20.595224380493164, 24.725059509277344, 28.854894638061523, 32.9847297668457, 37.11456298828125, 41.24440002441406, 45.374237060546875, 49.50407028198242, 53.63390350341797, 57.76374053955078, 61.893577575683594, 66.02340698242188, 70.15324401855469, 74.2830810546875, 78.41291809082031, 82.54275512695312, 86.6725845336914, 90.80242156982422, 94.93225860595703, 99.06208801269531, 103.19192504882812, 107.32176208496094, 111.45159912109375, 115.58143615722656, 119.71126556396484, 123.84110260009766, 127.97093963623047, 132.10076904296875, 136.23060607910156, 140.36044311523438]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 8.0, 9.0, 4.0, 13.0, 14.0, 16.0, 33.0, 27.0, 29.0, 31.0, 32.0, 39.0, 40.0, 38.0, 53.0, 47.0, 35.0, 38.0, 61.0, 51.0, 40.0, 43.0, 41.0, 36.0, 34.0, 16.0, 23.0, 26.0, 20.0, 14.0, 14.0, 12.0, 11.0, 13.0, 7.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.203125, -16.618896484375, -16.03466796875, -15.450439453125, -14.8662109375, -14.281982421875, -13.69775390625, -13.113525390625, -12.529296875, -11.945068359375, -11.36083984375, -10.776611328125, -10.1923828125, -9.608154296875, -9.02392578125, -8.439697265625, -7.85546875, -7.271240234375, -6.68701171875, -6.102783203125, -5.5185546875, -4.934326171875, -4.35009765625, -3.765869140625, -3.181640625, -2.597412109375, -2.01318359375, -1.428955078125, -0.8447265625, -0.260498046875, 0.32373046875, 0.907958984375, 1.4921875, 2.076416015625, 2.66064453125, 3.244873046875, 3.8291015625, 4.413330078125, 4.99755859375, 5.581787109375, 6.166015625, 6.750244140625, 7.33447265625, 7.918701171875, 8.5029296875, 9.087158203125, 9.67138671875, 10.255615234375, 10.83984375, 11.424072265625, 12.00830078125, 12.592529296875, 13.1767578125, 13.760986328125, 14.34521484375, 14.929443359375, 15.513671875, 16.097900390625, 16.68212890625, 17.266357421875, 17.8505859375, 18.434814453125, 19.01904296875, 19.603271484375, 20.1875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 10.0, 9.0, 7.0, 4.0, 18.0, 18.0, 17.0, 14.0, 27.0, 36.0, 35.0, 66.0, 81.0, 125.0, 198.0, 317.0, 1048.0, 6547.0, 150090.0, 2622094.0, 1367827.0, 41266.0, 2936.0, 669.0, 264.0, 148.0, 95.0, 50.0, 62.0, 35.0, 28.0, 21.0, 24.0, 16.0, 5.0, 12.0, 14.0, 7.0, 8.0, 9.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.12353515625, -38.7783203125, -37.43310546875, -36.087890625, -34.74267578125, -33.3974609375, -32.05224609375, -30.70703125, -29.36181640625, -28.0166015625, -26.67138671875, -25.326171875, -23.98095703125, -22.6357421875, -21.29052734375, -19.9453125, -18.60009765625, -17.2548828125, -15.90966796875, -14.564453125, -13.21923828125, -11.8740234375, -10.52880859375, -9.18359375, -7.83837890625, -6.4931640625, -5.14794921875, -3.802734375, -2.45751953125, -1.1123046875, 0.23291015625, 1.578125, 2.92333984375, 4.2685546875, 5.61376953125, 6.958984375, 8.30419921875, 9.6494140625, 10.99462890625, 12.33984375, 13.68505859375, 15.0302734375, 16.37548828125, 17.720703125, 19.06591796875, 20.4111328125, 21.75634765625, 23.1015625, 24.44677734375, 25.7919921875, 27.13720703125, 28.482421875, 29.82763671875, 31.1728515625, 32.51806640625, 33.86328125, 35.20849609375, 36.5537109375, 37.89892578125, 39.244140625, 40.58935546875, 41.9345703125, 43.27978515625, 44.625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 7.0, 9.0, 11.0, 16.0, 38.0, 28.0, 31.0, 42.0, 50.0, 79.0, 85.0, 108.0, 164.0, 206.0, 287.0, 357.0, 429.0, 461.0, 419.0, 314.0, 225.0, 158.0, 117.0, 109.0, 68.0, 52.0, 49.0, 31.0, 34.0, 19.0, 17.0, 10.0, 9.0, 14.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-34.875, -33.9619140625, -33.048828125, -32.1357421875, -31.22265625, -30.3095703125, -29.396484375, -28.4833984375, -27.5703125, -26.6572265625, -25.744140625, -24.8310546875, -23.91796875, -23.0048828125, -22.091796875, -21.1787109375, -20.265625, -19.3525390625, -18.439453125, -17.5263671875, -16.61328125, -15.7001953125, -14.787109375, -13.8740234375, -12.9609375, -12.0478515625, -11.134765625, -10.2216796875, -9.30859375, -8.3955078125, -7.482421875, -6.5693359375, -5.65625, -4.7431640625, -3.830078125, -2.9169921875, -2.00390625, -1.0908203125, -0.177734375, 0.7353515625, 1.6484375, 2.5615234375, 3.474609375, 4.3876953125, 5.30078125, 6.2138671875, 7.126953125, 8.0400390625, 8.953125, 9.8662109375, 10.779296875, 11.6923828125, 12.60546875, 13.5185546875, 14.431640625, 15.3447265625, 16.2578125, 17.1708984375, 18.083984375, 18.9970703125, 19.91015625, 20.8232421875, 21.736328125, 22.6494140625, 23.5625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 6.0, 2.0, 4.0, 2.0, 6.0, 11.0, 12.0, 15.0, 13.0, 12.0, 25.0, 28.0, 44.0, 46.0, 65.0, 77.0, 97.0, 140.0, 183.0, 286.0, 468.0, 1103.0, 496958.0, 3691332.0, 1557.0, 557.0, 301.0, 213.0, 142.0, 119.0, 84.0, 80.0, 64.0, 55.0, 37.0, 26.0, 23.0, 21.0, 13.0, 12.0, 17.0, 8.0, 6.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-205.125, -198.927734375, -192.73046875, -186.533203125, -180.3359375, -174.138671875, -167.94140625, -161.744140625, -155.546875, -149.349609375, -143.15234375, -136.955078125, -130.7578125, -124.560546875, -118.36328125, -112.166015625, -105.96875, -99.771484375, -93.57421875, -87.376953125, -81.1796875, -74.982421875, -68.78515625, -62.587890625, -56.390625, -50.193359375, -43.99609375, -37.798828125, -31.6015625, -25.404296875, -19.20703125, -13.009765625, -6.8125, -0.615234375, 5.58203125, 11.779296875, 17.9765625, 24.173828125, 30.37109375, 36.568359375, 42.765625, 48.962890625, 55.16015625, 61.357421875, 67.5546875, 73.751953125, 79.94921875, 86.146484375, 92.34375, 98.541015625, 104.73828125, 110.935546875, 117.1328125, 123.330078125, 129.52734375, 135.724609375, 141.921875, 148.119140625, 154.31640625, 160.513671875, 166.7109375, 172.908203125, 179.10546875, 185.302734375, 191.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 32.0, 71.0, 141.0, 212.0, 216.0, 184.0, 88.0, 34.0, 14.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.29476928710938, -185.5139617919922, -179.733154296875, -173.9523468017578, -168.17153930664062, -162.3907470703125, -156.6099395751953, -150.82913208007812, -145.04832458496094, -139.26751708984375, -133.48670959472656, -127.7059097290039, -121.92510223388672, -116.14429473876953, -110.36349487304688, -104.58268737792969, -98.8018798828125, -93.02107238769531, -87.24026489257812, -81.45946502685547, -75.67865753173828, -69.8978500366211, -64.11705017089844, -58.33624267578125, -52.55543518066406, -46.774627685546875, -40.99382400512695, -35.21302032470703, -29.432212829589844, -23.65140724182129, -17.870601654052734, -12.089797973632812, -6.308990478515625, -0.5281848907470703, 5.252620697021484, 11.033426284790039, 16.814231872558594, 22.59503746032715, 28.375843048095703, 34.156646728515625, 39.93745422363281, 45.71826171875, 51.49906539916992, 57.279869079589844, 63.06067657470703, 68.84148406982422, 74.62228393554688, 80.40309143066406, 86.18389892578125, 91.96470642089844, 97.74551391601562, 103.52631378173828, 109.30712127685547, 115.08792877197266, 120.86872863769531, 126.6495361328125, 132.4303436279297, 138.21115112304688, 143.99195861816406, 149.77276611328125, 155.55355834960938, 161.33436584472656, 167.11517333984375, 172.89598083496094, 178.67678833007812]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 4.0, 12.0, 13.0, 13.0, 21.0, 10.0, 13.0, 22.0, 17.0, 32.0, 33.0, 50.0, 27.0, 30.0, 42.0, 38.0, 27.0, 39.0, 34.0, 47.0, 40.0, 36.0, 37.0, 40.0, 37.0, 31.0, 22.0, 29.0, 28.0, 19.0, 22.0, 19.0, 23.0, 11.0, 11.0, 14.0, 8.0, 10.0, 5.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-94.91580200195312, -91.8681869506836, -88.82056427001953, -85.77294921875, -82.72532653808594, -79.6777114868164, -76.63009643554688, -73.58247375488281, -70.53485107421875, -67.48723602294922, -64.43961334228516, -61.391998291015625, -58.34437561035156, -55.29676055908203, -52.249141693115234, -49.20152282714844, -46.153907775878906, -43.10628890991211, -40.05867004394531, -37.01105499267578, -33.96343231201172, -30.915815353393555, -27.86819839477539, -24.820579528808594, -21.772960662841797, -18.725341796875, -15.67772388458252, -12.630105972290039, -9.582487106323242, -6.534868240356445, -3.4872512817382812, -0.4396324157714844, 2.6079864501953125, 5.655604839324951, 8.70322322845459, 11.75084114074707, 14.798460006713867, 17.846078872680664, 20.893695831298828, 23.941314697265625, 26.988933563232422, 30.03655242919922, 33.084171295166016, 36.13179016113281, 39.179405212402344, 42.227027893066406, 45.27464294433594, 48.322261810302734, 51.36988067626953, 54.41749954223633, 57.465118408203125, 60.512733459472656, 63.56035614013672, 66.60797119140625, 69.65559387207031, 72.70320892333984, 75.75082397460938, 78.7984390258789, 81.84606170654297, 84.8936767578125, 87.94129943847656, 90.9889144897461, 94.03652954101562, 97.08415222167969, 100.13177490234375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 7.0, 11.0, 11.0, 12.0, 7.0, 15.0, 22.0, 28.0, 40.0, 33.0, 35.0, 36.0, 27.0, 39.0, 33.0, 48.0, 49.0, 42.0, 48.0, 53.0, 45.0, 37.0, 40.0, 25.0, 39.0, 30.0, 24.0, 27.0, 16.0, 15.0, 12.0, 11.0, 17.0, 13.0, 13.0, 9.0, 10.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.69091796875, -15.1474609375, -14.60400390625, -14.060546875, -13.51708984375, -12.9736328125, -12.43017578125, -11.88671875, -11.34326171875, -10.7998046875, -10.25634765625, -9.712890625, -9.16943359375, -8.6259765625, -8.08251953125, -7.5390625, -6.99560546875, -6.4521484375, -5.90869140625, -5.365234375, -4.82177734375, -4.2783203125, -3.73486328125, -3.19140625, -2.64794921875, -2.1044921875, -1.56103515625, -1.017578125, -0.47412109375, 0.0693359375, 0.61279296875, 1.15625, 1.69970703125, 2.2431640625, 2.78662109375, 3.330078125, 3.87353515625, 4.4169921875, 4.96044921875, 5.50390625, 6.04736328125, 6.5908203125, 7.13427734375, 7.677734375, 8.22119140625, 8.7646484375, 9.30810546875, 9.8515625, 10.39501953125, 10.9384765625, 11.48193359375, 12.025390625, 12.56884765625, 13.1123046875, 13.65576171875, 14.19921875, 14.74267578125, 15.2861328125, 15.82958984375, 16.373046875, 16.91650390625, 17.4599609375, 18.00341796875, 18.546875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 7.0, 16.0, 23.0, 31.0, 42.0, 66.0, 89.0, 115.0, 220.0, 295.0, 499.0, 658.0, 1017.0, 1568.0, 2268.0, 3291.0, 4905.0, 7417.0, 11603.0, 18162.0, 28752.0, 47115.0, 79972.0, 154798.0, 341440.0, 145386.0, 75766.0, 44513.0, 28063.0, 17360.0, 11145.0, 7229.0, 4834.0, 3189.0, 2138.0, 1472.0, 983.0, 708.0, 428.0, 311.0, 215.0, 150.0, 104.0, 61.0, 41.0, 31.0, 17.0, 14.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-4.01171875, -3.8800048828125, -3.748291015625, -3.6165771484375, -3.48486328125, -3.3531494140625, -3.221435546875, -3.0897216796875, -2.9580078125, -2.8262939453125, -2.694580078125, -2.5628662109375, -2.43115234375, -2.2994384765625, -2.167724609375, -2.0360107421875, -1.904296875, -1.7725830078125, -1.640869140625, -1.5091552734375, -1.37744140625, -1.2457275390625, -1.114013671875, -0.9822998046875, -0.8505859375, -0.7188720703125, -0.587158203125, -0.4554443359375, -0.32373046875, -0.1920166015625, -0.060302734375, 0.0714111328125, 0.203125, 0.3348388671875, 0.466552734375, 0.5982666015625, 0.72998046875, 0.8616943359375, 0.993408203125, 1.1251220703125, 1.2568359375, 1.3885498046875, 1.520263671875, 1.6519775390625, 1.78369140625, 1.9154052734375, 2.047119140625, 2.1788330078125, 2.310546875, 2.4422607421875, 2.573974609375, 2.7056884765625, 2.83740234375, 2.9691162109375, 3.100830078125, 3.2325439453125, 3.3642578125, 3.4959716796875, 3.627685546875, 3.7593994140625, 3.89111328125, 4.0228271484375, 4.154541015625, 4.2862548828125, 4.41796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 7.0, 12.0, 10.0, 11.0, 7.0, 15.0, 18.0, 25.0, 23.0, 27.0, 31.0, 20.0, 33.0, 38.0, 32.0, 44.0, 51.0, 44.0, 1064.0, 54.0, 42.0, 51.0, 36.0, 37.0, 35.0, 36.0, 30.0, 36.0, 23.0, 17.0, 20.0, 13.0, 13.0, 11.0, 10.0, 7.0, 4.0, 6.0, 9.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.0859375, -10.7568359375, -10.427734375, -10.0986328125, -9.76953125, -9.4404296875, -9.111328125, -8.7822265625, -8.453125, -8.1240234375, -7.794921875, -7.4658203125, -7.13671875, -6.8076171875, -6.478515625, -6.1494140625, -5.8203125, -5.4912109375, -5.162109375, -4.8330078125, -4.50390625, -4.1748046875, -3.845703125, -3.5166015625, -3.1875, -2.8583984375, -2.529296875, -2.2001953125, -1.87109375, -1.5419921875, -1.212890625, -0.8837890625, -0.5546875, -0.2255859375, 0.103515625, 0.4326171875, 0.76171875, 1.0908203125, 1.419921875, 1.7490234375, 2.078125, 2.4072265625, 2.736328125, 3.0654296875, 3.39453125, 3.7236328125, 4.052734375, 4.3818359375, 4.7109375, 5.0400390625, 5.369140625, 5.6982421875, 6.02734375, 6.3564453125, 6.685546875, 7.0146484375, 7.34375, 7.6728515625, 8.001953125, 8.3310546875, 8.66015625, 8.9892578125, 9.318359375, 9.6474609375, 9.9765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 7.0, 16.0, 19.0, 34.0, 47.0, 61.0, 93.0, 128.0, 191.0, 248.0, 389.0, 554.0, 818.0, 1226.0, 1835.0, 2824.0, 4414.0, 6828.0, 10811.0, 17463.0, 28962.0, 48680.0, 86382.0, 182982.0, 1402500.0, 129020.0, 68015.0, 39186.0, 23225.0, 14427.0, 8997.0, 5705.0, 3659.0, 2444.0, 1615.0, 1017.0, 709.0, 493.0, 336.0, 232.0, 147.0, 118.0, 72.0, 68.0, 41.0, 25.0, 23.0, 11.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.171875, -4.03857421875, -3.9052734375, -3.77197265625, -3.638671875, -3.50537109375, -3.3720703125, -3.23876953125, -3.10546875, -2.97216796875, -2.8388671875, -2.70556640625, -2.572265625, -2.43896484375, -2.3056640625, -2.17236328125, -2.0390625, -1.90576171875, -1.7724609375, -1.63916015625, -1.505859375, -1.37255859375, -1.2392578125, -1.10595703125, -0.97265625, -0.83935546875, -0.7060546875, -0.57275390625, -0.439453125, -0.30615234375, -0.1728515625, -0.03955078125, 0.09375, 0.22705078125, 0.3603515625, 0.49365234375, 0.626953125, 0.76025390625, 0.8935546875, 1.02685546875, 1.16015625, 1.29345703125, 1.4267578125, 1.56005859375, 1.693359375, 1.82666015625, 1.9599609375, 2.09326171875, 2.2265625, 2.35986328125, 2.4931640625, 2.62646484375, 2.759765625, 2.89306640625, 3.0263671875, 3.15966796875, 3.29296875, 3.42626953125, 3.5595703125, 3.69287109375, 3.826171875, 3.95947265625, 4.0927734375, 4.22607421875, 4.359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 1.0, 4.0, 4.0, 17.0, 19.0, 25.0, 32.0, 33.0, 44.0, 62.0, 64.0, 81.0, 104.0, 92.0, 89.0, 70.0, 55.0, 51.0, 32.0, 19.0, 29.0, 18.0, 9.0, 7.0, 7.0, 2.0, 7.0, 5.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028743743896484375, -0.002774745225906372, -0.0026751160621643066, -0.002575486898422241, -0.0024758577346801758, -0.0023762285709381104, -0.002276599407196045, -0.0021769702434539795, -0.002077341079711914, -0.0019777119159698486, -0.0018780827522277832, -0.0017784535884857178, -0.0016788244247436523, -0.001579195261001587, -0.0014795660972595215, -0.001379936933517456, -0.0012803077697753906, -0.0011806786060333252, -0.0010810494422912598, -0.0009814202785491943, -0.0008817911148071289, -0.0007821619510650635, -0.000682532787322998, -0.0005829036235809326, -0.0004832744598388672, -0.00038364529609680176, -0.00028401613235473633, -0.0001843869686126709, -8.475780487060547e-05, 1.4871358871459961e-05, 0.00011450052261352539, 0.00021412968635559082, 0.00031375885009765625, 0.0004133880138397217, 0.0005130171775817871, 0.0006126463413238525, 0.000712275505065918, 0.0008119046688079834, 0.0009115338325500488, 0.0010111629962921143, 0.0011107921600341797, 0.0012104213237762451, 0.0013100504875183105, 0.001409679651260376, 0.0015093088150024414, 0.0016089379787445068, 0.0017085671424865723, 0.0018081963062286377, 0.0019078254699707031, 0.0020074546337127686, 0.002107083797454834, 0.0022067129611968994, 0.002306342124938965, 0.0024059712886810303, 0.0025056004524230957, 0.002605229616165161, 0.0027048587799072266, 0.002804487943649292, 0.0029041171073913574, 0.003003746271133423, 0.0031033754348754883, 0.0032030045986175537, 0.003302633762359619, 0.0034022629261016846, 0.00350189208984375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 3.0, 8.0, 7.0, 12.0, 16.0, 23.0, 20.0, 41.0, 59.0, 88.0, 135.0, 464.0, 28154.0, 1018210.0, 796.0, 174.0, 100.0, 69.0, 46.0, 28.0, 26.0, 9.0, 22.0, 6.0, 5.0, 1.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.0938711166381836, -0.09112358093261719, -0.08837604522705078, -0.08562850952148438, -0.08288097381591797, -0.08013343811035156, -0.07738590240478516, -0.07463836669921875, -0.07189083099365234, -0.06914329528808594, -0.06639575958251953, -0.06364822387695312, -0.06090068817138672, -0.05815315246582031, -0.055405616760253906, -0.0526580810546875, -0.049910545349121094, -0.04716300964355469, -0.04441547393798828, -0.041667938232421875, -0.03892040252685547, -0.03617286682128906, -0.033425331115722656, -0.03067779541015625, -0.027930259704589844, -0.025182723999023438, -0.02243518829345703, -0.019687652587890625, -0.01694011688232422, -0.014192581176757812, -0.011445045471191406, -0.008697509765625, -0.005949974060058594, -0.0032024383544921875, -0.00045490264892578125, 0.002292633056640625, 0.005040168762207031, 0.0077877044677734375, 0.010535240173339844, 0.01328277587890625, 0.016030311584472656, 0.018777847290039062, 0.02152538299560547, 0.024272918701171875, 0.02702045440673828, 0.029767990112304688, 0.032515525817871094, 0.0352630615234375, 0.038010597229003906, 0.04075813293457031, 0.04350566864013672, 0.046253204345703125, 0.04900074005126953, 0.05174827575683594, 0.054495811462402344, 0.05724334716796875, 0.059990882873535156, 0.06273841857910156, 0.06548595428466797, 0.06823348999023438, 0.07098102569580078, 0.07372856140136719, 0.0764760971069336, 0.0792236328125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 50.0, 414.0, 457.0, 87.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009071114473044872, -0.008878137916326523, -0.008685160428285599, -0.00849218387156725, -0.0082992073148489, -0.008106229826807976, -0.007913253270089626, -0.007720276713371277, -0.00752729969099164, -0.007334322668612003, -0.007141346111893654, -0.006948369089514017, -0.00675539206713438, -0.006562415510416031, -0.006369438488036394, -0.006176461465656757, -0.005983484908938408, -0.005790507886558771, -0.005597531329840422, -0.005404554307460785, -0.0052115777507424355, -0.005018600728362799, -0.004825623705983162, -0.0046326471492648125, -0.004439670126885176, -0.004246693104505539, -0.0040537165477871895, -0.0038607395254075527, -0.0036677627358585596, -0.0034747859463095665, -0.0032818089239299297, -0.0030888321343809366, -0.0028958553448319435, -0.0027028785552829504, -0.0025099017657339573, -0.0023169247433543205, -0.0021239479538053274, -0.0019309711642563343, -0.0017379942582920194, -0.0015450173523277044, -0.0013520405627787113, -0.0011590637732297182, -0.0009660868672654033, -0.0007731100195087492, -0.0005801331717520952, -0.0003871563239954412, -0.00019417947623878717, -1.2025702744722366e-06, 0.00019177421927452087, 0.0003847510670311749, 0.0005777279147878289, 0.000770704762544483, 0.000963681610301137, 0.00115665839985013, 0.001349635305814445, 0.00154261221177876, 0.001735589001327753, 0.0019285657908767462, 0.0021215425804257393, 0.002314519602805376, 0.002507496392354369, 0.0027004731819033623, 0.002893450204282999, 0.003086426993831992, 0.0032794037833809853]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 11.0, 6.0, 13.0, 12.0, 14.0, 13.0, 19.0, 29.0, 29.0, 23.0, 29.0, 30.0, 30.0, 30.0, 34.0, 54.0, 48.0, 53.0, 47.0, 38.0, 39.0, 31.0, 39.0, 27.0, 27.0, 37.0, 26.0, 32.0, 30.0, 20.0, 23.0, 15.0, 14.0, 22.0, 9.0, 8.0, 8.0, 4.0, 7.0, 4.0, 4.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011401176452636719, -0.001101718284189701, -0.0010633189231157303, -0.0010249195620417595, -0.0009865202009677887, -0.0009481208398938179, -0.0009097214788198471, -0.0008713221177458763, -0.0008329227566719055, -0.0007945233955979347, -0.0007561240345239639, -0.0007177246734499931, -0.0006793253123760223, -0.0006409259513020515, -0.0006025265902280807, -0.00056412722915411, -0.0005257278680801392, -0.00048732850700616837, -0.00044892914593219757, -0.0004105297848582268, -0.000372130423784256, -0.0003337310627102852, -0.0002953317016363144, -0.0002569323405623436, -0.0002185329794883728, -0.000180133618414402, -0.0001417342573404312, -0.00010333489626646042, -6.493553519248962e-05, -2.653617411851883e-05, 1.1863186955451965e-05, 5.026254802942276e-05, 8.866190910339355e-05, 0.00012706127017736435, 0.00016546063125133514, 0.00020385999232530594, 0.00024225935339927673, 0.00028065871447324753, 0.0003190580755472183, 0.0003574574366211891, 0.0003958567976951599, 0.0004342561587691307, 0.0004726555198431015, 0.0005110548809170723, 0.0005494542419910431, 0.0005878536030650139, 0.0006262529641389847, 0.0006646523252129555, 0.0007030516862869263, 0.0007414510473608971, 0.0007798504084348679, 0.0008182497695088387, 0.0008566491305828094, 0.0008950484916567802, 0.000933447852730751, 0.0009718472138047218, 0.0010102465748786926, 0.0010486459359526634, 0.0010870452970266342, 0.001125444658100605, 0.0011638440191745758, 0.0012022433802485466, 0.0012406427413225174, 0.0012790421023964882, 0.001317441463470459]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 7.0, 12.0, 10.0, 12.0, 7.0, 15.0, 24.0, 26.0, 40.0, 34.0, 34.0, 36.0, 27.0, 40.0, 33.0, 47.0, 50.0, 42.0, 48.0, 52.0, 45.0, 37.0, 40.0, 25.0, 40.0, 32.0, 23.0, 25.0, 16.0, 16.0, 11.0, 12.0, 16.0, 13.0, 13.0, 9.0, 12.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.690673828125, -15.14697265625, -14.603271484375, -14.0595703125, -13.515869140625, -12.97216796875, -12.428466796875, -11.884765625, -11.341064453125, -10.79736328125, -10.253662109375, -9.7099609375, -9.166259765625, -8.62255859375, -8.078857421875, -7.53515625, -6.991455078125, -6.44775390625, -5.904052734375, -5.3603515625, -4.816650390625, -4.27294921875, -3.729248046875, -3.185546875, -2.641845703125, -2.09814453125, -1.554443359375, -1.0107421875, -0.467041015625, 0.07666015625, 0.620361328125, 1.1640625, 1.707763671875, 2.25146484375, 2.795166015625, 3.3388671875, 3.882568359375, 4.42626953125, 4.969970703125, 5.513671875, 6.057373046875, 6.60107421875, 7.144775390625, 7.6884765625, 8.232177734375, 8.77587890625, 9.319580078125, 9.86328125, 10.406982421875, 10.95068359375, 11.494384765625, 12.0380859375, 12.581787109375, 13.12548828125, 13.669189453125, 14.212890625, 14.756591796875, 15.30029296875, 15.843994140625, 16.3876953125, 16.931396484375, 17.47509765625, 18.018798828125, 18.5625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 8.0, 14.0, 15.0, 18.0, 10.0, 30.0, 43.0, 61.0, 98.0, 137.0, 238.0, 383.0, 732.0, 1832.0, 5616.0, 18816.0, 82804.0, 548910.0, 314911.0, 53430.0, 13423.0, 4150.0, 1414.0, 565.0, 328.0, 165.0, 107.0, 80.0, 49.0, 38.0, 23.0, 15.0, 18.0, 14.0, 14.0, 10.0, 11.0, 6.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.20751953125, -14.6806640625, -14.15380859375, -13.626953125, -13.10009765625, -12.5732421875, -12.04638671875, -11.51953125, -10.99267578125, -10.4658203125, -9.93896484375, -9.412109375, -8.88525390625, -8.3583984375, -7.83154296875, -7.3046875, -6.77783203125, -6.2509765625, -5.72412109375, -5.197265625, -4.67041015625, -4.1435546875, -3.61669921875, -3.08984375, -2.56298828125, -2.0361328125, -1.50927734375, -0.982421875, -0.45556640625, 0.0712890625, 0.59814453125, 1.125, 1.65185546875, 2.1787109375, 2.70556640625, 3.232421875, 3.75927734375, 4.2861328125, 4.81298828125, 5.33984375, 5.86669921875, 6.3935546875, 6.92041015625, 7.447265625, 7.97412109375, 8.5009765625, 9.02783203125, 9.5546875, 10.08154296875, 10.6083984375, 11.13525390625, 11.662109375, 12.18896484375, 12.7158203125, 13.24267578125, 13.76953125, 14.29638671875, 14.8232421875, 15.35009765625, 15.876953125, 16.40380859375, 16.9306640625, 17.45751953125, 17.984375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 9.0, 7.0, 9.0, 17.0, 16.0, 20.0, 15.0, 34.0, 39.0, 37.0, 39.0, 38.0, 50.0, 50.0, 64.0, 218.0, 1864.0, 103.0, 57.0, 50.0, 56.0, 33.0, 34.0, 33.0, 27.0, 28.0, 23.0, 11.0, 19.0, 13.0, 7.0, 6.0, 2.0, 3.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.4609375, -53.421875, -51.3828125, -49.34375, -47.3046875, -45.265625, -43.2265625, -41.1875, -39.1484375, -37.109375, -35.0703125, -33.03125, -30.9921875, -28.953125, -26.9140625, -24.875, -22.8359375, -20.796875, -18.7578125, -16.71875, -14.6796875, -12.640625, -10.6015625, -8.5625, -6.5234375, -4.484375, -2.4453125, -0.40625, 1.6328125, 3.671875, 5.7109375, 7.75, 9.7890625, 11.828125, 13.8671875, 15.90625, 17.9453125, 19.984375, 22.0234375, 24.0625, 26.1015625, 28.140625, 30.1796875, 32.21875, 34.2578125, 36.296875, 38.3359375, 40.375, 42.4140625, 44.453125, 46.4921875, 48.53125, 50.5703125, 52.609375, 54.6484375, 56.6875, 58.7265625, 60.765625, 62.8046875, 64.84375, 66.8828125, 68.921875, 70.9609375, 73.0]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 8.0, 9.0, 6.0, 5.0, 9.0, 12.0, 20.0, 21.0, 26.0, 39.0, 52.0, 63.0, 97.0, 118.0, 181.0, 259.0, 479.0, 1740.0, 2693106.0, 446706.0, 1418.0, 419.0, 257.0, 177.0, 132.0, 89.0, 70.0, 55.0, 26.0, 28.0, 19.0, 17.0, 10.0, 10.0, 10.0, 5.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.0, -157.494140625, -152.98828125, -148.482421875, -143.9765625, -139.470703125, -134.96484375, -130.458984375, -125.953125, -121.447265625, -116.94140625, -112.435546875, -107.9296875, -103.423828125, -98.91796875, -94.412109375, -89.90625, -85.400390625, -80.89453125, -76.388671875, -71.8828125, -67.376953125, -62.87109375, -58.365234375, -53.859375, -49.353515625, -44.84765625, -40.341796875, -35.8359375, -31.330078125, -26.82421875, -22.318359375, -17.8125, -13.306640625, -8.80078125, -4.294921875, 0.2109375, 4.716796875, 9.22265625, 13.728515625, 18.234375, 22.740234375, 27.24609375, 31.751953125, 36.2578125, 40.763671875, 45.26953125, 49.775390625, 54.28125, 58.787109375, 63.29296875, 67.798828125, 72.3046875, 76.810546875, 81.31640625, 85.822265625, 90.328125, 94.833984375, 99.33984375, 103.845703125, 108.3515625, 112.857421875, 117.36328125, 121.869140625, 126.375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 666.0, 346.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-581.2677001953125, -570.059326171875, -558.8509521484375, -547.642578125, -536.4342041015625, -525.225830078125, -514.0174560546875, -502.80908203125, -491.6007080078125, -480.392333984375, -469.1839599609375, -457.9755859375, -446.7672119140625, -435.558837890625, -424.3504638671875, -413.14208984375, -401.9336853027344, -390.7253112792969, -379.5169372558594, -368.3085632324219, -357.1001892089844, -345.8918151855469, -334.68341064453125, -323.47503662109375, -312.26666259765625, -301.05828857421875, -289.84991455078125, -278.64154052734375, -267.43316650390625, -256.22479248046875, -245.0164031982422, -233.8080291748047, -222.5996856689453, -211.3913116455078, -200.1829376220703, -188.97454833984375, -177.76617431640625, -166.55780029296875, -155.34942626953125, -144.14105224609375, -132.93267822265625, -121.72430419921875, -110.51593017578125, -99.30754852294922, -88.09917449951172, -76.89080047607422, -65.68241882324219, -54.47404479980469, -43.26567077636719, -32.05729675292969, -20.848918914794922, -9.640541076660156, 1.5678329467773438, 12.776206970214844, 23.984588623046875, 35.192962646484375, 46.401336669921875, 57.609710693359375, 68.81808471679688, 80.0264663696289, 91.2348403930664, 102.4432144165039, 113.65159606933594, 124.85997009277344, 136.06834411621094]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 7.0, 11.0, 9.0, 16.0, 15.0, 13.0, 22.0, 18.0, 16.0, 19.0, 22.0, 32.0, 33.0, 44.0, 29.0, 29.0, 28.0, 54.0, 37.0, 38.0, 36.0, 39.0, 36.0, 48.0, 38.0, 32.0, 33.0, 36.0, 33.0, 22.0, 17.0, 24.0, 11.0, 12.0, 13.0, 12.0, 9.0, 15.0, 9.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0], "bins": [-136.525146484375, -132.57293701171875, -128.62074279785156, -124.66853332519531, -120.71632385253906, -116.76412200927734, -112.81192016601562, -108.85971069335938, -104.90750885009766, -100.95530700683594, -97.00309753417969, -93.05089569091797, -89.09868621826172, -85.146484375, -81.19427490234375, -77.24207305908203, -73.28987121582031, -69.3376693725586, -65.38545989990234, -61.433258056640625, -57.48105239868164, -53.528846740722656, -49.57664108276367, -45.62443542480469, -41.67222595214844, -37.72002029418945, -33.76781463623047, -29.815610885620117, -25.863407135009766, -21.91120147705078, -17.958995819091797, -14.006792068481445, -10.054588317871094, -6.102383613586426, -2.1501784324645996, 1.8020267486572266, 5.7542314529418945, 9.706436157226562, 13.658641815185547, 17.6108455657959, 21.563051223754883, 25.515256881713867, 29.46746063232422, 33.4196662902832, 37.37187194824219, 41.324073791503906, 45.276283264160156, 49.228485107421875, 53.18069076538086, 57.132896423339844, 61.08510208129883, 65.03730773925781, 68.98950958251953, 72.94171142578125, 76.8939208984375, 80.84612274169922, 84.79833221435547, 88.75053405761719, 92.70274353027344, 96.65494537353516, 100.6071548461914, 104.55935668945312, 108.51156616210938, 112.4637680053711, 116.41596984863281]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 2.0, 6.0, 8.0, 11.0, 6.0, 15.0, 14.0, 14.0, 26.0, 22.0, 38.0, 30.0, 36.0, 37.0, 29.0, 36.0, 35.0, 42.0, 51.0, 43.0, 47.0, 42.0, 35.0, 43.0, 43.0, 29.0, 33.0, 26.0, 23.0, 36.0, 14.0, 12.0, 14.0, 18.0, 12.0, 14.0, 11.0, 13.0, 8.0, 10.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.60400390625, -15.0673828125, -14.53076171875, -13.994140625, -13.45751953125, -12.9208984375, -12.38427734375, -11.84765625, -11.31103515625, -10.7744140625, -10.23779296875, -9.701171875, -9.16455078125, -8.6279296875, -8.09130859375, -7.5546875, -7.01806640625, -6.4814453125, -5.94482421875, -5.408203125, -4.87158203125, -4.3349609375, -3.79833984375, -3.26171875, -2.72509765625, -2.1884765625, -1.65185546875, -1.115234375, -0.57861328125, -0.0419921875, 0.49462890625, 1.03125, 1.56787109375, 2.1044921875, 2.64111328125, 3.177734375, 3.71435546875, 4.2509765625, 4.78759765625, 5.32421875, 5.86083984375, 6.3974609375, 6.93408203125, 7.470703125, 8.00732421875, 8.5439453125, 9.08056640625, 9.6171875, 10.15380859375, 10.6904296875, 11.22705078125, 11.763671875, 12.30029296875, 12.8369140625, 13.37353515625, 13.91015625, 14.44677734375, 14.9833984375, 15.52001953125, 16.056640625, 16.59326171875, 17.1298828125, 17.66650390625, 18.203125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 10.0, 12.0, 7.0, 10.0, 10.0, 16.0, 18.0, 19.0, 21.0, 30.0, 30.0, 56.0, 66.0, 63.0, 81.0, 112.0, 140.0, 161.0, 253.0, 496.0, 1146.0, 5275.0, 68242.0, 1375927.0, 2508128.0, 219397.0, 10942.0, 1792.0, 549.0, 335.0, 209.0, 116.0, 107.0, 92.0, 64.0, 45.0, 51.0, 38.0, 35.0, 26.0, 27.0, 12.0, 18.0, 27.0, 14.0, 10.0, 12.0, 11.0, 12.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-35.03125, -33.87060546875, -32.7099609375, -31.54931640625, -30.388671875, -29.22802734375, -28.0673828125, -26.90673828125, -25.74609375, -24.58544921875, -23.4248046875, -22.26416015625, -21.103515625, -19.94287109375, -18.7822265625, -17.62158203125, -16.4609375, -15.30029296875, -14.1396484375, -12.97900390625, -11.818359375, -10.65771484375, -9.4970703125, -8.33642578125, -7.17578125, -6.01513671875, -4.8544921875, -3.69384765625, -2.533203125, -1.37255859375, -0.2119140625, 0.94873046875, 2.109375, 3.27001953125, 4.4306640625, 5.59130859375, 6.751953125, 7.91259765625, 9.0732421875, 10.23388671875, 11.39453125, 12.55517578125, 13.7158203125, 14.87646484375, 16.037109375, 17.19775390625, 18.3583984375, 19.51904296875, 20.6796875, 21.84033203125, 23.0009765625, 24.16162109375, 25.322265625, 26.48291015625, 27.6435546875, 28.80419921875, 29.96484375, 31.12548828125, 32.2861328125, 33.44677734375, 34.607421875, 35.76806640625, 36.9287109375, 38.08935546875, 39.25]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 12.0, 18.0, 17.0, 24.0, 27.0, 41.0, 49.0, 68.0, 115.0, 133.0, 189.0, 230.0, 331.0, 466.0, 526.0, 490.0, 386.0, 238.0, 212.0, 122.0, 91.0, 80.0, 57.0, 37.0, 24.0, 27.0, 20.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -30.244873046875, -29.25537109375, -28.265869140625, -27.2763671875, -26.286865234375, -25.29736328125, -24.307861328125, -23.318359375, -22.328857421875, -21.33935546875, -20.349853515625, -19.3603515625, -18.370849609375, -17.38134765625, -16.391845703125, -15.40234375, -14.412841796875, -13.42333984375, -12.433837890625, -11.4443359375, -10.454833984375, -9.46533203125, -8.475830078125, -7.486328125, -6.496826171875, -5.50732421875, -4.517822265625, -3.5283203125, -2.538818359375, -1.54931640625, -0.559814453125, 0.4296875, 1.419189453125, 2.40869140625, 3.398193359375, 4.3876953125, 5.377197265625, 6.36669921875, 7.356201171875, 8.345703125, 9.335205078125, 10.32470703125, 11.314208984375, 12.3037109375, 13.293212890625, 14.28271484375, 15.272216796875, 16.26171875, 17.251220703125, 18.24072265625, 19.230224609375, 20.2197265625, 21.209228515625, 22.19873046875, 23.188232421875, 24.177734375, 25.167236328125, 26.15673828125, 27.146240234375, 28.1357421875, 29.125244140625, 30.11474609375, 31.104248046875, 32.09375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 9.0, 5.0, 6.0, 10.0, 22.0, 15.0, 32.0, 32.0, 48.0, 57.0, 84.0, 102.0, 130.0, 199.0, 224.0, 388.0, 628.0, 3192.0, 4168702.0, 18084.0, 764.0, 410.0, 267.0, 176.0, 148.0, 117.0, 95.0, 76.0, 52.0, 48.0, 31.0, 28.0, 28.0, 20.0, 11.0, 16.0, 9.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-197.5, -191.052734375, -184.60546875, -178.158203125, -171.7109375, -165.263671875, -158.81640625, -152.369140625, -145.921875, -139.474609375, -133.02734375, -126.580078125, -120.1328125, -113.685546875, -107.23828125, -100.791015625, -94.34375, -87.896484375, -81.44921875, -75.001953125, -68.5546875, -62.107421875, -55.66015625, -49.212890625, -42.765625, -36.318359375, -29.87109375, -23.423828125, -16.9765625, -10.529296875, -4.08203125, 2.365234375, 8.8125, 15.259765625, 21.70703125, 28.154296875, 34.6015625, 41.048828125, 47.49609375, 53.943359375, 60.390625, 66.837890625, 73.28515625, 79.732421875, 86.1796875, 92.626953125, 99.07421875, 105.521484375, 111.96875, 118.416015625, 124.86328125, 131.310546875, 137.7578125, 144.205078125, 150.65234375, 157.099609375, 163.546875, 169.994140625, 176.44140625, 182.888671875, 189.3359375, 195.783203125, 202.23046875, 208.677734375, 215.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 12.0, 298.0, 632.0, 66.0, 5.0, 2.0], "bins": [-1146.711669921875, -1127.6798095703125, -1108.64794921875, -1089.615966796875, -1070.5841064453125, -1051.55224609375, -1032.5203857421875, -1013.4884643554688, -994.45654296875, -975.4246826171875, -956.3927612304688, -937.3609008789062, -918.3289794921875, -899.297119140625, -880.2651977539062, -861.2333374023438, -842.2014770507812, -823.1696166992188, -804.1376953125, -785.1058349609375, -766.0739135742188, -747.0420532226562, -728.0101318359375, -708.978271484375, -689.9464111328125, -670.91455078125, -651.8826293945312, -632.8507690429688, -613.81884765625, -594.7869873046875, -575.7550659179688, -556.7232055664062, -537.6912841796875, -518.659423828125, -499.62750244140625, -480.5956115722656, -461.563720703125, -442.5318603515625, -423.4999694824219, -404.46807861328125, -385.43621826171875, -366.4043273925781, -347.3724365234375, -328.3405456542969, -309.30865478515625, -290.27679443359375, -271.2449035644531, -252.2130126953125, -233.18112182617188, -214.14923095703125, -195.11734008789062, -176.08546447753906, -157.05357360839844, -138.0216827392578, -118.98979949951172, -99.95791625976562, -80.92601776123047, -61.89413070678711, -42.86224365234375, -23.83035659790039, -4.798469543457031, 14.233421325683594, 33.26530456542969, 52.29718780517578, 71.3290786743164]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 6.0, 6.0, 9.0, 8.0, 11.0, 17.0, 14.0, 21.0, 24.0, 26.0, 34.0, 39.0, 41.0, 46.0, 44.0, 39.0, 36.0, 39.0, 55.0, 38.0, 36.0, 37.0, 40.0, 47.0, 36.0, 37.0, 38.0, 24.0, 22.0, 17.0, 21.0, 17.0, 17.0, 11.0, 13.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.75, -93.59977722167969, -90.4495620727539, -87.2993392944336, -84.14912414550781, -80.9989013671875, -77.84867858886719, -74.6984634399414, -71.54824829101562, -68.39802551269531, -65.24781036376953, -62.09758758544922, -58.94737243652344, -55.797149658203125, -52.64693069458008, -49.49671173095703, -46.34648895263672, -43.19626998901367, -40.046051025390625, -36.89582824707031, -33.74561309814453, -30.59539222717285, -27.445171356201172, -24.294952392578125, -21.144733428955078, -17.99451446533203, -14.844294548034668, -11.694074630737305, -8.543855667114258, -5.393636703491211, -2.2434158325195312, 0.9068031311035156, 4.0570220947265625, 7.207241535186768, 10.357460975646973, 13.507680892944336, 16.657899856567383, 19.80811882019043, 22.95833969116211, 26.108558654785156, 29.258777618408203, 32.40899658203125, 35.5592155456543, 38.709434509277344, 41.859657287597656, 45.00987243652344, 48.16009521484375, 51.3103141784668, 54.460533142089844, 57.61075210571289, 60.76097106933594, 63.91119384765625, 67.06140899658203, 70.21163177490234, 73.36184692382812, 76.51206970214844, 79.66229248046875, 82.81251525878906, 85.96273040771484, 89.11295318603516, 92.26316833496094, 95.41339111328125, 98.56361389160156, 101.71382904052734, 104.86404418945312]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 9.0, 2.0, 16.0, 12.0, 8.0, 18.0, 17.0, 19.0, 14.0, 27.0, 36.0, 29.0, 36.0, 25.0, 50.0, 48.0, 41.0, 36.0, 65.0, 36.0, 39.0, 36.0, 55.0, 31.0, 34.0, 36.0, 26.0, 22.0, 30.0, 24.0, 13.0, 13.0, 16.0, 16.0, 12.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5703125, -15.0377197265625, -14.505126953125, -13.9725341796875, -13.43994140625, -12.9073486328125, -12.374755859375, -11.8421630859375, -11.3095703125, -10.7769775390625, -10.244384765625, -9.7117919921875, -9.17919921875, -8.6466064453125, -8.114013671875, -7.5814208984375, -7.048828125, -6.5162353515625, -5.983642578125, -5.4510498046875, -4.91845703125, -4.3858642578125, -3.853271484375, -3.3206787109375, -2.7880859375, -2.2554931640625, -1.722900390625, -1.1903076171875, -0.65771484375, -0.1251220703125, 0.407470703125, 0.9400634765625, 1.47265625, 2.0052490234375, 2.537841796875, 3.0704345703125, 3.60302734375, 4.1356201171875, 4.668212890625, 5.2008056640625, 5.7333984375, 6.2659912109375, 6.798583984375, 7.3311767578125, 7.86376953125, 8.3963623046875, 8.928955078125, 9.4615478515625, 9.994140625, 10.5267333984375, 11.059326171875, 11.5919189453125, 12.12451171875, 12.6571044921875, 13.189697265625, 13.7222900390625, 14.2548828125, 14.7874755859375, 15.320068359375, 15.8526611328125, 16.38525390625, 16.9178466796875, 17.450439453125, 17.9830322265625, 18.515625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 15.0, 45.0, 36.0, 89.0, 101.0, 187.0, 264.0, 360.0, 606.0, 912.0, 1279.0, 2001.0, 2931.0, 4273.0, 6270.0, 8942.0, 13509.0, 20087.0, 29833.0, 47638.0, 79551.0, 146497.0, 315911.0, 147289.0, 79757.0, 48186.0, 30048.0, 20105.0, 13598.0, 9028.0, 6240.0, 4193.0, 2930.0, 1974.0, 1272.0, 878.0, 571.0, 393.0, 253.0, 173.0, 112.0, 68.0, 49.0, 32.0, 22.0, 10.0, 6.0, 10.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.466278076171875, -3.34466552734375, -3.223052978515625, -3.1014404296875, -2.979827880859375, -2.85821533203125, -2.736602783203125, -2.614990234375, -2.493377685546875, -2.37176513671875, -2.250152587890625, -2.1285400390625, -2.006927490234375, -1.88531494140625, -1.763702392578125, -1.64208984375, -1.520477294921875, -1.39886474609375, -1.277252197265625, -1.1556396484375, -1.034027099609375, -0.91241455078125, -0.790802001953125, -0.669189453125, -0.547576904296875, -0.42596435546875, -0.304351806640625, -0.1827392578125, -0.061126708984375, 0.06048583984375, 0.182098388671875, 0.3037109375, 0.425323486328125, 0.54693603515625, 0.668548583984375, 0.7901611328125, 0.911773681640625, 1.03338623046875, 1.154998779296875, 1.276611328125, 1.398223876953125, 1.51983642578125, 1.641448974609375, 1.7630615234375, 1.884674072265625, 2.00628662109375, 2.127899169921875, 2.24951171875, 2.371124267578125, 2.49273681640625, 2.614349365234375, 2.7359619140625, 2.857574462890625, 2.97918701171875, 3.100799560546875, 3.222412109375, 3.344024658203125, 3.46563720703125, 3.587249755859375, 3.7088623046875, 3.830474853515625, 3.95208740234375, 4.073699951171875, 4.1953125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 8.0, 11.0, 15.0, 7.0, 18.0, 19.0, 31.0, 20.0, 24.0, 29.0, 26.0, 33.0, 35.0, 37.0, 44.0, 35.0, 49.0, 1082.0, 60.0, 45.0, 49.0, 47.0, 35.0, 38.0, 30.0, 32.0, 30.0, 29.0, 22.0, 18.0, 10.0, 10.0, 8.0, 8.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8359375, -12.47314453125, -12.1103515625, -11.74755859375, -11.384765625, -11.02197265625, -10.6591796875, -10.29638671875, -9.93359375, -9.57080078125, -9.2080078125, -8.84521484375, -8.482421875, -8.11962890625, -7.7568359375, -7.39404296875, -7.03125, -6.66845703125, -6.3056640625, -5.94287109375, -5.580078125, -5.21728515625, -4.8544921875, -4.49169921875, -4.12890625, -3.76611328125, -3.4033203125, -3.04052734375, -2.677734375, -2.31494140625, -1.9521484375, -1.58935546875, -1.2265625, -0.86376953125, -0.5009765625, -0.13818359375, 0.224609375, 0.58740234375, 0.9501953125, 1.31298828125, 1.67578125, 2.03857421875, 2.4013671875, 2.76416015625, 3.126953125, 3.48974609375, 3.8525390625, 4.21533203125, 4.578125, 4.94091796875, 5.3037109375, 5.66650390625, 6.029296875, 6.39208984375, 6.7548828125, 7.11767578125, 7.48046875, 7.84326171875, 8.2060546875, 8.56884765625, 8.931640625, 9.29443359375, 9.6572265625, 10.02001953125, 10.3828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 7.0, 10.0, 19.0, 18.0, 35.0, 59.0, 93.0, 140.0, 180.0, 310.0, 441.0, 712.0, 1139.0, 1793.0, 3000.0, 5060.0, 8497.0, 15023.0, 26328.0, 46500.0, 85942.0, 190597.0, 1431735.0, 129072.0, 65111.0, 36047.0, 20355.0, 11495.0, 6881.0, 4042.0, 2462.0, 1481.0, 891.0, 575.0, 355.0, 250.0, 160.0, 108.0, 61.0, 53.0, 31.0, 22.0, 14.0, 9.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.84375, -4.68890380859375, -4.5340576171875, -4.37921142578125, -4.224365234375, -4.06951904296875, -3.9146728515625, -3.75982666015625, -3.60498046875, -3.45013427734375, -3.2952880859375, -3.14044189453125, -2.985595703125, -2.83074951171875, -2.6759033203125, -2.52105712890625, -2.3662109375, -2.21136474609375, -2.0565185546875, -1.90167236328125, -1.746826171875, -1.59197998046875, -1.4371337890625, -1.28228759765625, -1.12744140625, -0.97259521484375, -0.8177490234375, -0.66290283203125, -0.508056640625, -0.35321044921875, -0.1983642578125, -0.04351806640625, 0.111328125, 0.26617431640625, 0.4210205078125, 0.57586669921875, 0.730712890625, 0.88555908203125, 1.0404052734375, 1.19525146484375, 1.35009765625, 1.50494384765625, 1.6597900390625, 1.81463623046875, 1.969482421875, 2.12432861328125, 2.2791748046875, 2.43402099609375, 2.5888671875, 2.74371337890625, 2.8985595703125, 3.05340576171875, 3.208251953125, 3.36309814453125, 3.5179443359375, 3.67279052734375, 3.82763671875, 3.98248291015625, 4.1373291015625, 4.29217529296875, 4.447021484375, 4.60186767578125, 4.7567138671875, 4.91156005859375, 5.06640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 12.0, 6.0, 12.0, 12.0, 20.0, 30.0, 28.0, 46.0, 47.0, 61.0, 79.0, 101.0, 86.0, 87.0, 79.0, 62.0, 54.0, 40.0, 30.0, 21.0, 20.0, 21.0, 9.0, 7.0, 9.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004505157470703125, -0.004396766424179077, -0.004288375377655029, -0.0041799843311309814, -0.004071593284606934, -0.003963202238082886, -0.003854811191558838, -0.00374642014503479, -0.003638029098510742, -0.0035296380519866943, -0.0034212470054626465, -0.0033128559589385986, -0.0032044649124145508, -0.003096073865890503, -0.002987682819366455, -0.0028792917728424072, -0.0027709007263183594, -0.0026625096797943115, -0.0025541186332702637, -0.002445727586746216, -0.002337336540222168, -0.00222894549369812, -0.0021205544471740723, -0.0020121634006500244, -0.0019037723541259766, -0.0017953813076019287, -0.0016869902610778809, -0.001578599214553833, -0.0014702081680297852, -0.0013618171215057373, -0.0012534260749816895, -0.0011450350284576416, -0.0010366439819335938, -0.0009282529354095459, -0.000819861888885498, -0.0007114708423614502, -0.0006030797958374023, -0.0004946887493133545, -0.00038629770278930664, -0.0002779066562652588, -0.00016951560974121094, -6.112456321716309e-05, 4.7266483306884766e-05, 0.00015565752983093262, 0.00026404857635498047, 0.0003724396228790283, 0.00048083066940307617, 0.000589221715927124, 0.0006976127624511719, 0.0008060038089752197, 0.0009143948554992676, 0.0010227859020233154, 0.0011311769485473633, 0.0012395679950714111, 0.001347959041595459, 0.0014563500881195068, 0.0015647411346435547, 0.0016731321811676025, 0.0017815232276916504, 0.0018899142742156982, 0.001998305320739746, 0.002106696367263794, 0.002215087413787842, 0.0023234784603118896, 0.0024318695068359375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 5.0, 4.0, 16.0, 16.0, 23.0, 19.0, 26.0, 49.0, 42.0, 66.0, 138.0, 293.0, 1538.0, 1043364.0, 2173.0, 334.0, 135.0, 72.0, 57.0, 48.0, 29.0, 24.0, 15.0, 13.0, 5.0, 8.0, 10.0, 10.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06182861328125, -0.05908679962158203, -0.05634498596191406, -0.053603172302246094, -0.050861358642578125, -0.048119544982910156, -0.04537773132324219, -0.04263591766357422, -0.03989410400390625, -0.03715229034423828, -0.03441047668457031, -0.031668663024902344, -0.028926849365234375, -0.026185035705566406, -0.023443222045898438, -0.02070140838623047, -0.0179595947265625, -0.015217781066894531, -0.012475967407226562, -0.009734153747558594, -0.006992340087890625, -0.004250526428222656, -0.0015087127685546875, 0.0012331008911132812, 0.00397491455078125, 0.006716728210449219, 0.009458541870117188, 0.012200355529785156, 0.014942169189453125, 0.017683982849121094, 0.020425796508789062, 0.02316761016845703, 0.025909423828125, 0.02865123748779297, 0.03139305114746094, 0.034134864807128906, 0.036876678466796875, 0.039618492126464844, 0.04236030578613281, 0.04510211944580078, 0.04784393310546875, 0.05058574676513672, 0.05332756042480469, 0.056069374084472656, 0.058811187744140625, 0.061553001403808594, 0.06429481506347656, 0.06703662872314453, 0.0697784423828125, 0.07252025604248047, 0.07526206970214844, 0.0780038833618164, 0.08074569702148438, 0.08348751068115234, 0.08622932434082031, 0.08897113800048828, 0.09171295166015625, 0.09445476531982422, 0.09719657897949219, 0.09993839263916016, 0.10268020629882812, 0.1054220199584961, 0.10816383361816406, 0.11090564727783203, 0.1136474609375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 25.0, 74.0, 175.0, 293.0, 241.0, 129.0, 48.0, 13.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00384248117916286, -0.0037547254469245672, -0.003666969481855631, -0.003579213749617338, -0.0034914580173790455, -0.003403702285140753, -0.0033159463200718164, -0.0032281905878335238, -0.0031404346227645874, -0.0030526788905262947, -0.0029649229254573584, -0.0028771671932190657, -0.002789411460980773, -0.0027016554959118366, -0.002613899763673544, -0.0025261440314352512, -0.0024383882991969585, -0.002350632566958666, -0.0022628766018897295, -0.002175120869651437, -0.002087365137413144, -0.0019996091723442078, -0.001911853440105915, -0.0018240977078676224, -0.0017363418592140079, -0.0016485860105603933, -0.0015608302783221006, -0.0014730744296684861, -0.0013853185810148716, -0.001297562848776579, -0.0012098070001229644, -0.0011220511514693499, -0.0010342954192310572, -0.0009465396287851036, -0.00085878383833915, -0.0007710279896855354, -0.0006832721992395818, -0.0005955164087936282, -0.0005077605601400137, -0.0004200047696940601, -0.0003322489792481065, -0.00024449318880215287, -0.0001567373692523688, -6.898154970258474e-05, 1.8774240743368864e-05, 0.00010653003118932247, 0.000194285879842937, 0.0002820416702888906, 0.0003697974607348442, 0.0004575532511807978, 0.0005453090416267514, 0.0006330648902803659, 0.0007208206807263196, 0.0008085764711722732, 0.0008963323198258877, 0.0009840880520641804, 0.001071843900717795, 0.0011595997493714094, 0.0012473554816097021, 0.0013351113302633166, 0.0014228671789169312, 0.0015106229111552238, 0.0015983787598088384, 0.0016861346084624529, 0.0017738903407007456]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 7.0, 9.0, 7.0, 3.0, 14.0, 6.0, 13.0, 13.0, 21.0, 19.0, 23.0, 26.0, 33.0, 31.0, 38.0, 27.0, 33.0, 35.0, 30.0, 33.0, 55.0, 56.0, 28.0, 38.0, 34.0, 36.0, 27.0, 39.0, 41.0, 24.0, 36.0, 20.0, 30.0, 24.0, 18.0, 18.0, 11.0, 8.0, 12.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0013010501861572266, -0.0012602517381310463, -0.001219453290104866, -0.0011786548420786858, -0.0011378563940525055, -0.0010970579460263252, -0.001056259498000145, -0.0010154610499739647, -0.0009746626019477844, -0.0009338641539216042, -0.0008930657058954239, -0.0008522672578692436, -0.0008114688098430634, -0.0007706703618168831, -0.0007298719137907028, -0.0006890734657645226, -0.0006482750177383423, -0.000607476569712162, -0.0005666781216859818, -0.0005258796736598015, -0.0004850812256336212, -0.00044428277760744095, -0.0004034843295812607, -0.0003626858815550804, -0.00032188743352890015, -0.0002810889855027199, -0.0002402905374765396, -0.00019949208945035934, -0.00015869364142417908, -0.00011789519339799881, -7.709674537181854e-05, -3.6298297345638275e-05, 4.500150680541992e-06, 4.529859870672226e-05, 8.609704673290253e-05, 0.0001268954947590828, 0.00016769394278526306, 0.00020849239081144333, 0.0002492908388376236, 0.00029008928686380386, 0.00033088773488998413, 0.0003716861829161644, 0.00041248463094234467, 0.00045328307896852493, 0.0004940815269947052, 0.0005348799750208855, 0.0005756784230470657, 0.000616476871073246, 0.0006572753190994263, 0.0006980737671256065, 0.0007388722151517868, 0.0007796706631779671, 0.0008204691112041473, 0.0008612675592303276, 0.0009020660072565079, 0.0009428644552826881, 0.0009836629033088684, 0.0010244613513350487, 0.001065259799361229, 0.0011060582473874092, 0.0011468566954135895, 0.0011876551434397697, 0.00122845359146595, 0.0012692520394921303, 0.0013100504875183105]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 9.0, 2.0, 16.0, 12.0, 8.0, 18.0, 17.0, 19.0, 14.0, 27.0, 36.0, 29.0, 36.0, 25.0, 50.0, 48.0, 41.0, 36.0, 65.0, 36.0, 39.0, 36.0, 55.0, 31.0, 34.0, 36.0, 26.0, 22.0, 30.0, 24.0, 13.0, 13.0, 16.0, 16.0, 12.0, 12.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5703125, -15.0377197265625, -14.505126953125, -13.9725341796875, -13.43994140625, -12.9073486328125, -12.374755859375, -11.8421630859375, -11.3095703125, -10.7769775390625, -10.244384765625, -9.7117919921875, -9.17919921875, -8.6466064453125, -8.114013671875, -7.5814208984375, -7.048828125, -6.5162353515625, -5.983642578125, -5.4510498046875, -4.91845703125, -4.3858642578125, -3.853271484375, -3.3206787109375, -2.7880859375, -2.2554931640625, -1.722900390625, -1.1903076171875, -0.65771484375, -0.1251220703125, 0.407470703125, 0.9400634765625, 1.47265625, 2.0052490234375, 2.537841796875, 3.0704345703125, 3.60302734375, 4.1356201171875, 4.668212890625, 5.2008056640625, 5.7333984375, 6.2659912109375, 6.798583984375, 7.3311767578125, 7.86376953125, 8.3963623046875, 8.928955078125, 9.4615478515625, 9.994140625, 10.5267333984375, 11.059326171875, 11.5919189453125, 12.12451171875, 12.6571044921875, 13.189697265625, 13.7222900390625, 14.2548828125, 14.7874755859375, 15.320068359375, 15.8526611328125, 16.38525390625, 16.9178466796875, 17.450439453125, 17.9830322265625, 18.515625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 6.0, 5.0, 8.0, 11.0, 6.0, 25.0, 20.0, 30.0, 46.0, 75.0, 98.0, 128.0, 242.0, 399.0, 831.0, 1766.0, 3876.0, 8517.0, 20568.0, 51004.0, 145346.0, 420580.0, 255760.0, 83799.0, 31559.0, 12918.0, 5785.0, 2524.0, 1127.0, 594.0, 323.0, 182.0, 110.0, 80.0, 47.0, 44.0, 36.0, 18.0, 22.0, 7.0, 10.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.7904052734375, -8.494873046875, -8.1993408203125, -7.90380859375, -7.6082763671875, -7.312744140625, -7.0172119140625, -6.7216796875, -6.4261474609375, -6.130615234375, -5.8350830078125, -5.53955078125, -5.2440185546875, -4.948486328125, -4.6529541015625, -4.357421875, -4.0618896484375, -3.766357421875, -3.4708251953125, -3.17529296875, -2.8797607421875, -2.584228515625, -2.2886962890625, -1.9931640625, -1.6976318359375, -1.402099609375, -1.1065673828125, -0.81103515625, -0.5155029296875, -0.219970703125, 0.0755615234375, 0.37109375, 0.6666259765625, 0.962158203125, 1.2576904296875, 1.55322265625, 1.8487548828125, 2.144287109375, 2.4398193359375, 2.7353515625, 3.0308837890625, 3.326416015625, 3.6219482421875, 3.91748046875, 4.2130126953125, 4.508544921875, 4.8040771484375, 5.099609375, 5.3951416015625, 5.690673828125, 5.9862060546875, 6.28173828125, 6.5772705078125, 6.872802734375, 7.1683349609375, 7.4638671875, 7.7593994140625, 8.054931640625, 8.3504638671875, 8.64599609375, 8.9415283203125, 9.237060546875, 9.5325927734375, 9.828125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 11.0, 8.0, 14.0, 13.0, 18.0, 30.0, 25.0, 34.0, 40.0, 39.0, 48.0, 39.0, 52.0, 73.0, 234.0, 1769.0, 141.0, 63.0, 52.0, 36.0, 35.0, 35.0, 42.0, 31.0, 21.0, 24.0, 21.0, 14.0, 11.0, 13.0, 6.0, 6.0, 10.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.5625, -61.5986328125, -59.634765625, -57.6708984375, -55.70703125, -53.7431640625, -51.779296875, -49.8154296875, -47.8515625, -45.8876953125, -43.923828125, -41.9599609375, -39.99609375, -38.0322265625, -36.068359375, -34.1044921875, -32.140625, -30.1767578125, -28.212890625, -26.2490234375, -24.28515625, -22.3212890625, -20.357421875, -18.3935546875, -16.4296875, -14.4658203125, -12.501953125, -10.5380859375, -8.57421875, -6.6103515625, -4.646484375, -2.6826171875, -0.71875, 1.2451171875, 3.208984375, 5.1728515625, 7.13671875, 9.1005859375, 11.064453125, 13.0283203125, 14.9921875, 16.9560546875, 18.919921875, 20.8837890625, 22.84765625, 24.8115234375, 26.775390625, 28.7392578125, 30.703125, 32.6669921875, 34.630859375, 36.5947265625, 38.55859375, 40.5224609375, 42.486328125, 44.4501953125, 46.4140625, 48.3779296875, 50.341796875, 52.3056640625, 54.26953125, 56.2333984375, 58.197265625, 60.1611328125, 62.125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 8.0, 9.0, 8.0, 14.0, 14.0, 19.0, 27.0, 45.0, 46.0, 58.0, 82.0, 118.0, 143.0, 172.0, 252.0, 531.0, 2015.0, 3078955.0, 60885.0, 944.0, 415.0, 237.0, 182.0, 114.0, 99.0, 75.0, 41.0, 49.0, 41.0, 24.0, 17.0, 11.0, 9.0, 4.0, 9.0, 3.0, 3.0, 4.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.875, -145.162109375, -140.44921875, -135.736328125, -131.0234375, -126.310546875, -121.59765625, -116.884765625, -112.171875, -107.458984375, -102.74609375, -98.033203125, -93.3203125, -88.607421875, -83.89453125, -79.181640625, -74.46875, -69.755859375, -65.04296875, -60.330078125, -55.6171875, -50.904296875, -46.19140625, -41.478515625, -36.765625, -32.052734375, -27.33984375, -22.626953125, -17.9140625, -13.201171875, -8.48828125, -3.775390625, 0.9375, 5.650390625, 10.36328125, 15.076171875, 19.7890625, 24.501953125, 29.21484375, 33.927734375, 38.640625, 43.353515625, 48.06640625, 52.779296875, 57.4921875, 62.205078125, 66.91796875, 71.630859375, 76.34375, 81.056640625, 85.76953125, 90.482421875, 95.1953125, 99.908203125, 104.62109375, 109.333984375, 114.046875, 118.759765625, 123.47265625, 128.185546875, 132.8984375, 137.611328125, 142.32421875, 147.037109375, 151.75]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 62.0, 352.0, 434.0, 148.0, 14.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.450103759765625, -37.377403259277344, -33.30470275878906, -29.231998443603516, -25.159297943115234, -21.086597442626953, -17.01389503479004, -12.941192626953125, -8.868492126464844, -4.795790672302246, -0.7230892181396484, 3.349612236022949, 7.422313690185547, 11.495014190673828, 15.567716598510742, 19.640419006347656, 23.713119506835938, 27.78582000732422, 31.858522415161133, 35.93122482299805, 40.00392532348633, 44.07662582397461, 48.149330139160156, 52.22203063964844, 56.29473114013672, 60.367431640625, 64.44013214111328, 68.51283264160156, 72.58554077148438, 76.65823364257812, 80.73094177246094, 84.80364227294922, 88.87632751464844, 92.94902801513672, 97.021728515625, 101.09442901611328, 105.16712951660156, 109.23983764648438, 113.31253814697266, 117.38523864746094, 121.45793914794922, 125.5306396484375, 129.6033477783203, 133.67604064941406, 137.74874877929688, 141.82144165039062, 145.89414978027344, 149.96685791015625, 154.03955078125, 158.1122589111328, 162.18495178222656, 166.25765991210938, 170.33035278320312, 174.40306091308594, 178.4757537841797, 182.5484619140625, 186.62115478515625, 190.69386291503906, 194.7665557861328, 198.83926391601562, 202.91195678710938, 206.9846649169922, 211.05735778808594, 215.13006591796875, 219.20277404785156]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 13.0, 8.0, 13.0, 10.0, 11.0, 12.0, 19.0, 11.0, 23.0, 30.0, 28.0, 20.0, 34.0, 35.0, 36.0, 39.0, 37.0, 36.0, 37.0, 36.0, 32.0, 30.0, 34.0, 38.0, 39.0, 45.0, 35.0, 37.0, 26.0, 19.0, 26.0, 23.0, 20.0, 14.0, 10.0, 18.0, 10.0, 8.0, 5.0, 10.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.13558959960938, -127.93862915039062, -123.74166107177734, -119.54469299316406, -115.34773254394531, -111.15077209472656, -106.95380401611328, -102.7568359375, -98.55987548828125, -94.3629150390625, -90.16594696044922, -85.96897888183594, -81.77201843261719, -77.57505798339844, -73.37808990478516, -69.18112182617188, -64.98416137695312, -60.78719711303711, -56.590232849121094, -52.39326858520508, -48.19630432128906, -43.99934005737305, -39.80237579345703, -35.605411529541016, -31.408447265625, -27.211483001708984, -23.01451873779297, -18.817554473876953, -14.620590209960938, -10.423625946044922, -6.226661682128906, -2.0296974182128906, 2.167266845703125, 6.364231109619141, 10.561195373535156, 14.758159637451172, 18.955123901367188, 23.152088165283203, 27.34905242919922, 31.546016693115234, 35.74298095703125, 39.939945220947266, 44.13690948486328, 48.3338737487793, 52.53083801269531, 56.72780227661133, 60.924766540527344, 65.12173461914062, 69.31869506835938, 73.51565551757812, 77.7126235961914, 81.90959167480469, 86.10655212402344, 90.30351257324219, 94.50048065185547, 98.69744873046875, 102.8944091796875, 107.09136962890625, 111.28833770751953, 115.48530578613281, 119.68226623535156, 123.87922668457031, 128.07620239257812, 132.27316284179688, 136.47012329101562]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 3.0, 13.0, 6.0, 18.0, 13.0, 20.0, 16.0, 18.0, 24.0, 34.0, 33.0, 27.0, 32.0, 40.0, 46.0, 37.0, 50.0, 42.0, 36.0, 46.0, 44.0, 44.0, 39.0, 36.0, 32.0, 25.0, 27.0, 27.0, 23.0, 14.0, 19.0, 15.0, 18.0, 11.0, 13.0, 8.0, 11.0, 6.0, 5.0, 8.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6640625, -15.1339111328125, -14.603759765625, -14.0736083984375, -13.54345703125, -13.0133056640625, -12.483154296875, -11.9530029296875, -11.4228515625, -10.8927001953125, -10.362548828125, -9.8323974609375, -9.30224609375, -8.7720947265625, -8.241943359375, -7.7117919921875, -7.181640625, -6.6514892578125, -6.121337890625, -5.5911865234375, -5.06103515625, -4.5308837890625, -4.000732421875, -3.4705810546875, -2.9404296875, -2.4102783203125, -1.880126953125, -1.3499755859375, -0.81982421875, -0.2896728515625, 0.240478515625, 0.7706298828125, 1.30078125, 1.8309326171875, 2.361083984375, 2.8912353515625, 3.42138671875, 3.9515380859375, 4.481689453125, 5.0118408203125, 5.5419921875, 6.0721435546875, 6.602294921875, 7.1324462890625, 7.66259765625, 8.1927490234375, 8.722900390625, 9.2530517578125, 9.783203125, 10.3133544921875, 10.843505859375, 11.3736572265625, 11.90380859375, 12.4339599609375, 12.964111328125, 13.4942626953125, 14.0244140625, 14.5545654296875, 15.084716796875, 15.6148681640625, 16.14501953125, 16.6751708984375, 17.205322265625, 17.7354736328125, 18.265625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 3.0, 7.0, 3.0, 6.0, 11.0, 8.0, 8.0, 10.0, 10.0, 14.0, 21.0, 15.0, 33.0, 24.0, 28.0, 43.0, 72.0, 103.0, 156.0, 285.0, 646.0, 2028.0, 19624.0, 927560.0, 3088503.0, 147712.0, 5144.0, 1059.0, 453.0, 206.0, 123.0, 70.0, 56.0, 38.0, 28.0, 20.0, 15.0, 15.0, 20.0, 20.0, 10.0, 11.0, 11.0, 16.0, 6.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-46.875, -45.3759765625, -43.876953125, -42.3779296875, -40.87890625, -39.3798828125, -37.880859375, -36.3818359375, -34.8828125, -33.3837890625, -31.884765625, -30.3857421875, -28.88671875, -27.3876953125, -25.888671875, -24.3896484375, -22.890625, -21.3916015625, -19.892578125, -18.3935546875, -16.89453125, -15.3955078125, -13.896484375, -12.3974609375, -10.8984375, -9.3994140625, -7.900390625, -6.4013671875, -4.90234375, -3.4033203125, -1.904296875, -0.4052734375, 1.09375, 2.5927734375, 4.091796875, 5.5908203125, 7.08984375, 8.5888671875, 10.087890625, 11.5869140625, 13.0859375, 14.5849609375, 16.083984375, 17.5830078125, 19.08203125, 20.5810546875, 22.080078125, 23.5791015625, 25.078125, 26.5771484375, 28.076171875, 29.5751953125, 31.07421875, 32.5732421875, 34.072265625, 35.5712890625, 37.0703125, 38.5693359375, 40.068359375, 41.5673828125, 43.06640625, 44.5654296875, 46.064453125, 47.5634765625, 49.0625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 5.0, 6.0, 12.0, 5.0, 12.0, 13.0, 16.0, 22.0, 27.0, 41.0, 43.0, 40.0, 71.0, 78.0, 119.0, 136.0, 188.0, 209.0, 312.0, 378.0, 448.0, 411.0, 357.0, 277.0, 197.0, 140.0, 108.0, 81.0, 69.0, 51.0, 45.0, 30.0, 23.0, 26.0, 17.0, 18.0, 3.0, 4.0, 13.0, 6.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.15625, -20.362060546875, -19.56787109375, -18.773681640625, -17.9794921875, -17.185302734375, -16.39111328125, -15.596923828125, -14.802734375, -14.008544921875, -13.21435546875, -12.420166015625, -11.6259765625, -10.831787109375, -10.03759765625, -9.243408203125, -8.44921875, -7.655029296875, -6.86083984375, -6.066650390625, -5.2724609375, -4.478271484375, -3.68408203125, -2.889892578125, -2.095703125, -1.301513671875, -0.50732421875, 0.286865234375, 1.0810546875, 1.875244140625, 2.66943359375, 3.463623046875, 4.2578125, 5.052001953125, 5.84619140625, 6.640380859375, 7.4345703125, 8.228759765625, 9.02294921875, 9.817138671875, 10.611328125, 11.405517578125, 12.19970703125, 12.993896484375, 13.7880859375, 14.582275390625, 15.37646484375, 16.170654296875, 16.96484375, 17.759033203125, 18.55322265625, 19.347412109375, 20.1416015625, 20.935791015625, 21.72998046875, 22.524169921875, 23.318359375, 24.112548828125, 24.90673828125, 25.700927734375, 26.4951171875, 27.289306640625, 28.08349609375, 28.877685546875, 29.671875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 8.0, 8.0, 7.0, 10.0, 12.0, 11.0, 18.0, 22.0, 26.0, 42.0, 44.0, 55.0, 80.0, 71.0, 104.0, 155.0, 190.0, 272.0, 406.0, 777.0, 15800.0, 4170601.0, 3462.0, 641.0, 333.0, 240.0, 159.0, 135.0, 109.0, 101.0, 62.0, 67.0, 61.0, 56.0, 26.0, 29.0, 21.0, 25.0, 19.0, 9.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-220.0, -213.783203125, -207.56640625, -201.349609375, -195.1328125, -188.916015625, -182.69921875, -176.482421875, -170.265625, -164.048828125, -157.83203125, -151.615234375, -145.3984375, -139.181640625, -132.96484375, -126.748046875, -120.53125, -114.314453125, -108.09765625, -101.880859375, -95.6640625, -89.447265625, -83.23046875, -77.013671875, -70.796875, -64.580078125, -58.36328125, -52.146484375, -45.9296875, -39.712890625, -33.49609375, -27.279296875, -21.0625, -14.845703125, -8.62890625, -2.412109375, 3.8046875, 10.021484375, 16.23828125, 22.455078125, 28.671875, 34.888671875, 41.10546875, 47.322265625, 53.5390625, 59.755859375, 65.97265625, 72.189453125, 78.40625, 84.623046875, 90.83984375, 97.056640625, 103.2734375, 109.490234375, 115.70703125, 121.923828125, 128.140625, 134.357421875, 140.57421875, 146.791015625, 153.0078125, 159.224609375, 165.44140625, 171.658203125, 177.875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 90.0, 502.0, 382.0, 37.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-763.6664428710938, -748.9329223632812, -734.1993408203125, -719.4658203125, -704.7322998046875, -689.998779296875, -675.2651977539062, -660.5316772460938, -645.7981567382812, -631.0646362304688, -616.3310546875, -601.5975341796875, -586.864013671875, -572.1304931640625, -557.3969116210938, -542.6633911132812, -527.9298095703125, -513.1962890625, -498.4627380371094, -483.72918701171875, -468.99566650390625, -454.2621154785156, -439.528564453125, -424.7950439453125, -410.0615234375, -395.3279724121094, -380.5944519042969, -365.86090087890625, -351.12738037109375, -336.3938293457031, -321.6602783203125, -306.9267578125, -292.1932067871094, -277.45965576171875, -262.72613525390625, -247.99258422851562, -233.25906372070312, -218.5255126953125, -203.79197692871094, -189.05844116210938, -174.3249053955078, -159.59136962890625, -144.8578338623047, -130.12429809570312, -115.39075469970703, -100.65721893310547, -85.92367553710938, -71.19013977050781, -56.45660400390625, -41.72306823730469, -26.98952865600586, -12.255989074707031, 2.4775466918945312, 17.211082458496094, 31.944625854492188, 46.67816162109375, 61.41169738769531, 76.14523315429688, 90.87876892089844, 105.61231231689453, 120.3458480834961, 135.07937622070312, 149.81292724609375, 164.5464630126953, 179.27999877929688]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 7.0, 4.0, 8.0, 11.0, 16.0, 13.0, 16.0, 10.0, 17.0, 15.0, 18.0, 29.0, 29.0, 23.0, 25.0, 24.0, 37.0, 46.0, 41.0, 40.0, 26.0, 33.0, 43.0, 20.0, 36.0, 35.0, 35.0, 34.0, 37.0, 29.0, 28.0, 22.0, 27.0, 28.0, 17.0, 10.0, 12.0, 15.0, 9.0, 13.0, 15.0, 5.0, 10.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-85.51187133789062, -82.82881164550781, -80.145751953125, -77.46269226074219, -74.77963256835938, -72.09657287597656, -69.41351318359375, -66.73045349121094, -64.04739379882812, -61.36433410644531, -58.6812744140625, -55.99821472167969, -53.315155029296875, -50.63209533691406, -47.949031829833984, -45.26597213745117, -42.582908630371094, -39.89984893798828, -37.21678924560547, -34.533729553222656, -31.85066795349121, -29.1676082611084, -26.484546661376953, -23.80148696899414, -21.118427276611328, -18.435367584228516, -15.752306938171387, -13.069246292114258, -10.386186599731445, -7.703126907348633, -5.0200653076171875, -2.337005615234375, 0.3460540771484375, 3.029114246368408, 5.712174415588379, 8.395235061645508, 11.07829475402832, 13.761354446411133, 16.444416046142578, 19.12747573852539, 21.810535430908203, 24.493595123291016, 27.176654815673828, 29.859716415405273, 32.54277801513672, 35.22583770751953, 37.908897399902344, 40.591957092285156, 43.27501678466797, 45.95807647705078, 48.641136169433594, 51.324195861816406, 54.00725555419922, 56.69031524658203, 59.37337875366211, 62.05643844604492, 64.739501953125, 67.42256164550781, 70.10562133789062, 72.78868103027344, 75.47174072265625, 78.15480041503906, 80.83786010742188, 83.52091979980469, 86.2039794921875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 7.0, 7.0, 7.0, 7.0, 10.0, 12.0, 6.0, 12.0, 13.0, 23.0, 23.0, 31.0, 27.0, 31.0, 29.0, 31.0, 44.0, 45.0, 27.0, 44.0, 49.0, 38.0, 48.0, 31.0, 46.0, 43.0, 41.0, 36.0, 31.0, 36.0, 20.0, 22.0, 17.0, 13.0, 18.0, 10.0, 12.0, 14.0, 9.0, 8.0, 12.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.931396484375, -15.40966796875, -14.887939453125, -14.3662109375, -13.844482421875, -13.32275390625, -12.801025390625, -12.279296875, -11.757568359375, -11.23583984375, -10.714111328125, -10.1923828125, -9.670654296875, -9.14892578125, -8.627197265625, -8.10546875, -7.583740234375, -7.06201171875, -6.540283203125, -6.0185546875, -5.496826171875, -4.97509765625, -4.453369140625, -3.931640625, -3.409912109375, -2.88818359375, -2.366455078125, -1.8447265625, -1.322998046875, -0.80126953125, -0.279541015625, 0.2421875, 0.763916015625, 1.28564453125, 1.807373046875, 2.3291015625, 2.850830078125, 3.37255859375, 3.894287109375, 4.416015625, 4.937744140625, 5.45947265625, 5.981201171875, 6.5029296875, 7.024658203125, 7.54638671875, 8.068115234375, 8.58984375, 9.111572265625, 9.63330078125, 10.155029296875, 10.6767578125, 11.198486328125, 11.72021484375, 12.241943359375, 12.763671875, 13.285400390625, 13.80712890625, 14.328857421875, 14.8505859375, 15.372314453125, 15.89404296875, 16.415771484375, 16.9375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 8.0, 4.0, 11.0, 14.0, 24.0, 27.0, 56.0, 67.0, 97.0, 135.0, 241.0, 286.0, 443.0, 651.0, 918.0, 1203.0, 1893.0, 2597.0, 3813.0, 5463.0, 8079.0, 11700.0, 17460.0, 26559.0, 42682.0, 70342.0, 123795.0, 288499.0, 186871.0, 95553.0, 55366.0, 34758.0, 22593.0, 14749.0, 9719.0, 6633.0, 4639.0, 3187.0, 2186.0, 1554.0, 1118.0, 778.0, 558.0, 375.0, 270.0, 201.0, 116.0, 90.0, 59.0, 44.0, 29.0, 23.0, 10.0, 4.0, 11.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-3.8125, -3.692535400390625, -3.57257080078125, -3.452606201171875, -3.3326416015625, -3.212677001953125, -3.09271240234375, -2.972747802734375, -2.852783203125, -2.732818603515625, -2.61285400390625, -2.492889404296875, -2.3729248046875, -2.252960205078125, -2.13299560546875, -2.013031005859375, -1.89306640625, -1.773101806640625, -1.65313720703125, -1.533172607421875, -1.4132080078125, -1.293243408203125, -1.17327880859375, -1.053314208984375, -0.933349609375, -0.813385009765625, -0.69342041015625, -0.573455810546875, -0.4534912109375, -0.333526611328125, -0.21356201171875, -0.093597412109375, 0.0263671875, 0.146331787109375, 0.26629638671875, 0.386260986328125, 0.5062255859375, 0.626190185546875, 0.74615478515625, 0.866119384765625, 0.986083984375, 1.106048583984375, 1.22601318359375, 1.345977783203125, 1.4659423828125, 1.585906982421875, 1.70587158203125, 1.825836181640625, 1.94580078125, 2.065765380859375, 2.18572998046875, 2.305694580078125, 2.4256591796875, 2.545623779296875, 2.66558837890625, 2.785552978515625, 2.905517578125, 3.025482177734375, 3.14544677734375, 3.265411376953125, 3.3853759765625, 3.505340576171875, 3.62530517578125, 3.745269775390625, 3.865234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 5.0, 12.0, 9.0, 13.0, 13.0, 20.0, 19.0, 25.0, 31.0, 22.0, 29.0, 32.0, 27.0, 31.0, 44.0, 40.0, 33.0, 36.0, 32.0, 1078.0, 33.0, 32.0, 34.0, 36.0, 37.0, 25.0, 22.0, 37.0, 25.0, 29.0, 24.0, 19.0, 26.0, 12.0, 10.0, 10.0, 7.0, 6.0, 7.0, 2.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0], "bins": [-10.0234375, -9.729736328125, -9.43603515625, -9.142333984375, -8.8486328125, -8.554931640625, -8.26123046875, -7.967529296875, -7.673828125, -7.380126953125, -7.08642578125, -6.792724609375, -6.4990234375, -6.205322265625, -5.91162109375, -5.617919921875, -5.32421875, -5.030517578125, -4.73681640625, -4.443115234375, -4.1494140625, -3.855712890625, -3.56201171875, -3.268310546875, -2.974609375, -2.680908203125, -2.38720703125, -2.093505859375, -1.7998046875, -1.506103515625, -1.21240234375, -0.918701171875, -0.625, -0.331298828125, -0.03759765625, 0.256103515625, 0.5498046875, 0.843505859375, 1.13720703125, 1.430908203125, 1.724609375, 2.018310546875, 2.31201171875, 2.605712890625, 2.8994140625, 3.193115234375, 3.48681640625, 3.780517578125, 4.07421875, 4.367919921875, 4.66162109375, 4.955322265625, 5.2490234375, 5.542724609375, 5.83642578125, 6.130126953125, 6.423828125, 6.717529296875, 7.01123046875, 7.304931640625, 7.5986328125, 7.892333984375, 8.18603515625, 8.479736328125, 8.7734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 9.0, 17.0, 19.0, 17.0, 35.0, 43.0, 72.0, 73.0, 116.0, 178.0, 268.0, 341.0, 487.0, 741.0, 1034.0, 1571.0, 2369.0, 3477.0, 5398.0, 8252.0, 13071.0, 20747.0, 33512.0, 54130.0, 91617.0, 174996.0, 1365937.0, 127848.0, 72069.0, 43495.0, 27159.0, 17024.0, 10653.0, 6734.0, 4504.0, 2955.0, 2040.0, 1260.0, 907.0, 576.0, 394.0, 296.0, 192.0, 154.0, 95.0, 82.0, 63.0, 27.0, 28.0, 21.0, 11.0, 8.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.76953125, -3.649017333984375, -3.52850341796875, -3.407989501953125, -3.2874755859375, -3.166961669921875, -3.04644775390625, -2.925933837890625, -2.805419921875, -2.684906005859375, -2.56439208984375, -2.443878173828125, -2.3233642578125, -2.202850341796875, -2.08233642578125, -1.961822509765625, -1.84130859375, -1.720794677734375, -1.60028076171875, -1.479766845703125, -1.3592529296875, -1.238739013671875, -1.11822509765625, -0.997711181640625, -0.877197265625, -0.756683349609375, -0.63616943359375, -0.515655517578125, -0.3951416015625, -0.274627685546875, -0.15411376953125, -0.033599853515625, 0.0869140625, 0.207427978515625, 0.32794189453125, 0.448455810546875, 0.5689697265625, 0.689483642578125, 0.80999755859375, 0.930511474609375, 1.051025390625, 1.171539306640625, 1.29205322265625, 1.412567138671875, 1.5330810546875, 1.653594970703125, 1.77410888671875, 1.894622802734375, 2.01513671875, 2.135650634765625, 2.25616455078125, 2.376678466796875, 2.4971923828125, 2.617706298828125, 2.73822021484375, 2.858734130859375, 2.979248046875, 3.099761962890625, 3.22027587890625, 3.340789794921875, 3.4613037109375, 3.581817626953125, 3.70233154296875, 3.822845458984375, 3.943359375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 1.0, 7.0, 4.0, 6.0, 6.0, 9.0, 13.0, 20.0, 21.0, 25.0, 31.0, 49.0, 51.0, 59.0, 62.0, 75.0, 95.0, 66.0, 72.0, 63.0, 48.0, 41.0, 29.0, 22.0, 27.0, 15.0, 14.0, 6.0, 11.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0021209716796875, -0.002059653401374817, -0.001998335123062134, -0.0019370168447494507, -0.0018756985664367676, -0.0018143802881240845, -0.0017530620098114014, -0.0016917437314987183, -0.0016304254531860352, -0.001569107174873352, -0.001507788896560669, -0.0014464706182479858, -0.0013851523399353027, -0.0013238340616226196, -0.0012625157833099365, -0.0012011975049972534, -0.0011398792266845703, -0.0010785609483718872, -0.001017242670059204, -0.000955924391746521, -0.0008946061134338379, -0.0008332878351211548, -0.0007719695568084717, -0.0007106512784957886, -0.0006493330001831055, -0.0005880147218704224, -0.0005266964435577393, -0.00046537816524505615, -0.00040405988693237305, -0.00034274160861968994, -0.00028142333030700684, -0.00022010505199432373, -0.00015878677368164062, -9.746849536895752e-05, -3.6150217056274414e-05, 2.516806125640869e-05, 8.64863395690918e-05, 0.0001478046178817749, 0.000209122896194458, 0.0002704411745071411, 0.0003317594528198242, 0.0003930777311325073, 0.00045439600944519043, 0.0005157142877578735, 0.0005770325660705566, 0.0006383508443832397, 0.0006996691226959229, 0.000760987401008606, 0.0008223056793212891, 0.0008836239576339722, 0.0009449422359466553, 0.0010062605142593384, 0.0010675787925720215, 0.0011288970708847046, 0.0011902153491973877, 0.0012515336275100708, 0.001312851905822754, 0.001374170184135437, 0.0014354884624481201, 0.0014968067407608032, 0.0015581250190734863, 0.0016194432973861694, 0.0016807615756988525, 0.0017420798540115356, 0.0018033981323242188]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 5.0, 9.0, 11.0, 6.0, 21.0, 8.0, 33.0, 24.0, 34.0, 63.0, 69.0, 106.0, 202.0, 459.0, 1861.0, 1017315.0, 26745.0, 745.0, 311.0, 152.0, 85.0, 60.0, 41.0, 43.0, 37.0, 18.0, 12.0, 14.0, 17.0, 8.0, 6.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.04656982421875, -0.04500389099121094, -0.043437957763671875, -0.04187202453613281, -0.04030609130859375, -0.03874015808105469, -0.037174224853515625, -0.03560829162597656, -0.0340423583984375, -0.03247642517089844, -0.030910491943359375, -0.029344558715820312, -0.02777862548828125, -0.026212692260742188, -0.024646759033203125, -0.023080825805664062, -0.021514892578125, -0.019948959350585938, -0.018383026123046875, -0.016817092895507812, -0.01525115966796875, -0.013685226440429688, -0.012119293212890625, -0.010553359985351562, -0.0089874267578125, -0.0074214935302734375, -0.005855560302734375, -0.0042896270751953125, -0.00272369384765625, -0.0011577606201171875, 0.000408172607421875, 0.0019741058349609375, 0.0035400390625, 0.0051059722900390625, 0.006671905517578125, 0.008237838745117188, 0.00980377197265625, 0.011369705200195312, 0.012935638427734375, 0.014501571655273438, 0.0160675048828125, 0.017633438110351562, 0.019199371337890625, 0.020765304565429688, 0.02233123779296875, 0.023897171020507812, 0.025463104248046875, 0.027029037475585938, 0.028594970703125, 0.030160903930664062, 0.031726837158203125, 0.03329277038574219, 0.03485870361328125, 0.03642463684082031, 0.037990570068359375, 0.03955650329589844, 0.0411224365234375, 0.04268836975097656, 0.044254302978515625, 0.04582023620605469, 0.04738616943359375, 0.04895210266113281, 0.050518035888671875, 0.05208396911621094, 0.05364990234375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 35.0, 194.0, 437.0, 256.0, 65.0, 15.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004027646500617266, -0.0039044541772454977, -0.003781261621043086, -0.003658069297671318, -0.0035348767414689064, -0.0034116844180971384, -0.0032884920947253704, -0.0031652995385229588, -0.0030421072151511908, -0.0029189148917794228, -0.002795722335577011, -0.002672530012205243, -0.002549337688833475, -0.0024261451326310635, -0.0023029528092592955, -0.0021797604858875275, -0.002056567929685116, -0.001933375489898026, -0.0018101830501109362, -0.0016869907267391682, -0.0015637982869520783, -0.0014406058471649885, -0.0013174135237932205, -0.0011942210840061307, -0.0010710286442190409, -0.000947836204431951, -0.0008246438228525221, -0.0007014514412730932, -0.0005782590014860034, -0.0004550665616989136, -0.00033187418011948466, -0.00020868179854005575, -8.548982441425323e-05, 3.770258626900613e-05, 0.0001608949969522655, 0.00028408740763552487, 0.00040727981831878424, 0.0005304722581058741, 0.000653664639685303, 0.0007768570212647319, 0.0009000494610518217, 0.0010232419008389115, 0.0011464343406260014, 0.0012696266639977694, 0.0013928191037848592, 0.001516011543571949, 0.001639203866943717, 0.0017623963067308068, 0.0018855887465178967, 0.0020087810698896646, 0.0021319736260920763, 0.0022551659494638443, 0.002378358505666256, 0.002501550829038024, 0.002624743152409792, 0.0027479357086122036, 0.0028711280319839716, 0.0029943203553557396, 0.0031175129115581512, 0.0032407052349299192, 0.0033638975583016872, 0.003487090114504099, 0.003610282437875867, 0.003733474761247635, 0.0038566673174500465]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 9.0, 11.0, 11.0, 9.0, 13.0, 20.0, 28.0, 31.0, 35.0, 36.0, 35.0, 29.0, 24.0, 43.0, 42.0, 56.0, 45.0, 32.0, 39.0, 37.0, 36.0, 32.0, 32.0, 35.0, 42.0, 31.0, 32.0, 24.0, 17.0, 22.0, 22.0, 11.0, 15.0, 9.0, 7.0, 8.0, 6.0, 6.0, 1.0, 5.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009384751319885254, -0.0009088581427931786, -0.0008792411535978317, -0.0008496241644024849, -0.0008200071752071381, -0.0007903901860117912, -0.0007607731968164444, -0.0007311562076210976, -0.0007015392184257507, -0.0006719222292304039, -0.0006423052400350571, -0.0006126882508397102, -0.0005830712616443634, -0.0005534542724490166, -0.0005238372832536697, -0.0004942202940583229, -0.0004646033048629761, -0.00043498631566762924, -0.0004053693264722824, -0.0003757523372769356, -0.00034613534808158875, -0.0003165183588862419, -0.0002869013696908951, -0.00025728438049554825, -0.00022766739130020142, -0.00019805040210485458, -0.00016843341290950775, -0.00013881642371416092, -0.00010919943451881409, -7.958244532346725e-05, -4.996545612812042e-05, -2.034846693277359e-05, 9.268522262573242e-06, 3.8885511457920074e-05, 6.85025006532669e-05, 9.811948984861374e-05, 0.00012773647904396057, 0.0001573534682393074, 0.00018697045743465424, 0.00021658744663000107, 0.0002462044358253479, 0.00027582142502069473, 0.00030543841421604156, 0.0003350554034113884, 0.00036467239260673523, 0.00039428938180208206, 0.0004239063709974289, 0.0004535233601927757, 0.00048314034938812256, 0.0005127573385834694, 0.0005423743277788162, 0.0005719913169741631, 0.0006016083061695099, 0.0006312252953648567, 0.0006608422845602036, 0.0006904592737555504, 0.0007200762629508972, 0.000749693252146244, 0.0007793102413415909, 0.0008089272305369377, 0.0008385442197322845, 0.0008681612089276314, 0.0008977781981229782, 0.000927395187318325, 0.0009570121765136719]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 7.0, 7.0, 7.0, 7.0, 10.0, 12.0, 6.0, 12.0, 13.0, 23.0, 23.0, 31.0, 27.0, 31.0, 29.0, 31.0, 44.0, 45.0, 27.0, 44.0, 49.0, 38.0, 48.0, 31.0, 46.0, 43.0, 41.0, 36.0, 31.0, 36.0, 20.0, 22.0, 17.0, 13.0, 18.0, 10.0, 12.0, 14.0, 9.0, 8.0, 12.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.453125, -15.931396484375, -15.40966796875, -14.887939453125, -14.3662109375, -13.844482421875, -13.32275390625, -12.801025390625, -12.279296875, -11.757568359375, -11.23583984375, -10.714111328125, -10.1923828125, -9.670654296875, -9.14892578125, -8.627197265625, -8.10546875, -7.583740234375, -7.06201171875, -6.540283203125, -6.0185546875, -5.496826171875, -4.97509765625, -4.453369140625, -3.931640625, -3.409912109375, -2.88818359375, -2.366455078125, -1.8447265625, -1.322998046875, -0.80126953125, -0.279541015625, 0.2421875, 0.763916015625, 1.28564453125, 1.807373046875, 2.3291015625, 2.850830078125, 3.37255859375, 3.894287109375, 4.416015625, 4.937744140625, 5.45947265625, 5.981201171875, 6.5029296875, 7.024658203125, 7.54638671875, 8.068115234375, 8.58984375, 9.111572265625, 9.63330078125, 10.155029296875, 10.6767578125, 11.198486328125, 11.72021484375, 12.241943359375, 12.763671875, 13.285400390625, 13.80712890625, 14.328857421875, 14.8505859375, 15.372314453125, 15.89404296875, 16.415771484375, 16.9375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 8.0, 4.0, 16.0, 11.0, 18.0, 13.0, 23.0, 49.0, 49.0, 59.0, 101.0, 121.0, 166.0, 255.0, 414.0, 756.0, 1830.0, 5682.0, 20893.0, 84063.0, 455408.0, 378906.0, 72777.0, 18156.0, 5158.0, 1705.0, 687.0, 380.0, 237.0, 146.0, 111.0, 100.0, 66.0, 48.0, 29.0, 31.0, 21.0, 15.0, 11.0, 14.0, 3.0, 4.0, 8.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.75, -19.150634765625, -18.55126953125, -17.951904296875, -17.3525390625, -16.753173828125, -16.15380859375, -15.554443359375, -14.955078125, -14.355712890625, -13.75634765625, -13.156982421875, -12.5576171875, -11.958251953125, -11.35888671875, -10.759521484375, -10.16015625, -9.560791015625, -8.96142578125, -8.362060546875, -7.7626953125, -7.163330078125, -6.56396484375, -5.964599609375, -5.365234375, -4.765869140625, -4.16650390625, -3.567138671875, -2.9677734375, -2.368408203125, -1.76904296875, -1.169677734375, -0.5703125, 0.029052734375, 0.62841796875, 1.227783203125, 1.8271484375, 2.426513671875, 3.02587890625, 3.625244140625, 4.224609375, 4.823974609375, 5.42333984375, 6.022705078125, 6.6220703125, 7.221435546875, 7.82080078125, 8.420166015625, 9.01953125, 9.618896484375, 10.21826171875, 10.817626953125, 11.4169921875, 12.016357421875, 12.61572265625, 13.215087890625, 13.814453125, 14.413818359375, 15.01318359375, 15.612548828125, 16.2119140625, 16.811279296875, 17.41064453125, 18.010009765625, 18.609375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 6.0, 2.0, 12.0, 5.0, 11.0, 13.0, 17.0, 22.0, 21.0, 28.0, 28.0, 28.0, 29.0, 62.0, 42.0, 39.0, 54.0, 101.0, 1652.0, 370.0, 90.0, 43.0, 52.0, 38.0, 33.0, 43.0, 41.0, 28.0, 18.0, 14.0, 16.0, 15.0, 14.0, 9.0, 4.0, 4.0, 10.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.78125, -56.07470703125, -54.3681640625, -52.66162109375, -50.955078125, -49.24853515625, -47.5419921875, -45.83544921875, -44.12890625, -42.42236328125, -40.7158203125, -39.00927734375, -37.302734375, -35.59619140625, -33.8896484375, -32.18310546875, -30.4765625, -28.77001953125, -27.0634765625, -25.35693359375, -23.650390625, -21.94384765625, -20.2373046875, -18.53076171875, -16.82421875, -15.11767578125, -13.4111328125, -11.70458984375, -9.998046875, -8.29150390625, -6.5849609375, -4.87841796875, -3.171875, -1.46533203125, 0.2412109375, 1.94775390625, 3.654296875, 5.36083984375, 7.0673828125, 8.77392578125, 10.48046875, 12.18701171875, 13.8935546875, 15.60009765625, 17.306640625, 19.01318359375, 20.7197265625, 22.42626953125, 24.1328125, 25.83935546875, 27.5458984375, 29.25244140625, 30.958984375, 32.66552734375, 34.3720703125, 36.07861328125, 37.78515625, 39.49169921875, 41.1982421875, 42.90478515625, 44.611328125, 46.31787109375, 48.0244140625, 49.73095703125, 51.4375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 10.0, 12.0, 11.0, 7.0, 12.0, 18.0, 23.0, 27.0, 38.0, 35.0, 53.0, 58.0, 106.0, 96.0, 144.0, 179.0, 295.0, 546.0, 1676.0, 156807.0, 2979884.0, 3609.0, 683.0, 386.0, 237.0, 193.0, 111.0, 85.0, 67.0, 67.0, 48.0, 41.0, 28.0, 17.0, 16.0, 13.0, 10.0, 10.0, 8.0, 9.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.25, -102.7275390625, -99.205078125, -95.6826171875, -92.16015625, -88.6376953125, -85.115234375, -81.5927734375, -78.0703125, -74.5478515625, -71.025390625, -67.5029296875, -63.98046875, -60.4580078125, -56.935546875, -53.4130859375, -49.890625, -46.3681640625, -42.845703125, -39.3232421875, -35.80078125, -32.2783203125, -28.755859375, -25.2333984375, -21.7109375, -18.1884765625, -14.666015625, -11.1435546875, -7.62109375, -4.0986328125, -0.576171875, 2.9462890625, 6.46875, 9.9912109375, 13.513671875, 17.0361328125, 20.55859375, 24.0810546875, 27.603515625, 31.1259765625, 34.6484375, 38.1708984375, 41.693359375, 45.2158203125, 48.73828125, 52.2607421875, 55.783203125, 59.3056640625, 62.828125, 66.3505859375, 69.873046875, 73.3955078125, 76.91796875, 80.4404296875, 83.962890625, 87.4853515625, 91.0078125, 94.5302734375, 98.052734375, 101.5751953125, 105.09765625, 108.6201171875, 112.142578125, 115.6650390625, 119.1875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 45.0, 256.0, 460.0, 212.0, 36.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.90327453613281, -123.40721130371094, -118.9111557006836, -114.41510009765625, -109.91903686523438, -105.4229736328125, -100.92691802978516, -96.43086242675781, -91.93479919433594, -87.43873596191406, -82.94268035888672, -78.44662475585938, -73.9505615234375, -69.45449829101562, -64.95844268798828, -60.46238327026367, -55.96632385253906, -51.47026443481445, -46.974205017089844, -42.478145599365234, -37.982086181640625, -33.486026763916016, -28.989967346191406, -24.493907928466797, -19.997848510742188, -15.501789093017578, -11.005729675292969, -6.509670257568359, -2.01361083984375, 2.4824485778808594, 6.978507995605469, 11.474567413330078, 15.970626831054688, 20.466686248779297, 24.962745666503906, 29.458805084228516, 33.954864501953125, 38.450923919677734, 42.946983337402344, 47.44304275512695, 51.93910217285156, 56.43516159057617, 60.93122100830078, 65.42727661132812, 69.92333984375, 74.41940307617188, 78.91545867919922, 83.41151428222656, 87.90757751464844, 92.40364074707031, 96.89969635009766, 101.395751953125, 105.89181518554688, 110.38787841796875, 114.8839340209961, 119.37998962402344, 123.87605285644531, 128.3721160888672, 132.8681640625, 137.36422729492188, 141.86029052734375, 146.35635375976562, 150.8524169921875, 155.3484649658203, 159.8445281982422]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 4.0, 7.0, 10.0, 10.0, 12.0, 11.0, 21.0, 25.0, 19.0, 26.0, 29.0, 23.0, 27.0, 31.0, 45.0, 31.0, 34.0, 35.0, 33.0, 48.0, 31.0, 39.0, 43.0, 37.0, 32.0, 38.0, 29.0, 31.0, 30.0, 28.0, 30.0, 20.0, 16.0, 24.0, 15.0, 12.0, 17.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-130.80917358398438, -126.80463409423828, -122.80009460449219, -118.79556274414062, -114.79102325439453, -110.78648376464844, -106.78195190429688, -102.77741241455078, -98.77287292480469, -94.7683334350586, -90.7637939453125, -86.75926208496094, -82.75472259521484, -78.75018310546875, -74.74565124511719, -70.7411117553711, -66.736572265625, -62.732032775878906, -58.72749710083008, -54.72296142578125, -50.718421936035156, -46.71388244628906, -42.709346771240234, -38.704811096191406, -34.70027160644531, -30.69573402404785, -26.69119644165039, -22.68665885925293, -18.68212127685547, -14.677583694458008, -10.673046112060547, -6.668508529663086, -2.6639556884765625, 1.3405818939208984, 5.345119476318359, 9.34965705871582, 13.354194641113281, 17.358732223510742, 21.363269805908203, 25.367807388305664, 29.372344970703125, 33.37688446044922, 37.38142013549805, 41.385955810546875, 45.39049530029297, 49.39503479003906, 53.39957046508789, 57.40410614013672, 61.40864562988281, 65.4131851196289, 69.417724609375, 73.42225646972656, 77.42679595947266, 81.43133544921875, 85.43586730957031, 89.4404067993164, 93.4449462890625, 97.4494857788086, 101.45402526855469, 105.45855712890625, 109.46309661865234, 113.46763610839844, 117.47216796875, 121.4767074584961, 125.48124694824219]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 7.0, 11.0, 8.0, 9.0, 13.0, 12.0, 20.0, 26.0, 27.0, 22.0, 30.0, 37.0, 36.0, 35.0, 38.0, 31.0, 34.0, 52.0, 46.0, 34.0, 36.0, 44.0, 40.0, 41.0, 42.0, 34.0, 30.0, 22.0, 25.0, 19.0, 15.0, 14.0, 19.0, 13.0, 11.0, 9.0, 11.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.3125, -15.78271484375, -15.2529296875, -14.72314453125, -14.193359375, -13.66357421875, -13.1337890625, -12.60400390625, -12.07421875, -11.54443359375, -11.0146484375, -10.48486328125, -9.955078125, -9.42529296875, -8.8955078125, -8.36572265625, -7.8359375, -7.30615234375, -6.7763671875, -6.24658203125, -5.716796875, -5.18701171875, -4.6572265625, -4.12744140625, -3.59765625, -3.06787109375, -2.5380859375, -2.00830078125, -1.478515625, -0.94873046875, -0.4189453125, 0.11083984375, 0.640625, 1.17041015625, 1.7001953125, 2.22998046875, 2.759765625, 3.28955078125, 3.8193359375, 4.34912109375, 4.87890625, 5.40869140625, 5.9384765625, 6.46826171875, 6.998046875, 7.52783203125, 8.0576171875, 8.58740234375, 9.1171875, 9.64697265625, 10.1767578125, 10.70654296875, 11.236328125, 11.76611328125, 12.2958984375, 12.82568359375, 13.35546875, 13.88525390625, 14.4150390625, 14.94482421875, 15.474609375, 16.00439453125, 16.5341796875, 17.06396484375, 17.59375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 8.0, 13.0, 13.0, 10.0, 13.0, 11.0, 14.0, 19.0, 37.0, 36.0, 50.0, 64.0, 91.0, 117.0, 156.0, 200.0, 374.0, 892.0, 5164.0, 135888.0, 3135063.0, 895222.0, 17543.0, 1748.0, 543.0, 264.0, 171.0, 142.0, 68.0, 70.0, 46.0, 48.0, 31.0, 22.0, 14.0, 21.0, 12.0, 12.0, 13.0, 8.0, 6.0, 12.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-47.59375, -46.09375, -44.59375, -43.09375, -41.59375, -40.09375, -38.59375, -37.09375, -35.59375, -34.09375, -32.59375, -31.09375, -29.59375, -28.09375, -26.59375, -25.09375, -23.59375, -22.09375, -20.59375, -19.09375, -17.59375, -16.09375, -14.59375, -13.09375, -11.59375, -10.09375, -8.59375, -7.09375, -5.59375, -4.09375, -2.59375, -1.09375, 0.40625, 1.90625, 3.40625, 4.90625, 6.40625, 7.90625, 9.40625, 10.90625, 12.40625, 13.90625, 15.40625, 16.90625, 18.40625, 19.90625, 21.40625, 22.90625, 24.40625, 25.90625, 27.40625, 28.90625, 30.40625, 31.90625, 33.40625, 34.90625, 36.40625, 37.90625, 39.40625, 40.90625, 42.40625, 43.90625, 45.40625, 46.90625, 48.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 15.0, 24.0, 33.0, 46.0, 82.0, 131.0, 225.0, 319.0, 606.0, 870.0, 717.0, 383.0, 224.0, 139.0, 92.0, 49.0, 37.0, 30.0, 22.0, 10.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.4375, -43.90673828125, -42.3759765625, -40.84521484375, -39.314453125, -37.78369140625, -36.2529296875, -34.72216796875, -33.19140625, -31.66064453125, -30.1298828125, -28.59912109375, -27.068359375, -25.53759765625, -24.0068359375, -22.47607421875, -20.9453125, -19.41455078125, -17.8837890625, -16.35302734375, -14.822265625, -13.29150390625, -11.7607421875, -10.22998046875, -8.69921875, -7.16845703125, -5.6376953125, -4.10693359375, -2.576171875, -1.04541015625, 0.4853515625, 2.01611328125, 3.546875, 5.07763671875, 6.6083984375, 8.13916015625, 9.669921875, 11.20068359375, 12.7314453125, 14.26220703125, 15.79296875, 17.32373046875, 18.8544921875, 20.38525390625, 21.916015625, 23.44677734375, 24.9775390625, 26.50830078125, 28.0390625, 29.56982421875, 31.1005859375, 32.63134765625, 34.162109375, 35.69287109375, 37.2236328125, 38.75439453125, 40.28515625, 41.81591796875, 43.3466796875, 44.87744140625, 46.408203125, 47.93896484375, 49.4697265625, 51.00048828125, 52.53125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 11.0, 17.0, 12.0, 28.0, 48.0, 49.0, 69.0, 75.0, 103.0, 141.0, 194.0, 280.0, 510.0, 1785.0, 4179696.0, 9262.0, 750.0, 347.0, 228.0, 175.0, 128.0, 112.0, 90.0, 44.0, 46.0, 26.0, 17.0, 17.0, 10.0, 5.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-308.75, -299.578125, -290.40625, -281.234375, -272.0625, -262.890625, -253.71875, -244.546875, -235.375, -226.203125, -217.03125, -207.859375, -198.6875, -189.515625, -180.34375, -171.171875, -162.0, -152.828125, -143.65625, -134.484375, -125.3125, -116.140625, -106.96875, -97.796875, -88.625, -79.453125, -70.28125, -61.109375, -51.9375, -42.765625, -33.59375, -24.421875, -15.25, -6.078125, 3.09375, 12.265625, 21.4375, 30.609375, 39.78125, 48.953125, 58.125, 67.296875, 76.46875, 85.640625, 94.8125, 103.984375, 113.15625, 122.328125, 131.5, 140.671875, 149.84375, 159.015625, 168.1875, 177.359375, 186.53125, 195.703125, 204.875, 214.046875, 223.21875, 232.390625, 241.5625, 250.734375, 259.90625, 269.078125, 278.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 23.0, 59.0, 108.0, 214.0, 244.0, 180.0, 104.0, 61.0, 9.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.35163116455078, -97.11163330078125, -91.87162780761719, -86.63162231445312, -81.3916244506836, -76.15162658691406, -70.91162109375, -65.67161560058594, -60.431617736816406, -55.19161605834961, -49.95161437988281, -44.711612701416016, -39.47161102294922, -34.23160934448242, -28.991607666015625, -23.751605987548828, -18.51160430908203, -13.271602630615234, -8.031600952148438, -2.7915992736816406, 2.4484024047851562, 7.688404083251953, 12.92840576171875, 18.168407440185547, 23.408409118652344, 28.64841079711914, 33.88841247558594, 39.128414154052734, 44.36841583251953, 49.60841751098633, 54.848419189453125, 60.08842086791992, 65.32843017578125, 70.56843566894531, 75.80843353271484, 81.04843139648438, 86.28843688964844, 91.5284423828125, 96.76844024658203, 102.00843811035156, 107.24844360351562, 112.48844909667969, 117.72844696044922, 122.96844482421875, 128.2084503173828, 133.44845581054688, 138.68844604492188, 143.92845153808594, 149.16845703125, 154.40846252441406, 159.64846801757812, 164.88845825195312, 170.1284637451172, 175.36846923828125, 180.60845947265625, 185.8484649658203, 191.08847045898438, 196.32847595214844, 201.5684814453125, 206.8084716796875, 212.04847717285156, 217.28848266601562, 222.52847290039062, 227.7684783935547, 233.00848388671875]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 8.0, 11.0, 11.0, 11.0, 22.0, 24.0, 20.0, 25.0, 24.0, 42.0, 29.0, 26.0, 41.0, 41.0, 45.0, 42.0, 46.0, 35.0, 39.0, 42.0, 47.0, 36.0, 32.0, 43.0, 32.0, 37.0, 28.0, 29.0, 30.0, 19.0, 7.0, 6.0, 15.0, 11.0, 6.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.59030151367188, -89.48638153076172, -86.38246154785156, -83.2785415649414, -80.17462158203125, -77.07069396972656, -73.9667739868164, -70.86285400390625, -67.7589340209961, -64.65501403808594, -61.55109405517578, -58.44717025756836, -55.3432502746582, -52.23933029174805, -49.135406494140625, -46.03148651123047, -42.92756652832031, -39.823646545410156, -36.7197265625, -33.61580276489258, -30.511882781982422, -27.407962799072266, -24.304040908813477, -21.200119018554688, -18.09619903564453, -14.992278099060059, -11.888357162475586, -8.784436225891113, -5.680515289306641, -2.576594352722168, 0.5273265838623047, 3.6312484741210938, 6.73516845703125, 9.839089393615723, 12.943010330200195, 16.046932220458984, 19.15085220336914, 22.254772186279297, 25.358694076538086, 28.462615966796875, 31.56653594970703, 34.67045593261719, 37.774375915527344, 40.878299713134766, 43.98221969604492, 47.08613967895508, 50.1900634765625, 53.293983459472656, 56.39790344238281, 59.50182342529297, 62.605743408203125, 65.70966339111328, 68.81358337402344, 71.91751098632812, 75.02143096923828, 78.12535095214844, 81.2292709350586, 84.33319091796875, 87.4371109008789, 90.54103088378906, 93.64495849609375, 96.7488784790039, 99.85279846191406, 102.95671844482422, 106.06063842773438]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 13.0, 13.0, 16.0, 20.0, 23.0, 17.0, 19.0, 32.0, 31.0, 34.0, 36.0, 37.0, 38.0, 47.0, 57.0, 43.0, 43.0, 45.0, 42.0, 39.0, 48.0, 23.0, 34.0, 34.0, 33.0, 25.0, 22.0, 20.0, 14.0, 14.0, 11.0, 15.0, 9.0, 10.0, 12.0, 2.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.59375, -16.027587890625, -15.46142578125, -14.895263671875, -14.3291015625, -13.762939453125, -13.19677734375, -12.630615234375, -12.064453125, -11.498291015625, -10.93212890625, -10.365966796875, -9.7998046875, -9.233642578125, -8.66748046875, -8.101318359375, -7.53515625, -6.968994140625, -6.40283203125, -5.836669921875, -5.2705078125, -4.704345703125, -4.13818359375, -3.572021484375, -3.005859375, -2.439697265625, -1.87353515625, -1.307373046875, -0.7412109375, -0.175048828125, 0.39111328125, 0.957275390625, 1.5234375, 2.089599609375, 2.65576171875, 3.221923828125, 3.7880859375, 4.354248046875, 4.92041015625, 5.486572265625, 6.052734375, 6.618896484375, 7.18505859375, 7.751220703125, 8.3173828125, 8.883544921875, 9.44970703125, 10.015869140625, 10.58203125, 11.148193359375, 11.71435546875, 12.280517578125, 12.8466796875, 13.412841796875, 13.97900390625, 14.545166015625, 15.111328125, 15.677490234375, 16.24365234375, 16.809814453125, 17.3759765625, 17.942138671875, 18.50830078125, 19.074462890625, 19.640625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 9.0, 18.0, 19.0, 33.0, 44.0, 77.0, 113.0, 185.0, 294.0, 453.0, 683.0, 1087.0, 1729.0, 2731.0, 4584.0, 7078.0, 11178.0, 17752.0, 28383.0, 47091.0, 81680.0, 161845.0, 334252.0, 151183.0, 77418.0, 45183.0, 27256.0, 16960.0, 10737.0, 6840.0, 4260.0, 2774.0, 1685.0, 1061.0, 676.0, 379.0, 279.0, 183.0, 105.0, 88.0, 56.0, 41.0, 21.0, 16.0, 10.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.34375, -4.1962890625, -4.048828125, -3.9013671875, -3.75390625, -3.6064453125, -3.458984375, -3.3115234375, -3.1640625, -3.0166015625, -2.869140625, -2.7216796875, -2.57421875, -2.4267578125, -2.279296875, -2.1318359375, -1.984375, -1.8369140625, -1.689453125, -1.5419921875, -1.39453125, -1.2470703125, -1.099609375, -0.9521484375, -0.8046875, -0.6572265625, -0.509765625, -0.3623046875, -0.21484375, -0.0673828125, 0.080078125, 0.2275390625, 0.375, 0.5224609375, 0.669921875, 0.8173828125, 0.96484375, 1.1123046875, 1.259765625, 1.4072265625, 1.5546875, 1.7021484375, 1.849609375, 1.9970703125, 2.14453125, 2.2919921875, 2.439453125, 2.5869140625, 2.734375, 2.8818359375, 3.029296875, 3.1767578125, 3.32421875, 3.4716796875, 3.619140625, 3.7666015625, 3.9140625, 4.0615234375, 4.208984375, 4.3564453125, 4.50390625, 4.6513671875, 4.798828125, 4.9462890625, 5.09375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 9.0, 6.0, 9.0, 2.0, 9.0, 15.0, 17.0, 12.0, 19.0, 22.0, 16.0, 20.0, 36.0, 33.0, 36.0, 32.0, 46.0, 36.0, 35.0, 37.0, 1066.0, 60.0, 25.0, 34.0, 32.0, 29.0, 34.0, 36.0, 34.0, 29.0, 26.0, 27.0, 19.0, 23.0, 17.0, 18.0, 18.0, 9.0, 10.0, 8.0, 2.0, 4.0, 6.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.953125, -9.619873046875, -9.28662109375, -8.953369140625, -8.6201171875, -8.286865234375, -7.95361328125, -7.620361328125, -7.287109375, -6.953857421875, -6.62060546875, -6.287353515625, -5.9541015625, -5.620849609375, -5.28759765625, -4.954345703125, -4.62109375, -4.287841796875, -3.95458984375, -3.621337890625, -3.2880859375, -2.954833984375, -2.62158203125, -2.288330078125, -1.955078125, -1.621826171875, -1.28857421875, -0.955322265625, -0.6220703125, -0.288818359375, 0.04443359375, 0.377685546875, 0.7109375, 1.044189453125, 1.37744140625, 1.710693359375, 2.0439453125, 2.377197265625, 2.71044921875, 3.043701171875, 3.376953125, 3.710205078125, 4.04345703125, 4.376708984375, 4.7099609375, 5.043212890625, 5.37646484375, 5.709716796875, 6.04296875, 6.376220703125, 6.70947265625, 7.042724609375, 7.3759765625, 7.709228515625, 8.04248046875, 8.375732421875, 8.708984375, 9.042236328125, 9.37548828125, 9.708740234375, 10.0419921875, 10.375244140625, 10.70849609375, 11.041748046875, 11.375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 9.0, 26.0, 33.0, 38.0, 71.0, 74.0, 124.0, 167.0, 253.0, 376.0, 550.0, 761.0, 1126.0, 1769.0, 2816.0, 4208.0, 6470.0, 10291.0, 16411.0, 26195.0, 42907.0, 72255.0, 128259.0, 1383087.0, 170077.0, 89999.0, 52753.0, 31795.0, 19620.0, 12350.0, 7810.0, 4831.0, 3241.0, 2083.0, 1380.0, 921.0, 623.0, 414.0, 280.0, 206.0, 153.0, 79.0, 77.0, 47.0, 30.0, 23.0, 14.0, 18.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.48046875, -4.34344482421875, -4.2064208984375, -4.06939697265625, -3.932373046875, -3.79534912109375, -3.6583251953125, -3.52130126953125, -3.38427734375, -3.24725341796875, -3.1102294921875, -2.97320556640625, -2.836181640625, -2.69915771484375, -2.5621337890625, -2.42510986328125, -2.2880859375, -2.15106201171875, -2.0140380859375, -1.87701416015625, -1.739990234375, -1.60296630859375, -1.4659423828125, -1.32891845703125, -1.19189453125, -1.05487060546875, -0.9178466796875, -0.78082275390625, -0.643798828125, -0.50677490234375, -0.3697509765625, -0.23272705078125, -0.095703125, 0.04132080078125, 0.1783447265625, 0.31536865234375, 0.452392578125, 0.58941650390625, 0.7264404296875, 0.86346435546875, 1.00048828125, 1.13751220703125, 1.2745361328125, 1.41156005859375, 1.548583984375, 1.68560791015625, 1.8226318359375, 1.95965576171875, 2.0966796875, 2.23370361328125, 2.3707275390625, 2.50775146484375, 2.644775390625, 2.78179931640625, 2.9188232421875, 3.05584716796875, 3.19287109375, 3.32989501953125, 3.4669189453125, 3.60394287109375, 3.740966796875, 3.87799072265625, 4.0150146484375, 4.15203857421875, 4.2890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 5.0, 1.0, 7.0, 7.0, 11.0, 18.0, 24.0, 16.0, 30.0, 35.0, 39.0, 40.0, 52.0, 68.0, 92.0, 86.0, 71.0, 64.0, 67.0, 47.0, 40.0, 34.0, 26.0, 21.0, 23.0, 9.0, 14.0, 8.0, 6.0, 5.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025119781494140625, -0.0024245083332061768, -0.002337038516998291, -0.0022495687007904053, -0.0021620988845825195, -0.002074629068374634, -0.001987159252166748, -0.0018996894359588623, -0.0018122196197509766, -0.0017247498035430908, -0.001637279987335205, -0.0015498101711273193, -0.0014623403549194336, -0.0013748705387115479, -0.0012874007225036621, -0.0011999309062957764, -0.0011124610900878906, -0.0010249912738800049, -0.0009375214576721191, -0.0008500516414642334, -0.0007625818252563477, -0.0006751120090484619, -0.0005876421928405762, -0.0005001723766326904, -0.0004127025604248047, -0.00032523274421691895, -0.0002377629280090332, -0.00015029311180114746, -6.282329559326172e-05, 2.4646520614624023e-05, 0.00011211633682250977, 0.0001995861530303955, 0.00028705596923828125, 0.000374525785446167, 0.00046199560165405273, 0.0005494654178619385, 0.0006369352340698242, 0.00072440505027771, 0.0008118748664855957, 0.0008993446826934814, 0.0009868144989013672, 0.001074284315109253, 0.0011617541313171387, 0.0012492239475250244, 0.0013366937637329102, 0.001424163579940796, 0.0015116333961486816, 0.0015991032123565674, 0.0016865730285644531, 0.0017740428447723389, 0.0018615126609802246, 0.0019489824771881104, 0.002036452293395996, 0.002123922109603882, 0.0022113919258117676, 0.0022988617420196533, 0.002386331558227539, 0.002473801374435425, 0.0025612711906433105, 0.0026487410068511963, 0.002736210823059082, 0.0028236806392669678, 0.0029111504554748535, 0.0029986202716827393, 0.003086090087890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 8.0, 15.0, 13.0, 21.0, 29.0, 30.0, 44.0, 75.0, 102.0, 191.0, 489.0, 5950.0, 1039307.0, 1408.0, 362.0, 151.0, 101.0, 63.0, 40.0, 29.0, 25.0, 19.0, 17.0, 14.0, 7.0, 5.0, 1.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08770751953125, -0.08522510528564453, -0.08274269104003906, -0.0802602767944336, -0.07777786254882812, -0.07529544830322266, -0.07281303405761719, -0.07033061981201172, -0.06784820556640625, -0.06536579132080078, -0.06288337707519531, -0.060400962829589844, -0.057918548583984375, -0.055436134338378906, -0.05295372009277344, -0.05047130584716797, -0.0479888916015625, -0.04550647735595703, -0.04302406311035156, -0.040541648864746094, -0.038059234619140625, -0.035576820373535156, -0.03309440612792969, -0.03061199188232422, -0.02812957763671875, -0.02564716339111328, -0.023164749145507812, -0.020682334899902344, -0.018199920654296875, -0.015717506408691406, -0.013235092163085938, -0.010752677917480469, -0.008270263671875, -0.005787849426269531, -0.0033054351806640625, -0.0008230209350585938, 0.001659393310546875, 0.004141807556152344, 0.0066242218017578125, 0.009106636047363281, 0.01158905029296875, 0.014071464538574219, 0.016553878784179688, 0.019036293029785156, 0.021518707275390625, 0.024001121520996094, 0.026483535766601562, 0.02896595001220703, 0.0314483642578125, 0.03393077850341797, 0.03641319274902344, 0.038895606994628906, 0.041378021240234375, 0.043860435485839844, 0.04634284973144531, 0.04882526397705078, 0.05130767822265625, 0.05379009246826172, 0.05627250671386719, 0.058754920959472656, 0.061237335205078125, 0.0637197494506836, 0.06620216369628906, 0.06868457794189453, 0.0711669921875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 25.0, 72.0, 202.0, 330.0, 235.0, 97.0, 34.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00419703871011734, -0.004098706413060427, -0.004000373650342226, -0.0039020413532853127, -0.0038037088233977556, -0.0037053762935101986, -0.0036070439964532852, -0.003508711466565728, -0.003410378936678171, -0.003312046406790614, -0.0032137141097337008, -0.0031153815798461437, -0.0030170490499585867, -0.0029187165200710297, -0.0028203842230141163, -0.0027220516931265593, -0.002623719396069646, -0.002525386866182089, -0.0024270545691251755, -0.0023287220392376184, -0.0022303895093500614, -0.002132057212293148, -0.002033724682405591, -0.001935392152518034, -0.0018370597390457988, -0.0017387273255735636, -0.0016403947956860065, -0.0015420623822137713, -0.0014437299687415361, -0.0013453974388539791, -0.001247065025381744, -0.0011487326119095087, -0.0010504000820219517, -0.0009520676103420556, -0.0008537351386621594, -0.0007554027251899242, -0.0006570702535100281, -0.000558737781830132, -0.0004604053683578968, -0.0003620728966780007, -0.00026374042499810457, -0.00016540796787012368, -6.70755107421428e-05, 3.125693183392286e-05, 0.00012958940351381898, 0.0002279218751937151, 0.0003262542886659503, 0.0004245867603458464, 0.0005229192320257425, 0.0006212517037056386, 0.0007195841753855348, 0.00081791658885777, 0.0009162490605376661, 0.0010145815322175622, 0.0011129139456897974, 0.0012112464755773544, 0.0013095788890495896, 0.0014079113025218248, 0.0015062438324093819, 0.001604576245881617, 0.0017029086593538523, 0.0018012411892414093, 0.0018995736027136445, 0.0019979060161858797, 0.0020962385460734367]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 10.0, 8.0, 13.0, 15.0, 11.0, 22.0, 26.0, 26.0, 23.0, 27.0, 31.0, 35.0, 35.0, 28.0, 36.0, 36.0, 42.0, 41.0, 35.0, 48.0, 40.0, 29.0, 35.0, 41.0, 34.0, 24.0, 29.0, 19.0, 21.0, 24.0, 20.0, 19.0, 14.0, 23.0, 15.0, 5.0, 13.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011341571807861328, -0.0010976670309901237, -0.0010611768811941147, -0.0010246867313981056, -0.0009881965816020966, -0.0009517064318060875, -0.0009152162820100784, -0.0008787261322140694, -0.0008422359824180603, -0.0008057458326220512, -0.0007692556828260422, -0.0007327655330300331, -0.000696275383234024, -0.000659785233438015, -0.0006232950836420059, -0.0005868049338459969, -0.0005503147840499878, -0.0005138246342539787, -0.00047733448445796967, -0.0004408443346619606, -0.00040435418486595154, -0.0003678640350699425, -0.0003313738852739334, -0.00029488373547792435, -0.0002583935856819153, -0.00022190343588590622, -0.00018541328608989716, -0.0001489231362938881, -0.00011243298649787903, -7.594283670186996e-05, -3.94526869058609e-05, -2.962537109851837e-06, 3.3527612686157227e-05, 7.001776248216629e-05, 0.00010650791227817535, 0.00014299806207418442, 0.00017948821187019348, 0.00021597836166620255, 0.0002524685114622116, 0.00028895866125822067, 0.00032544881105422974, 0.0003619389608502388, 0.00039842911064624786, 0.00043491926044225693, 0.000471409410238266, 0.0005078995600342751, 0.0005443897098302841, 0.0005808798596262932, 0.0006173700094223022, 0.0006538601592183113, 0.0006903503090143204, 0.0007268404588103294, 0.0007633306086063385, 0.0007998207584023476, 0.0008363109081983566, 0.0008728010579943657, 0.0009092912077903748, 0.0009457813575863838, 0.0009822715073823929, 0.001018761657178402, 0.001055251806974411, 0.00109174195677042, 0.0011282321065664291, 0.0011647222563624382, 0.0012012124061584473]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 13.0, 13.0, 16.0, 20.0, 23.0, 17.0, 19.0, 32.0, 31.0, 34.0, 36.0, 37.0, 38.0, 47.0, 57.0, 43.0, 43.0, 45.0, 42.0, 39.0, 48.0, 23.0, 34.0, 34.0, 33.0, 25.0, 22.0, 20.0, 14.0, 14.0, 11.0, 15.0, 9.0, 10.0, 12.0, 2.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.59375, -16.027587890625, -15.46142578125, -14.895263671875, -14.3291015625, -13.762939453125, -13.19677734375, -12.630615234375, -12.064453125, -11.498291015625, -10.93212890625, -10.365966796875, -9.7998046875, -9.233642578125, -8.66748046875, -8.101318359375, -7.53515625, -6.968994140625, -6.40283203125, -5.836669921875, -5.2705078125, -4.704345703125, -4.13818359375, -3.572021484375, -3.005859375, -2.439697265625, -1.87353515625, -1.307373046875, -0.7412109375, -0.175048828125, 0.39111328125, 0.957275390625, 1.5234375, 2.089599609375, 2.65576171875, 3.221923828125, 3.7880859375, 4.354248046875, 4.92041015625, 5.486572265625, 6.052734375, 6.618896484375, 7.18505859375, 7.751220703125, 8.3173828125, 8.883544921875, 9.44970703125, 10.015869140625, 10.58203125, 11.148193359375, 11.71435546875, 12.280517578125, 12.8466796875, 13.412841796875, 13.97900390625, 14.545166015625, 15.111328125, 15.677490234375, 16.24365234375, 16.809814453125, 17.3759765625, 17.942138671875, 18.50830078125, 19.074462890625, 19.640625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 9.0, 11.0, 15.0, 25.0, 37.0, 39.0, 56.0, 55.0, 84.0, 127.0, 170.0, 286.0, 402.0, 715.0, 1494.0, 6068.0, 62917.0, 822534.0, 138729.0, 10382.0, 2067.0, 800.0, 520.0, 299.0, 182.0, 140.0, 92.0, 65.0, 50.0, 43.0, 26.0, 27.0, 16.0, 13.0, 12.0, 13.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.9375, -29.8935546875, -28.849609375, -27.8056640625, -26.76171875, -25.7177734375, -24.673828125, -23.6298828125, -22.5859375, -21.5419921875, -20.498046875, -19.4541015625, -18.41015625, -17.3662109375, -16.322265625, -15.2783203125, -14.234375, -13.1904296875, -12.146484375, -11.1025390625, -10.05859375, -9.0146484375, -7.970703125, -6.9267578125, -5.8828125, -4.8388671875, -3.794921875, -2.7509765625, -1.70703125, -0.6630859375, 0.380859375, 1.4248046875, 2.46875, 3.5126953125, 4.556640625, 5.6005859375, 6.64453125, 7.6884765625, 8.732421875, 9.7763671875, 10.8203125, 11.8642578125, 12.908203125, 13.9521484375, 14.99609375, 16.0400390625, 17.083984375, 18.1279296875, 19.171875, 20.2158203125, 21.259765625, 22.3037109375, 23.34765625, 24.3916015625, 25.435546875, 26.4794921875, 27.5234375, 28.5673828125, 29.611328125, 30.6552734375, 31.69921875, 32.7431640625, 33.787109375, 34.8310546875, 35.875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 6.0, 8.0, 16.0, 7.0, 18.0, 21.0, 15.0, 25.0, 23.0, 37.0, 30.0, 40.0, 47.0, 34.0, 57.0, 65.0, 181.0, 1837.0, 120.0, 61.0, 47.0, 36.0, 41.0, 33.0, 32.0, 26.0, 19.0, 28.0, 17.0, 27.0, 16.0, 10.0, 13.0, 10.0, 9.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-58.03125, -56.2421875, -54.453125, -52.6640625, -50.875, -49.0859375, -47.296875, -45.5078125, -43.71875, -41.9296875, -40.140625, -38.3515625, -36.5625, -34.7734375, -32.984375, -31.1953125, -29.40625, -27.6171875, -25.828125, -24.0390625, -22.25, -20.4609375, -18.671875, -16.8828125, -15.09375, -13.3046875, -11.515625, -9.7265625, -7.9375, -6.1484375, -4.359375, -2.5703125, -0.78125, 1.0078125, 2.796875, 4.5859375, 6.375, 8.1640625, 9.953125, 11.7421875, 13.53125, 15.3203125, 17.109375, 18.8984375, 20.6875, 22.4765625, 24.265625, 26.0546875, 27.84375, 29.6328125, 31.421875, 33.2109375, 35.0, 36.7890625, 38.578125, 40.3671875, 42.15625, 43.9453125, 45.734375, 47.5234375, 49.3125, 51.1015625, 52.890625, 54.6796875, 56.46875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 3.0, 9.0, 13.0, 12.0, 11.0, 17.0, 28.0, 19.0, 22.0, 25.0, 33.0, 43.0, 60.0, 96.0, 154.0, 257.0, 546.0, 3388.0, 3134334.0, 5137.0, 597.0, 285.0, 161.0, 102.0, 72.0, 44.0, 51.0, 28.0, 25.0, 21.0, 21.0, 20.0, 10.0, 14.0, 7.0, 6.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-169.5, -164.126953125, -158.75390625, -153.380859375, -148.0078125, -142.634765625, -137.26171875, -131.888671875, -126.515625, -121.142578125, -115.76953125, -110.396484375, -105.0234375, -99.650390625, -94.27734375, -88.904296875, -83.53125, -78.158203125, -72.78515625, -67.412109375, -62.0390625, -56.666015625, -51.29296875, -45.919921875, -40.546875, -35.173828125, -29.80078125, -24.427734375, -19.0546875, -13.681640625, -8.30859375, -2.935546875, 2.4375, 7.810546875, 13.18359375, 18.556640625, 23.9296875, 29.302734375, 34.67578125, 40.048828125, 45.421875, 50.794921875, 56.16796875, 61.541015625, 66.9140625, 72.287109375, 77.66015625, 83.033203125, 88.40625, 93.779296875, 99.15234375, 104.525390625, 109.8984375, 115.271484375, 120.64453125, 126.017578125, 131.390625, 136.763671875, 142.13671875, 147.509765625, 152.8828125, 158.255859375, 163.62890625, 169.001953125, 174.375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 18.0, 24.0, 65.0, 109.0, 146.0, 159.0, 130.0, 113.0, 85.0, 57.0, 47.0, 24.0, 13.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.0739803314209, -25.8387451171875, -24.60350799560547, -23.36827278137207, -22.13303565979004, -20.89780044555664, -19.66256332397461, -18.42732810974121, -17.192092895507812, -15.956856727600098, -14.721620559692383, -13.486385345458984, -12.251148223876953, -11.015913009643555, -9.78067684173584, -8.545440673828125, -7.310203552246094, -6.074967384338379, -4.839731216430664, -3.6044955253601074, -2.3692593574523926, -1.1340231895446777, 0.1012125015258789, 1.3364486694335938, 2.5716848373413086, 3.8069210052490234, 5.042157173156738, 6.277392864227295, 7.51262903213501, 8.747865676879883, 9.983100891113281, 11.218337059020996, 12.453571319580078, 13.688807487487793, 14.924043655395508, 16.159278869628906, 17.394515991210938, 18.629751205444336, 19.864986419677734, 21.100223541259766, 22.335460662841797, 23.570695877075195, 24.805932998657227, 26.041168212890625, 27.276405334472656, 28.511640548706055, 29.746875762939453, 30.982112884521484, 32.21734619140625, 33.45258331298828, 34.68781661987305, 35.92305374145508, 37.15829086303711, 38.39352798461914, 39.628761291503906, 40.86399841308594, 42.09923553466797, 43.33447265625, 44.569705963134766, 45.8049430847168, 47.04018020629883, 48.27541732788086, 49.510650634765625, 50.745887756347656, 51.98112487792969]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 10.0, 9.0, 13.0, 12.0, 11.0, 17.0, 22.0, 24.0, 28.0, 20.0, 29.0, 28.0, 46.0, 44.0, 36.0, 40.0, 50.0, 53.0, 40.0, 34.0, 38.0, 34.0, 41.0, 29.0, 32.0, 30.0, 44.0, 24.0, 24.0, 24.0, 24.0, 16.0, 15.0, 8.0, 11.0, 7.0, 9.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-170.48995971679688, -165.18670654296875, -159.88345336914062, -154.5802001953125, -149.27694702148438, -143.97369384765625, -138.67044067382812, -133.3671875, -128.06393432617188, -122.76068115234375, -117.45742797851562, -112.1541748046875, -106.85092163085938, -101.54766845703125, -96.24442291259766, -90.94116973876953, -85.63792419433594, -80.33467102050781, -75.03141784667969, -69.72816467285156, -64.42491149902344, -59.12166213989258, -53.81841278076172, -48.515159606933594, -43.21190643310547, -37.908653259277344, -32.60540008544922, -27.30215072631836, -21.998897552490234, -16.69564437866211, -11.392393112182617, -6.089141845703125, -0.7859039306640625, 4.517348289489746, 9.820600509643555, 15.123852729797363, 20.427104949951172, 25.730358123779297, 31.03360939025879, 36.33686065673828, 41.640113830566406, 46.94336700439453, 52.246620178222656, 57.549869537353516, 62.85312271118164, 68.1563720703125, 73.45962524414062, 78.76287841796875, 84.06613159179688, 89.369384765625, 94.67263793945312, 99.97589111328125, 105.27914428710938, 110.5823974609375, 115.8856430053711, 121.18889617919922, 126.49214935302734, 131.79539489746094, 137.09864807128906, 142.4019012451172, 147.7051544189453, 153.00840759277344, 158.31166076660156, 163.6149139404297, 168.9181671142578]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 7.0, 5.0, 9.0, 11.0, 14.0, 14.0, 10.0, 26.0, 18.0, 27.0, 23.0, 43.0, 27.0, 30.0, 33.0, 37.0, 48.0, 41.0, 44.0, 45.0, 40.0, 42.0, 41.0, 39.0, 37.0, 32.0, 37.0, 29.0, 26.0, 24.0, 26.0, 17.0, 13.0, 15.0, 14.0, 8.0, 12.0, 12.0, 4.0, 7.0, 3.0, 3.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.875, -16.30908203125, -15.7431640625, -15.17724609375, -14.611328125, -14.04541015625, -13.4794921875, -12.91357421875, -12.34765625, -11.78173828125, -11.2158203125, -10.64990234375, -10.083984375, -9.51806640625, -8.9521484375, -8.38623046875, -7.8203125, -7.25439453125, -6.6884765625, -6.12255859375, -5.556640625, -4.99072265625, -4.4248046875, -3.85888671875, -3.29296875, -2.72705078125, -2.1611328125, -1.59521484375, -1.029296875, -0.46337890625, 0.1025390625, 0.66845703125, 1.234375, 1.80029296875, 2.3662109375, 2.93212890625, 3.498046875, 4.06396484375, 4.6298828125, 5.19580078125, 5.76171875, 6.32763671875, 6.8935546875, 7.45947265625, 8.025390625, 8.59130859375, 9.1572265625, 9.72314453125, 10.2890625, 10.85498046875, 11.4208984375, 11.98681640625, 12.552734375, 13.11865234375, 13.6845703125, 14.25048828125, 14.81640625, 15.38232421875, 15.9482421875, 16.51416015625, 17.080078125, 17.64599609375, 18.2119140625, 18.77783203125, 19.34375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 6.0, 12.0, 16.0, 15.0, 20.0, 37.0, 38.0, 38.0, 46.0, 62.0, 75.0, 107.0, 139.0, 196.0, 288.0, 472.0, 886.0, 1798.0, 4200.0, 12072.0, 44472.0, 188221.0, 697838.0, 1462494.0, 1196676.0, 437867.0, 106834.0, 25633.0, 7699.0, 2760.0, 1282.0, 702.0, 372.0, 225.0, 168.0, 119.0, 96.0, 79.0, 62.0, 37.0, 37.0, 20.0, 17.0, 11.0, 12.0, 7.0, 9.0, 7.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.171875, -16.595703125, -16.01953125, -15.443359375, -14.8671875, -14.291015625, -13.71484375, -13.138671875, -12.5625, -11.986328125, -11.41015625, -10.833984375, -10.2578125, -9.681640625, -9.10546875, -8.529296875, -7.953125, -7.376953125, -6.80078125, -6.224609375, -5.6484375, -5.072265625, -4.49609375, -3.919921875, -3.34375, -2.767578125, -2.19140625, -1.615234375, -1.0390625, -0.462890625, 0.11328125, 0.689453125, 1.265625, 1.841796875, 2.41796875, 2.994140625, 3.5703125, 4.146484375, 4.72265625, 5.298828125, 5.875, 6.451171875, 7.02734375, 7.603515625, 8.1796875, 8.755859375, 9.33203125, 9.908203125, 10.484375, 11.060546875, 11.63671875, 12.212890625, 12.7890625, 13.365234375, 13.94140625, 14.517578125, 15.09375, 15.669921875, 16.24609375, 16.822265625, 17.3984375, 17.974609375, 18.55078125, 19.126953125, 19.703125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 14.0, 14.0, 19.0, 23.0, 43.0, 55.0, 73.0, 105.0, 151.0, 185.0, 257.0, 358.0, 520.0, 556.0, 502.0, 347.0, 208.0, 179.0, 131.0, 91.0, 64.0, 46.0, 40.0, 31.0, 13.0, 13.0, 9.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.125, -47.84619140625, -46.5673828125, -45.28857421875, -44.009765625, -42.73095703125, -41.4521484375, -40.17333984375, -38.89453125, -37.61572265625, -36.3369140625, -35.05810546875, -33.779296875, -32.50048828125, -31.2216796875, -29.94287109375, -28.6640625, -27.38525390625, -26.1064453125, -24.82763671875, -23.548828125, -22.27001953125, -20.9912109375, -19.71240234375, -18.43359375, -17.15478515625, -15.8759765625, -14.59716796875, -13.318359375, -12.03955078125, -10.7607421875, -9.48193359375, -8.203125, -6.92431640625, -5.6455078125, -4.36669921875, -3.087890625, -1.80908203125, -0.5302734375, 0.74853515625, 2.02734375, 3.30615234375, 4.5849609375, 5.86376953125, 7.142578125, 8.42138671875, 9.7001953125, 10.97900390625, 12.2578125, 13.53662109375, 14.8154296875, 16.09423828125, 17.373046875, 18.65185546875, 19.9306640625, 21.20947265625, 22.48828125, 23.76708984375, 25.0458984375, 26.32470703125, 27.603515625, 28.88232421875, 30.1611328125, 31.43994140625, 32.71875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 4.0, 3.0, 8.0, 12.0, 18.0, 10.0, 25.0, 29.0, 32.0, 40.0, 50.0, 59.0, 86.0, 101.0, 134.0, 138.0, 197.0, 234.0, 282.0, 480.0, 1319.0, 60280.0, 4123474.0, 4652.0, 761.0, 404.0, 267.0, 204.0, 197.0, 149.0, 132.0, 92.0, 97.0, 51.0, 49.0, 40.0, 43.0, 29.0, 20.0, 15.0, 14.0, 15.0, 7.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-166.125, -160.642578125, -155.16015625, -149.677734375, -144.1953125, -138.712890625, -133.23046875, -127.748046875, -122.265625, -116.783203125, -111.30078125, -105.818359375, -100.3359375, -94.853515625, -89.37109375, -83.888671875, -78.40625, -72.923828125, -67.44140625, -61.958984375, -56.4765625, -50.994140625, -45.51171875, -40.029296875, -34.546875, -29.064453125, -23.58203125, -18.099609375, -12.6171875, -7.134765625, -1.65234375, 3.830078125, 9.3125, 14.794921875, 20.27734375, 25.759765625, 31.2421875, 36.724609375, 42.20703125, 47.689453125, 53.171875, 58.654296875, 64.13671875, 69.619140625, 75.1015625, 80.583984375, 86.06640625, 91.548828125, 97.03125, 102.513671875, 107.99609375, 113.478515625, 118.9609375, 124.443359375, 129.92578125, 135.408203125, 140.890625, 146.373046875, 151.85546875, 157.337890625, 162.8203125, 168.302734375, 173.78515625, 179.267578125, 184.75]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 31.0, 338.0, 569.0, 72.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-825.1871337890625, -809.674072265625, -794.1610107421875, -778.64794921875, -763.1348876953125, -747.621826171875, -732.1087646484375, -716.5957641601562, -701.0827026367188, -685.5696411132812, -670.0565795898438, -654.5435180664062, -639.0304565429688, -623.5174560546875, -608.00439453125, -592.4913330078125, -576.978271484375, -561.4652099609375, -545.9521484375, -530.4390869140625, -514.926025390625, -499.4129943847656, -483.8999328613281, -468.3868713378906, -452.873779296875, -437.3607177734375, -421.84765625, -406.3345947265625, -390.8215637207031, -375.3085021972656, -359.7954406738281, -344.2823791503906, -328.7693786621094, -313.2563171386719, -297.7432556152344, -282.230224609375, -266.7171630859375, -251.2041015625, -235.6910400390625, -220.177978515625, -204.66493225097656, -189.15187072753906, -173.63882446289062, -158.12576293945312, -142.61270141601562, -127.09965515136719, -111.58659362792969, -96.07353973388672, -80.56048583984375, -65.04743194580078, -49.53437423706055, -34.02131652832031, -18.508262634277344, -2.995208740234375, 12.517852783203125, 28.030906677246094, 43.54396057128906, 59.05701446533203, 74.570068359375, 90.0831298828125, 105.59618377685547, 121.10923767089844, 136.62229919433594, 152.13534545898438, 167.64840698242188]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 9.0, 3.0, 4.0, 18.0, 21.0, 9.0, 24.0, 21.0, 20.0, 18.0, 18.0, 35.0, 25.0, 25.0, 35.0, 40.0, 40.0, 33.0, 39.0, 53.0, 58.0, 32.0, 45.0, 44.0, 37.0, 28.0, 35.0, 35.0, 28.0, 22.0, 29.0, 28.0, 21.0, 16.0, 10.0, 4.0, 9.0, 8.0, 14.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.32623291015625, -121.19496154785156, -117.06369018554688, -112.93242645263672, -108.80115509033203, -104.66988372802734, -100.53861999511719, -96.4073486328125, -92.27607727050781, -88.14480590820312, -84.01353454589844, -79.88227081298828, -75.7509994506836, -71.6197280883789, -67.48846435546875, -63.35719299316406, -59.225921630859375, -55.09465026855469, -50.963382720947266, -46.832115173339844, -42.700843811035156, -38.56957244873047, -34.43830490112305, -30.307035446166992, -26.175765991210938, -22.044496536254883, -17.913227081298828, -13.781957626342773, -9.650688171386719, -5.519418716430664, -1.3881492614746094, 2.7431201934814453, 6.8743896484375, 11.005659103393555, 15.13692855834961, 19.268198013305664, 23.39946746826172, 27.530736923217773, 31.662006378173828, 35.79327392578125, 39.92454528808594, 44.055816650390625, 48.18708419799805, 52.31835174560547, 56.449623107910156, 60.580894470214844, 64.712158203125, 68.84342956542969, 72.97470092773438, 77.10597229003906, 81.23724365234375, 85.3685073852539, 89.4997787475586, 93.63105010986328, 97.76231384277344, 101.89358520507812, 106.02485656738281, 110.1561279296875, 114.28739929199219, 118.41866302490234, 122.54993438720703, 126.68120574951172, 130.81246948242188, 134.94374084472656, 139.07501220703125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 4.0, 10.0, 10.0, 6.0, 7.0, 17.0, 16.0, 16.0, 21.0, 28.0, 17.0, 30.0, 38.0, 33.0, 38.0, 34.0, 38.0, 28.0, 34.0, 37.0, 39.0, 43.0, 41.0, 38.0, 41.0, 32.0, 41.0, 30.0, 24.0, 28.0, 30.0, 24.0, 18.0, 13.0, 15.0, 17.0, 7.0, 15.0, 7.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.890625, -15.370361328125, -14.85009765625, -14.329833984375, -13.8095703125, -13.289306640625, -12.76904296875, -12.248779296875, -11.728515625, -11.208251953125, -10.68798828125, -10.167724609375, -9.6474609375, -9.127197265625, -8.60693359375, -8.086669921875, -7.56640625, -7.046142578125, -6.52587890625, -6.005615234375, -5.4853515625, -4.965087890625, -4.44482421875, -3.924560546875, -3.404296875, -2.884033203125, -2.36376953125, -1.843505859375, -1.3232421875, -0.802978515625, -0.28271484375, 0.237548828125, 0.7578125, 1.278076171875, 1.79833984375, 2.318603515625, 2.8388671875, 3.359130859375, 3.87939453125, 4.399658203125, 4.919921875, 5.440185546875, 5.96044921875, 6.480712890625, 7.0009765625, 7.521240234375, 8.04150390625, 8.561767578125, 9.08203125, 9.602294921875, 10.12255859375, 10.642822265625, 11.1630859375, 11.683349609375, 12.20361328125, 12.723876953125, 13.244140625, 13.764404296875, 14.28466796875, 14.804931640625, 15.3251953125, 15.845458984375, 16.36572265625, 16.885986328125, 17.40625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 9.0, 16.0, 33.0, 55.0, 73.0, 94.0, 120.0, 203.0, 272.0, 393.0, 523.0, 738.0, 1050.0, 1413.0, 2080.0, 2949.0, 4084.0, 5797.0, 8180.0, 11755.0, 17174.0, 25116.0, 38024.0, 57634.0, 91173.0, 171198.0, 271852.0, 119748.0, 71713.0, 46068.0, 30741.0, 20599.0, 14170.0, 9808.0, 6915.0, 4918.0, 3395.0, 2402.0, 1751.0, 1269.0, 857.0, 640.0, 473.0, 316.0, 236.0, 139.0, 107.0, 89.0, 58.0, 43.0, 20.0, 21.0, 16.0, 7.0, 7.0, 7.0, 3.0], "bins": [-3.7734375, -3.659942626953125, -3.54644775390625, -3.432952880859375, -3.3194580078125, -3.205963134765625, -3.09246826171875, -2.978973388671875, -2.865478515625, -2.751983642578125, -2.63848876953125, -2.524993896484375, -2.4114990234375, -2.298004150390625, -2.18450927734375, -2.071014404296875, -1.95751953125, -1.844024658203125, -1.73052978515625, -1.617034912109375, -1.5035400390625, -1.390045166015625, -1.27655029296875, -1.163055419921875, -1.049560546875, -0.936065673828125, -0.82257080078125, -0.709075927734375, -0.5955810546875, -0.482086181640625, -0.36859130859375, -0.255096435546875, -0.1416015625, -0.028106689453125, 0.08538818359375, 0.198883056640625, 0.3123779296875, 0.425872802734375, 0.53936767578125, 0.652862548828125, 0.766357421875, 0.879852294921875, 0.99334716796875, 1.106842041015625, 1.2203369140625, 1.333831787109375, 1.44732666015625, 1.560821533203125, 1.67431640625, 1.787811279296875, 1.90130615234375, 2.014801025390625, 2.1282958984375, 2.241790771484375, 2.35528564453125, 2.468780517578125, 2.582275390625, 2.695770263671875, 2.80926513671875, 2.922760009765625, 3.0362548828125, 3.149749755859375, 3.26324462890625, 3.376739501953125, 3.490234375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 6.0, 9.0, 6.0, 10.0, 11.0, 21.0, 20.0, 15.0, 17.0, 23.0, 20.0, 24.0, 31.0, 41.0, 53.0, 30.0, 40.0, 44.0, 31.0, 1064.0, 42.0, 40.0, 36.0, 44.0, 38.0, 38.0, 32.0, 25.0, 26.0, 21.0, 27.0, 22.0, 17.0, 19.0, 13.0, 12.0, 7.0, 10.0, 7.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.46875, -10.1368408203125, -9.804931640625, -9.4730224609375, -9.14111328125, -8.8092041015625, -8.477294921875, -8.1453857421875, -7.8134765625, -7.4815673828125, -7.149658203125, -6.8177490234375, -6.48583984375, -6.1539306640625, -5.822021484375, -5.4901123046875, -5.158203125, -4.8262939453125, -4.494384765625, -4.1624755859375, -3.83056640625, -3.4986572265625, -3.166748046875, -2.8348388671875, -2.5029296875, -2.1710205078125, -1.839111328125, -1.5072021484375, -1.17529296875, -0.8433837890625, -0.511474609375, -0.1795654296875, 0.15234375, 0.4842529296875, 0.816162109375, 1.1480712890625, 1.47998046875, 1.8118896484375, 2.143798828125, 2.4757080078125, 2.8076171875, 3.1395263671875, 3.471435546875, 3.8033447265625, 4.13525390625, 4.4671630859375, 4.799072265625, 5.1309814453125, 5.462890625, 5.7947998046875, 6.126708984375, 6.4586181640625, 6.79052734375, 7.1224365234375, 7.454345703125, 7.7862548828125, 8.1181640625, 8.4500732421875, 8.781982421875, 9.1138916015625, 9.44580078125, 9.7777099609375, 10.109619140625, 10.4415283203125, 10.7734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 5.0, 14.0, 12.0, 24.0, 33.0, 42.0, 69.0, 78.0, 135.0, 159.0, 242.0, 347.0, 478.0, 693.0, 1008.0, 1508.0, 2314.0, 3348.0, 5176.0, 7803.0, 12274.0, 18939.0, 29830.0, 48616.0, 84619.0, 160570.0, 1375720.0, 142729.0, 76966.0, 44751.0, 27855.0, 17602.0, 11267.0, 7280.0, 4736.0, 3183.0, 2089.0, 1389.0, 980.0, 683.0, 508.0, 308.0, 212.0, 144.0, 106.0, 74.0, 76.0, 46.0, 27.0, 16.0, 18.0, 10.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0], "bins": [-4.23046875, -4.0999755859375, -3.969482421875, -3.8389892578125, -3.70849609375, -3.5780029296875, -3.447509765625, -3.3170166015625, -3.1865234375, -3.0560302734375, -2.925537109375, -2.7950439453125, -2.66455078125, -2.5340576171875, -2.403564453125, -2.2730712890625, -2.142578125, -2.0120849609375, -1.881591796875, -1.7510986328125, -1.62060546875, -1.4901123046875, -1.359619140625, -1.2291259765625, -1.0986328125, -0.9681396484375, -0.837646484375, -0.7071533203125, -0.57666015625, -0.4461669921875, -0.315673828125, -0.1851806640625, -0.0546875, 0.0758056640625, 0.206298828125, 0.3367919921875, 0.46728515625, 0.5977783203125, 0.728271484375, 0.8587646484375, 0.9892578125, 1.1197509765625, 1.250244140625, 1.3807373046875, 1.51123046875, 1.6417236328125, 1.772216796875, 1.9027099609375, 2.033203125, 2.1636962890625, 2.294189453125, 2.4246826171875, 2.55517578125, 2.6856689453125, 2.816162109375, 2.9466552734375, 3.0771484375, 3.2076416015625, 3.338134765625, 3.4686279296875, 3.59912109375, 3.7296142578125, 3.860107421875, 3.9906005859375, 4.12109375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 10.0, 8.0, 20.0, 26.0, 29.0, 32.0, 50.0, 77.0, 76.0, 113.0, 126.0, 111.0, 70.0, 53.0, 52.0, 36.0, 30.0, 18.0, 13.0, 8.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00270843505859375, -0.0026085376739501953, -0.0025086402893066406, -0.002408742904663086, -0.0023088455200195312, -0.0022089481353759766, -0.002109050750732422, -0.002009153366088867, -0.0019092559814453125, -0.0018093585968017578, -0.0017094612121582031, -0.0016095638275146484, -0.0015096664428710938, -0.001409769058227539, -0.0013098716735839844, -0.0012099742889404297, -0.001110076904296875, -0.0010101795196533203, -0.0009102821350097656, -0.0008103847503662109, -0.0007104873657226562, -0.0006105899810791016, -0.0005106925964355469, -0.0004107952117919922, -0.0003108978271484375, -0.0002110004425048828, -0.00011110305786132812, -1.1205673217773438e-05, 8.869171142578125e-05, 0.00018858909606933594, 0.0002884864807128906, 0.0003883838653564453, 0.00048828125, 0.0005881786346435547, 0.0006880760192871094, 0.0007879734039306641, 0.0008878707885742188, 0.0009877681732177734, 0.0010876655578613281, 0.0011875629425048828, 0.0012874603271484375, 0.0013873577117919922, 0.0014872550964355469, 0.0015871524810791016, 0.0016870498657226562, 0.001786947250366211, 0.0018868446350097656, 0.0019867420196533203, 0.002086639404296875, 0.0021865367889404297, 0.0022864341735839844, 0.002386331558227539, 0.0024862289428710938, 0.0025861263275146484, 0.002686023712158203, 0.002785921096801758, 0.0028858184814453125, 0.002985715866088867, 0.003085613250732422, 0.0031855106353759766, 0.0032854080200195312, 0.003385305404663086, 0.0034852027893066406, 0.0035851001739501953, 0.00368499755859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 8.0, 5.0, 8.0, 10.0, 8.0, 16.0, 17.0, 35.0, 44.0, 57.0, 94.0, 133.0, 294.0, 803.0, 317562.0, 727913.0, 798.0, 302.0, 151.0, 63.0, 67.0, 33.0, 33.0, 20.0, 17.0, 12.0, 11.0, 5.0, 5.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.08294677734375, -0.08070659637451172, -0.07846641540527344, -0.07622623443603516, -0.07398605346679688, -0.0717458724975586, -0.06950569152832031, -0.06726551055908203, -0.06502532958984375, -0.06278514862060547, -0.06054496765136719, -0.058304786682128906, -0.056064605712890625, -0.053824424743652344, -0.05158424377441406, -0.04934406280517578, -0.0471038818359375, -0.04486370086669922, -0.04262351989746094, -0.040383338928222656, -0.038143157958984375, -0.035902976989746094, -0.03366279602050781, -0.03142261505126953, -0.02918243408203125, -0.02694225311279297, -0.024702072143554688, -0.022461891174316406, -0.020221710205078125, -0.017981529235839844, -0.015741348266601562, -0.013501167297363281, -0.011260986328125, -0.009020805358886719, -0.0067806243896484375, -0.004540443420410156, -0.002300262451171875, -6.008148193359375e-05, 0.0021800994873046875, 0.004420280456542969, 0.00666046142578125, 0.008900642395019531, 0.011140823364257812, 0.013381004333496094, 0.015621185302734375, 0.017861366271972656, 0.020101547241210938, 0.02234172821044922, 0.0245819091796875, 0.02682209014892578, 0.029062271118164062, 0.031302452087402344, 0.033542633056640625, 0.035782814025878906, 0.03802299499511719, 0.04026317596435547, 0.04250335693359375, 0.04474353790283203, 0.04698371887207031, 0.049223899841308594, 0.051464080810546875, 0.053704261779785156, 0.05594444274902344, 0.05818462371826172, 0.0604248046875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 21.0, 31.0, 111.0, 282.0, 277.0, 191.0, 71.0, 17.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0021979815792292356, -0.0021110076922923326, -0.002024033572524786, -0.001937059685587883, -0.0018500856822356582, -0.0017631116788834333, -0.0016761377919465303, -0.0015891637885943055, -0.0015021897852420807, -0.0014152157818898559, -0.001328241778537631, -0.001241267891600728, -0.0011542938882485032, -0.0010673198848962784, -0.0009803459979593754, -0.0008933719946071506, -0.0008063979912549257, -0.0007194239879027009, -0.000632450042758137, -0.0005454760976135731, -0.00045850209426134825, -0.0003715281200129539, -0.0002845541457645595, -0.0001975802006199956, -0.00011060619726777077, -2.3632223019376397e-05, 6.334175122901797e-05, 0.00015031572547741234, 0.0002372896997258067, 0.0003242636739742011, 0.00041123764822259545, 0.0004982115933671594, 0.0005851858295500278, 0.0006721598329022527, 0.0007591337780468166, 0.0008461077231913805, 0.0009330817265436053, 0.0010200557298958302, 0.0011070296168327332, 0.001194003620184958, 0.0012809776235371828, 0.0013679516268894076, 0.0014549256302416325, 0.0015418995171785355, 0.0016288735205307603, 0.0017158475238829851, 0.0018028214108198881, 0.001889795414172113, 0.0019767694175243378, 0.0020637433044612408, 0.0021507174242287874, 0.0022376913111656904, 0.002324665430933237, 0.00241163931787014, 0.002498613204807043, 0.002585587091743946, 0.0026725612115114927, 0.0027595350984483957, 0.0028465092182159424, 0.0029334831051528454, 0.0030204569920897484, 0.003107431111857295, 0.003194404998794198, 0.0032813791185617447, 0.0033683530054986477]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 13.0, 15.0, 6.0, 13.0, 15.0, 15.0, 18.0, 21.0, 30.0, 19.0, 21.0, 28.0, 45.0, 34.0, 36.0, 37.0, 29.0, 33.0, 37.0, 40.0, 48.0, 36.0, 34.0, 35.0, 36.0, 31.0, 25.0, 28.0, 27.0, 30.0, 16.0, 21.0, 29.0, 19.0, 12.0, 8.0, 7.0, 17.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012203454971313477, -0.001184944063425064, -0.0011495426297187805, -0.001114141196012497, -0.0010787397623062134, -0.0010433383285999298, -0.0010079368948936462, -0.0009725354611873627, -0.0009371340274810791, -0.0009017325937747955, -0.000866331160068512, -0.0008309297263622284, -0.0007955282926559448, -0.0007601268589496613, -0.0007247254252433777, -0.0006893239915370941, -0.0006539225578308105, -0.000618521124124527, -0.0005831196904182434, -0.0005477182567119598, -0.0005123168230056763, -0.0004769153892993927, -0.00044151395559310913, -0.00040611252188682556, -0.000370711088180542, -0.0003353096544742584, -0.00029990822076797485, -0.0002645067870616913, -0.00022910535335540771, -0.00019370391964912415, -0.00015830248594284058, -0.000122901052236557, -8.749961853027344e-05, -5.209818482398987e-05, -1.66967511177063e-05, 1.870468258857727e-05, 5.410611629486084e-05, 8.950755000114441e-05, 0.00012490898370742798, 0.00016031041741371155, 0.00019571185111999512, 0.0002311132848262787, 0.00026651471853256226, 0.0003019161522388458, 0.0003373175859451294, 0.00037271901965141296, 0.00040812045335769653, 0.0004435218870639801, 0.00047892332077026367, 0.0005143247544765472, 0.0005497261881828308, 0.0005851276218891144, 0.000620529055595398, 0.0006559304893016815, 0.0006913319230079651, 0.0007267333567142487, 0.0007621347904205322, 0.0007975362241268158, 0.0008329376578330994, 0.0008683390915393829, 0.0009037405252456665, 0.0009391419589519501, 0.0009745433926582336, 0.0010099448263645172, 0.0010453462600708008]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 4.0, 10.0, 10.0, 6.0, 7.0, 17.0, 16.0, 16.0, 21.0, 28.0, 17.0, 30.0, 38.0, 33.0, 38.0, 34.0, 38.0, 28.0, 34.0, 37.0, 39.0, 43.0, 41.0, 38.0, 41.0, 32.0, 41.0, 30.0, 24.0, 28.0, 30.0, 24.0, 18.0, 13.0, 15.0, 17.0, 7.0, 15.0, 7.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.890625, -15.370361328125, -14.85009765625, -14.329833984375, -13.8095703125, -13.289306640625, -12.76904296875, -12.248779296875, -11.728515625, -11.208251953125, -10.68798828125, -10.167724609375, -9.6474609375, -9.127197265625, -8.60693359375, -8.086669921875, -7.56640625, -7.046142578125, -6.52587890625, -6.005615234375, -5.4853515625, -4.965087890625, -4.44482421875, -3.924560546875, -3.404296875, -2.884033203125, -2.36376953125, -1.843505859375, -1.3232421875, -0.802978515625, -0.28271484375, 0.237548828125, 0.7578125, 1.278076171875, 1.79833984375, 2.318603515625, 2.8388671875, 3.359130859375, 3.87939453125, 4.399658203125, 4.919921875, 5.440185546875, 5.96044921875, 6.480712890625, 7.0009765625, 7.521240234375, 8.04150390625, 8.561767578125, 9.08203125, 9.602294921875, 10.12255859375, 10.642822265625, 11.1630859375, 11.683349609375, 12.20361328125, 12.723876953125, 13.244140625, 13.764404296875, 14.28466796875, 14.804931640625, 15.3251953125, 15.845458984375, 16.36572265625, 16.885986328125, 17.40625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 8.0, 14.0, 12.0, 9.0, 17.0, 27.0, 24.0, 29.0, 38.0, 59.0, 128.0, 158.0, 292.0, 554.0, 1125.0, 2171.0, 4704.0, 11183.0, 26499.0, 69015.0, 201619.0, 420736.0, 196478.0, 67210.0, 26286.0, 10826.0, 4789.0, 2204.0, 1005.0, 554.0, 285.0, 146.0, 91.0, 55.0, 45.0, 29.0, 30.0, 19.0, 23.0, 17.0, 11.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.84375, -12.4224853515625, -12.001220703125, -11.5799560546875, -11.15869140625, -10.7374267578125, -10.316162109375, -9.8948974609375, -9.4736328125, -9.0523681640625, -8.631103515625, -8.2098388671875, -7.78857421875, -7.3673095703125, -6.946044921875, -6.5247802734375, -6.103515625, -5.6822509765625, -5.260986328125, -4.8397216796875, -4.41845703125, -3.9971923828125, -3.575927734375, -3.1546630859375, -2.7333984375, -2.3121337890625, -1.890869140625, -1.4696044921875, -1.04833984375, -0.6270751953125, -0.205810546875, 0.2154541015625, 0.63671875, 1.0579833984375, 1.479248046875, 1.9005126953125, 2.32177734375, 2.7430419921875, 3.164306640625, 3.5855712890625, 4.0068359375, 4.4281005859375, 4.849365234375, 5.2706298828125, 5.69189453125, 6.1131591796875, 6.534423828125, 6.9556884765625, 7.376953125, 7.7982177734375, 8.219482421875, 8.6407470703125, 9.06201171875, 9.4832763671875, 9.904541015625, 10.3258056640625, 10.7470703125, 11.1683349609375, 11.589599609375, 12.0108642578125, 12.43212890625, 12.8533935546875, 13.274658203125, 13.6959228515625, 14.1171875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 8.0, 6.0, 9.0, 11.0, 12.0, 22.0, 18.0, 17.0, 24.0, 21.0, 30.0, 35.0, 33.0, 36.0, 55.0, 58.0, 75.0, 236.0, 1700.0, 151.0, 53.0, 46.0, 45.0, 41.0, 37.0, 23.0, 27.0, 31.0, 23.0, 24.0, 21.0, 18.0, 17.0, 14.0, 9.0, 9.0, 3.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0], "bins": [-58.34375, -56.740234375, -55.13671875, -53.533203125, -51.9296875, -50.326171875, -48.72265625, -47.119140625, -45.515625, -43.912109375, -42.30859375, -40.705078125, -39.1015625, -37.498046875, -35.89453125, -34.291015625, -32.6875, -31.083984375, -29.48046875, -27.876953125, -26.2734375, -24.669921875, -23.06640625, -21.462890625, -19.859375, -18.255859375, -16.65234375, -15.048828125, -13.4453125, -11.841796875, -10.23828125, -8.634765625, -7.03125, -5.427734375, -3.82421875, -2.220703125, -0.6171875, 0.986328125, 2.58984375, 4.193359375, 5.796875, 7.400390625, 9.00390625, 10.607421875, 12.2109375, 13.814453125, 15.41796875, 17.021484375, 18.625, 20.228515625, 21.83203125, 23.435546875, 25.0390625, 26.642578125, 28.24609375, 29.849609375, 31.453125, 33.056640625, 34.66015625, 36.263671875, 37.8671875, 39.470703125, 41.07421875, 42.677734375, 44.28125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 9.0, 10.0, 6.0, 9.0, 11.0, 20.0, 29.0, 26.0, 46.0, 56.0, 54.0, 67.0, 102.0, 138.0, 187.0, 247.0, 368.0, 761.0, 5043.0, 2617612.0, 515721.0, 3174.0, 718.0, 363.0, 206.0, 183.0, 118.0, 93.0, 58.0, 69.0, 34.0, 32.0, 33.0, 19.0, 21.0, 14.0, 7.0, 6.0, 5.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.625, -79.86328125, -77.1015625, -74.33984375, -71.578125, -68.81640625, -66.0546875, -63.29296875, -60.53125, -57.76953125, -55.0078125, -52.24609375, -49.484375, -46.72265625, -43.9609375, -41.19921875, -38.4375, -35.67578125, -32.9140625, -30.15234375, -27.390625, -24.62890625, -21.8671875, -19.10546875, -16.34375, -13.58203125, -10.8203125, -8.05859375, -5.296875, -2.53515625, 0.2265625, 2.98828125, 5.75, 8.51171875, 11.2734375, 14.03515625, 16.796875, 19.55859375, 22.3203125, 25.08203125, 27.84375, 30.60546875, 33.3671875, 36.12890625, 38.890625, 41.65234375, 44.4140625, 47.17578125, 49.9375, 52.69921875, 55.4609375, 58.22265625, 60.984375, 63.74609375, 66.5078125, 69.26953125, 72.03125, 74.79296875, 77.5546875, 80.31640625, 83.078125, 85.83984375, 88.6015625, 91.36328125, 94.125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 46.0, 415.0, 463.0, 88.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.51224899291992, -50.27079391479492, -44.02934265136719, -37.78788757324219, -31.546432495117188, -25.304977416992188, -19.063526153564453, -12.822071075439453, -6.580615997314453, -0.33916187286376953, 5.902292251586914, 12.143745422363281, 18.38520050048828, 24.62665557861328, 30.868106842041016, 37.109561920166016, 43.351016998291016, 49.592472076416016, 55.83392333984375, 62.07537841796875, 68.31683349609375, 74.55828857421875, 80.79974365234375, 87.04119873046875, 93.28265380859375, 99.52410888671875, 105.76556396484375, 112.00701904296875, 118.24847412109375, 124.48992919921875, 130.73138427734375, 136.97283935546875, 143.21429443359375, 149.45574951171875, 155.69720458984375, 161.93865966796875, 168.18011474609375, 174.42156982421875, 180.66302490234375, 186.90447998046875, 193.14593505859375, 199.38739013671875, 205.62884521484375, 211.87030029296875, 218.11175537109375, 224.35321044921875, 230.59466552734375, 236.83612060546875, 243.0775604248047, 249.3190155029297, 255.5604705810547, 261.8019104003906, 268.0433654785156, 274.2848205566406, 280.5262756347656, 286.7677307128906, 293.0091857910156, 299.2506408691406, 305.4920959472656, 311.7335510253906, 317.9750061035156, 324.2164611816406, 330.4579162597656, 336.6993713378906, 342.9408264160156]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 9.0, 17.0, 16.0, 16.0, 24.0, 23.0, 39.0, 40.0, 38.0, 38.0, 47.0, 51.0, 53.0, 68.0, 47.0, 54.0, 57.0, 61.0, 42.0, 41.0, 29.0, 27.0, 31.0, 18.0, 22.0, 15.0, 15.0, 14.0, 9.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-178.88841247558594, -173.8727569580078, -168.8571014404297, -163.84144592285156, -158.82579040527344, -153.8101348876953, -148.7944793701172, -143.77882385253906, -138.76316833496094, -133.7475128173828, -128.7318572998047, -123.71620178222656, -118.70054626464844, -113.68489074707031, -108.66923522949219, -103.65357971191406, -98.63792419433594, -93.62226867675781, -88.60661315917969, -83.59095764160156, -78.57530212402344, -73.55964660644531, -68.54399108886719, -63.52833557128906, -58.51268005371094, -53.49702453613281, -48.48136901855469, -43.46571350097656, -38.45005798339844, -33.43440246582031, -28.418746948242188, -23.403091430664062, -18.387451171875, -13.371795654296875, -8.35614013671875, -3.340484619140625, 1.6751708984375, 6.690826416015625, 11.70648193359375, 16.722137451171875, 21.73779296875, 26.753448486328125, 31.76910400390625, 36.784759521484375, 41.8004150390625, 46.816070556640625, 51.83172607421875, 56.847381591796875, 61.863037109375, 66.87869262695312, 71.89434814453125, 76.91000366210938, 81.9256591796875, 86.94131469726562, 91.95697021484375, 96.97262573242188, 101.98828125, 107.00393676757812, 112.01959228515625, 117.03524780273438, 122.0509033203125, 127.06655883789062, 132.08221435546875, 137.09786987304688, 142.113525390625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 9.0, 5.0, 10.0, 9.0, 11.0, 8.0, 10.0, 19.0, 18.0, 22.0, 31.0, 21.0, 42.0, 30.0, 42.0, 35.0, 34.0, 37.0, 41.0, 36.0, 37.0, 35.0, 30.0, 51.0, 48.0, 33.0, 40.0, 31.0, 32.0, 23.0, 30.0, 18.0, 13.0, 19.0, 17.0, 15.0, 9.0, 17.0, 4.0, 4.0, 8.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.204833984375, -15.65966796875, -15.114501953125, -14.5693359375, -14.024169921875, -13.47900390625, -12.933837890625, -12.388671875, -11.843505859375, -11.29833984375, -10.753173828125, -10.2080078125, -9.662841796875, -9.11767578125, -8.572509765625, -8.02734375, -7.482177734375, -6.93701171875, -6.391845703125, -5.8466796875, -5.301513671875, -4.75634765625, -4.211181640625, -3.666015625, -3.120849609375, -2.57568359375, -2.030517578125, -1.4853515625, -0.940185546875, -0.39501953125, 0.150146484375, 0.6953125, 1.240478515625, 1.78564453125, 2.330810546875, 2.8759765625, 3.421142578125, 3.96630859375, 4.511474609375, 5.056640625, 5.601806640625, 6.14697265625, 6.692138671875, 7.2373046875, 7.782470703125, 8.32763671875, 8.872802734375, 9.41796875, 9.963134765625, 10.50830078125, 11.053466796875, 11.5986328125, 12.143798828125, 12.68896484375, 13.234130859375, 13.779296875, 14.324462890625, 14.86962890625, 15.414794921875, 15.9599609375, 16.505126953125, 17.05029296875, 17.595458984375, 18.140625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 3.0, 5.0, 5.0, 5.0, 14.0, 11.0, 7.0, 20.0, 19.0, 16.0, 30.0, 30.0, 37.0, 45.0, 61.0, 66.0, 90.0, 183.0, 384.0, 1055.0, 6372.0, 237729.0, 3599767.0, 338325.0, 7775.0, 1125.0, 400.0, 201.0, 114.0, 84.0, 54.0, 47.0, 33.0, 22.0, 31.0, 18.0, 18.0, 16.0, 11.0, 12.0, 7.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -49.33349609375, -47.5419921875, -45.75048828125, -43.958984375, -42.16748046875, -40.3759765625, -38.58447265625, -36.79296875, -35.00146484375, -33.2099609375, -31.41845703125, -29.626953125, -27.83544921875, -26.0439453125, -24.25244140625, -22.4609375, -20.66943359375, -18.8779296875, -17.08642578125, -15.294921875, -13.50341796875, -11.7119140625, -9.92041015625, -8.12890625, -6.33740234375, -4.5458984375, -2.75439453125, -0.962890625, 0.82861328125, 2.6201171875, 4.41162109375, 6.203125, 7.99462890625, 9.7861328125, 11.57763671875, 13.369140625, 15.16064453125, 16.9521484375, 18.74365234375, 20.53515625, 22.32666015625, 24.1181640625, 25.90966796875, 27.701171875, 29.49267578125, 31.2841796875, 33.07568359375, 34.8671875, 36.65869140625, 38.4501953125, 40.24169921875, 42.033203125, 43.82470703125, 45.6162109375, 47.40771484375, 49.19921875, 50.99072265625, 52.7822265625, 54.57373046875, 56.365234375, 58.15673828125, 59.9482421875, 61.73974609375, 63.53125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 8.0, 11.0, 15.0, 17.0, 21.0, 26.0, 34.0, 32.0, 44.0, 49.0, 63.0, 79.0, 138.0, 186.0, 247.0, 386.0, 494.0, 516.0, 486.0, 307.0, 225.0, 164.0, 141.0, 87.0, 65.0, 62.0, 36.0, 31.0, 25.0, 12.0, 14.0, 14.0, 8.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.71875, -28.73828125, -27.7578125, -26.77734375, -25.796875, -24.81640625, -23.8359375, -22.85546875, -21.875, -20.89453125, -19.9140625, -18.93359375, -17.953125, -16.97265625, -15.9921875, -15.01171875, -14.03125, -13.05078125, -12.0703125, -11.08984375, -10.109375, -9.12890625, -8.1484375, -7.16796875, -6.1875, -5.20703125, -4.2265625, -3.24609375, -2.265625, -1.28515625, -0.3046875, 0.67578125, 1.65625, 2.63671875, 3.6171875, 4.59765625, 5.578125, 6.55859375, 7.5390625, 8.51953125, 9.5, 10.48046875, 11.4609375, 12.44140625, 13.421875, 14.40234375, 15.3828125, 16.36328125, 17.34375, 18.32421875, 19.3046875, 20.28515625, 21.265625, 22.24609375, 23.2265625, 24.20703125, 25.1875, 26.16796875, 27.1484375, 28.12890625, 29.109375, 30.08984375, 31.0703125, 32.05078125, 33.03125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 8.0, 3.0, 10.0, 13.0, 10.0, 22.0, 17.0, 31.0, 55.0, 74.0, 81.0, 102.0, 155.0, 242.0, 331.0, 674.0, 4452.0, 4180730.0, 5460.0, 644.0, 301.0, 197.0, 144.0, 128.0, 93.0, 73.0, 55.0, 37.0, 35.0, 16.0, 27.0, 13.0, 9.0, 10.0, 8.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-284.75, -276.5, -268.25, -260.0, -251.75, -243.5, -235.25, -227.0, -218.75, -210.5, -202.25, -194.0, -185.75, -177.5, -169.25, -161.0, -152.75, -144.5, -136.25, -128.0, -119.75, -111.5, -103.25, -95.0, -86.75, -78.5, -70.25, -62.0, -53.75, -45.5, -37.25, -29.0, -20.75, -12.5, -4.25, 4.0, 12.25, 20.5, 28.75, 37.0, 45.25, 53.5, 61.75, 70.0, 78.25, 86.5, 94.75, 103.0, 111.25, 119.5, 127.75, 136.0, 144.25, 152.5, 160.75, 169.0, 177.25, 185.5, 193.75, 202.0, 210.25, 218.5, 226.75, 235.0, 243.25]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 158.0, 608.0, 228.0, 19.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-482.3219909667969, -468.36419677734375, -454.4063720703125, -440.4485778808594, -426.49078369140625, -412.532958984375, -398.5751647949219, -384.61737060546875, -370.6595458984375, -356.7017517089844, -342.7439270019531, -328.7861328125, -314.8283386230469, -300.8705139160156, -286.9127197265625, -272.95489501953125, -258.99713134765625, -245.03932189941406, -231.08152770996094, -217.12371826171875, -203.16590881347656, -189.20809936523438, -175.25030517578125, -161.29249572753906, -147.33468627929688, -133.3768768310547, -119.41907501220703, -105.46127319335938, -91.50346374511719, -77.54566192626953, -63.587860107421875, -49.63005065917969, -35.6722412109375, -21.714435577392578, -7.756631851196289, 6.201171875, 20.158977508544922, 34.116783142089844, 48.0745849609375, 62.03239440917969, 75.99019622802734, 89.947998046875, 103.90580749511719, 117.86360931396484, 131.8214111328125, 145.7792205810547, 159.73703002929688, 173.69482421875, 187.6526336669922, 201.61044311523438, 215.5682373046875, 229.5260467529297, 243.48385620117188, 257.441650390625, 271.39947509765625, 285.3572692871094, 299.3150634765625, 313.2728576660156, 327.2306823730469, 341.1884765625, 355.1462707519531, 369.1040954589844, 383.0618896484375, 397.01971435546875, 410.9775085449219]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 7.0, 3.0, 8.0, 6.0, 3.0, 10.0, 11.0, 10.0, 22.0, 23.0, 26.0, 32.0, 33.0, 36.0, 39.0, 38.0, 38.0, 39.0, 46.0, 47.0, 48.0, 56.0, 38.0, 41.0, 39.0, 36.0, 36.0, 26.0, 33.0, 25.0, 27.0, 25.0, 22.0, 20.0, 10.0, 5.0, 8.0, 8.0, 7.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-145.69122314453125, -141.64866638183594, -137.60610961914062, -133.56356811523438, -129.52101135253906, -125.47845458984375, -121.43589782714844, -117.39334106445312, -113.35078430175781, -109.3082275390625, -105.26567840576172, -101.2231216430664, -97.1805648803711, -93.13801574707031, -89.095458984375, -85.05290222167969, -81.0103530883789, -76.9677963256836, -72.92524719238281, -68.8826904296875, -64.84013366699219, -60.79758071899414, -56.755027770996094, -52.71247100830078, -48.669918060302734, -44.62736511230469, -40.584808349609375, -36.54225540161133, -32.49970245361328, -28.45714569091797, -24.414592742919922, -20.372037887573242, -16.329483032226562, -12.286928176879883, -8.24437427520752, -4.201820373535156, -0.15926551818847656, 3.883289337158203, 7.92584228515625, 11.96839714050293, 16.01095199584961, 20.05350685119629, 24.09606170654297, 28.138614654541016, 32.18116760253906, 36.223724365234375, 40.26627731323242, 44.30883026123047, 48.35138702392578, 52.39393997192383, 56.43649673461914, 60.47904968261719, 64.5216064453125, 68.56416320800781, 72.6067123413086, 76.6492691040039, 80.69181823730469, 84.734375, 88.77692413330078, 92.8194808959961, 96.8620376586914, 100.90458679199219, 104.9471435546875, 108.98970031738281, 113.03225708007812]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 11.0, 10.0, 9.0, 16.0, 11.0, 13.0, 26.0, 27.0, 25.0, 30.0, 29.0, 33.0, 32.0, 47.0, 34.0, 30.0, 38.0, 46.0, 47.0, 28.0, 48.0, 31.0, 35.0, 41.0, 37.0, 33.0, 34.0, 19.0, 16.0, 25.0, 20.0, 19.0, 14.0, 12.0, 15.0, 12.0, 11.0, 4.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-17.859375, -17.325927734375, -16.79248046875, -16.259033203125, -15.7255859375, -15.192138671875, -14.65869140625, -14.125244140625, -13.591796875, -13.058349609375, -12.52490234375, -11.991455078125, -11.4580078125, -10.924560546875, -10.39111328125, -9.857666015625, -9.32421875, -8.790771484375, -8.25732421875, -7.723876953125, -7.1904296875, -6.656982421875, -6.12353515625, -5.590087890625, -5.056640625, -4.523193359375, -3.98974609375, -3.456298828125, -2.9228515625, -2.389404296875, -1.85595703125, -1.322509765625, -0.7890625, -0.255615234375, 0.27783203125, 0.811279296875, 1.3447265625, 1.878173828125, 2.41162109375, 2.945068359375, 3.478515625, 4.011962890625, 4.54541015625, 5.078857421875, 5.6123046875, 6.145751953125, 6.67919921875, 7.212646484375, 7.74609375, 8.279541015625, 8.81298828125, 9.346435546875, 9.8798828125, 10.413330078125, 10.94677734375, 11.480224609375, 12.013671875, 12.547119140625, 13.08056640625, 13.614013671875, 14.1474609375, 14.680908203125, 15.21435546875, 15.747802734375, 16.28125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 6.0, 18.0, 21.0, 22.0, 41.0, 51.0, 72.0, 113.0, 197.0, 256.0, 397.0, 562.0, 951.0, 1356.0, 2221.0, 3521.0, 5464.0, 8862.0, 14337.0, 23814.0, 41406.0, 75537.0, 151592.0, 369662.0, 161674.0, 78633.0, 42792.0, 24893.0, 14987.0, 9208.0, 5782.0, 3605.0, 2330.0, 1439.0, 926.0, 596.0, 406.0, 251.0, 182.0, 140.0, 64.0, 51.0, 35.0, 22.0, 21.0, 11.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.651123046875, -4.49365234375, -4.336181640625, -4.1787109375, -4.021240234375, -3.86376953125, -3.706298828125, -3.548828125, -3.391357421875, -3.23388671875, -3.076416015625, -2.9189453125, -2.761474609375, -2.60400390625, -2.446533203125, -2.2890625, -2.131591796875, -1.97412109375, -1.816650390625, -1.6591796875, -1.501708984375, -1.34423828125, -1.186767578125, -1.029296875, -0.871826171875, -0.71435546875, -0.556884765625, -0.3994140625, -0.241943359375, -0.08447265625, 0.072998046875, 0.23046875, 0.387939453125, 0.54541015625, 0.702880859375, 0.8603515625, 1.017822265625, 1.17529296875, 1.332763671875, 1.490234375, 1.647705078125, 1.80517578125, 1.962646484375, 2.1201171875, 2.277587890625, 2.43505859375, 2.592529296875, 2.75, 2.907470703125, 3.06494140625, 3.222412109375, 3.3798828125, 3.537353515625, 3.69482421875, 3.852294921875, 4.009765625, 4.167236328125, 4.32470703125, 4.482177734375, 4.6396484375, 4.797119140625, 4.95458984375, 5.112060546875, 5.26953125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 12.0, 9.0, 11.0, 19.0, 16.0, 16.0, 22.0, 19.0, 22.0, 20.0, 21.0, 26.0, 39.0, 35.0, 46.0, 32.0, 39.0, 42.0, 1056.0, 38.0, 38.0, 49.0, 46.0, 36.0, 43.0, 36.0, 32.0, 25.0, 26.0, 24.0, 21.0, 14.0, 12.0, 13.0, 15.0, 10.0, 9.0, 4.0, 5.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.03125, -10.68359375, -10.3359375, -9.98828125, -9.640625, -9.29296875, -8.9453125, -8.59765625, -8.25, -7.90234375, -7.5546875, -7.20703125, -6.859375, -6.51171875, -6.1640625, -5.81640625, -5.46875, -5.12109375, -4.7734375, -4.42578125, -4.078125, -3.73046875, -3.3828125, -3.03515625, -2.6875, -2.33984375, -1.9921875, -1.64453125, -1.296875, -0.94921875, -0.6015625, -0.25390625, 0.09375, 0.44140625, 0.7890625, 1.13671875, 1.484375, 1.83203125, 2.1796875, 2.52734375, 2.875, 3.22265625, 3.5703125, 3.91796875, 4.265625, 4.61328125, 4.9609375, 5.30859375, 5.65625, 6.00390625, 6.3515625, 6.69921875, 7.046875, 7.39453125, 7.7421875, 8.08984375, 8.4375, 8.78515625, 9.1328125, 9.48046875, 9.828125, 10.17578125, 10.5234375, 10.87109375, 11.21875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 9.0, 19.0, 16.0, 31.0, 44.0, 58.0, 82.0, 107.0, 154.0, 228.0, 353.0, 449.0, 699.0, 996.0, 1515.0, 2234.0, 3304.0, 5215.0, 8080.0, 12583.0, 19769.0, 31235.0, 50882.0, 89075.0, 174961.0, 1369829.0, 135000.0, 72879.0, 42722.0, 26529.0, 16778.0, 10672.0, 7048.0, 4499.0, 2903.0, 2002.0, 1297.0, 896.0, 567.0, 444.0, 284.0, 215.0, 130.0, 101.0, 69.0, 53.0, 30.0, 28.0, 20.0, 10.0, 8.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-4.421875, -4.28509521484375, -4.1483154296875, -4.01153564453125, -3.874755859375, -3.73797607421875, -3.6011962890625, -3.46441650390625, -3.32763671875, -3.19085693359375, -3.0540771484375, -2.91729736328125, -2.780517578125, -2.64373779296875, -2.5069580078125, -2.37017822265625, -2.2333984375, -2.09661865234375, -1.9598388671875, -1.82305908203125, -1.686279296875, -1.54949951171875, -1.4127197265625, -1.27593994140625, -1.13916015625, -1.00238037109375, -0.8656005859375, -0.72882080078125, -0.592041015625, -0.45526123046875, -0.3184814453125, -0.18170166015625, -0.044921875, 0.09185791015625, 0.2286376953125, 0.36541748046875, 0.502197265625, 0.63897705078125, 0.7757568359375, 0.91253662109375, 1.04931640625, 1.18609619140625, 1.3228759765625, 1.45965576171875, 1.596435546875, 1.73321533203125, 1.8699951171875, 2.00677490234375, 2.1435546875, 2.28033447265625, 2.4171142578125, 2.55389404296875, 2.690673828125, 2.82745361328125, 2.9642333984375, 3.10101318359375, 3.23779296875, 3.37457275390625, 3.5113525390625, 3.64813232421875, 3.784912109375, 3.92169189453125, 4.0584716796875, 4.19525146484375, 4.33203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 7.0, 19.0, 15.0, 22.0, 15.0, 25.0, 35.0, 36.0, 53.0, 51.0, 70.0, 79.0, 85.0, 74.0, 60.0, 45.0, 43.0, 42.0, 39.0, 19.0, 19.0, 20.0, 17.0, 14.0, 13.0, 9.0, 7.0, 7.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0034008026123046875, -0.003298431634902954, -0.0031960606575012207, -0.0030936896800994873, -0.002991318702697754, -0.0028889477252960205, -0.002786576747894287, -0.0026842057704925537, -0.0025818347930908203, -0.002479463815689087, -0.0023770928382873535, -0.00227472186088562, -0.0021723508834838867, -0.0020699799060821533, -0.00196760892868042, -0.0018652379512786865, -0.0017628669738769531, -0.0016604959964752197, -0.0015581250190734863, -0.001455754041671753, -0.0013533830642700195, -0.0012510120868682861, -0.0011486411094665527, -0.0010462701320648193, -0.0009438991546630859, -0.0008415281772613525, -0.0007391571998596191, -0.0006367862224578857, -0.0005344152450561523, -0.00043204426765441895, -0.00032967329025268555, -0.00022730231285095215, -0.00012493133544921875, -2.256035804748535e-05, 7.981061935424805e-05, 0.00018218159675598145, 0.00028455257415771484, 0.00038692355155944824, 0.0004892945289611816, 0.000591665506362915, 0.0006940364837646484, 0.0007964074611663818, 0.0008987784385681152, 0.0010011494159698486, 0.001103520393371582, 0.0012058913707733154, 0.0013082623481750488, 0.0014106333255767822, 0.0015130043029785156, 0.001615375280380249, 0.0017177462577819824, 0.0018201172351837158, 0.0019224882125854492, 0.0020248591899871826, 0.002127230167388916, 0.0022296011447906494, 0.002331972122192383, 0.002434343099594116, 0.0025367140769958496, 0.002639085054397583, 0.0027414560317993164, 0.00284382700920105, 0.002946197986602783, 0.0030485689640045166, 0.00315093994140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 7.0, 7.0, 11.0, 10.0, 15.0, 14.0, 18.0, 24.0, 21.0, 41.0, 49.0, 62.0, 88.0, 181.0, 530.0, 76341.0, 969852.0, 640.0, 246.0, 92.0, 69.0, 44.0, 40.0, 25.0, 18.0, 18.0, 19.0, 13.0, 8.0, 8.0, 5.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0833740234375, -0.08050823211669922, -0.07764244079589844, -0.07477664947509766, -0.07191085815429688, -0.0690450668334961, -0.06617927551269531, -0.06331348419189453, -0.06044769287109375, -0.05758190155029297, -0.05471611022949219, -0.051850318908691406, -0.048984527587890625, -0.046118736267089844, -0.04325294494628906, -0.04038715362548828, -0.0375213623046875, -0.03465557098388672, -0.03178977966308594, -0.028923988342285156, -0.026058197021484375, -0.023192405700683594, -0.020326614379882812, -0.01746082305908203, -0.01459503173828125, -0.011729240417480469, -0.008863449096679688, -0.005997657775878906, -0.003131866455078125, -0.00026607513427734375, 0.0025997161865234375, 0.005465507507324219, 0.008331298828125, 0.011197090148925781, 0.014062881469726562, 0.016928672790527344, 0.019794464111328125, 0.022660255432128906, 0.025526046752929688, 0.02839183807373047, 0.03125762939453125, 0.03412342071533203, 0.03698921203613281, 0.039855003356933594, 0.042720794677734375, 0.045586585998535156, 0.04845237731933594, 0.05131816864013672, 0.0541839599609375, 0.05704975128173828, 0.05991554260253906, 0.06278133392333984, 0.06564712524414062, 0.0685129165649414, 0.07137870788574219, 0.07424449920654297, 0.07711029052734375, 0.07997608184814453, 0.08284187316894531, 0.0857076644897461, 0.08857345581054688, 0.09143924713134766, 0.09430503845214844, 0.09717082977294922, 0.10003662109375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 13.0, 314.0, 622.0, 64.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005202746484428644, -0.004958020988851786, -0.0047132959589362144, -0.004468570463359356, -0.004223844967782497, -0.003979119472205639, -0.003734394209459424, -0.003489668946713209, -0.0032449434511363506, -0.003000217955559492, -0.0027554926928132772, -0.0025107674300670624, -0.002266041934490204, -0.0020213164389133453, -0.0017765911761671305, -0.0015318657970055938, -0.001287140417844057, -0.0010424150386825204, -0.0007976896595209837, -0.000552964280359447, -0.0003082389011979103, -6.351352203637362e-05, 0.00018121185712516308, 0.00042593723628669977, 0.0006706626154482365, 0.0009153879946097732, 0.0011601133737713099, 0.0014048387529328465, 0.0016495641320943832, 0.00189428951125592, 0.0021390148904174566, 0.0023837401531636715, 0.0026284651830792427, 0.0028731906786561012, 0.003117915941402316, 0.003362641204148531, 0.0036073666997253895, 0.003852092195302248, 0.004096817225217819, 0.004341542720794678, 0.004586268216371536, 0.004830993711948395, 0.005075719207525253, 0.0053204442374408245, 0.005565169733017683, 0.0058098952285945415, 0.006054620258510113, 0.006299345754086971, 0.00654407124966383, 0.006788796745240688, 0.007033522240817547, 0.007278247270733118, 0.007522972766309977, 0.007767698261886835, 0.008012423291802406, 0.008257148787379265, 0.008501874282956123, 0.008746599778532982, 0.00899132527410984, 0.009236050769686699, 0.009480776265263557, 0.009725500829517841, 0.0099702263250947, 0.010214951820671558, 0.010459677316248417]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 6.0, 3.0, 9.0, 11.0, 11.0, 15.0, 14.0, 14.0, 11.0, 14.0, 24.0, 24.0, 36.0, 31.0, 35.0, 22.0, 48.0, 42.0, 46.0, 27.0, 49.0, 43.0, 41.0, 49.0, 35.0, 23.0, 25.0, 39.0, 26.0, 25.0, 28.0, 31.0, 26.0, 21.0, 13.0, 20.0, 13.0, 10.0, 8.0, 5.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001732170581817627, -0.0016816258430480957, -0.0016310811042785645, -0.0015805363655090332, -0.001529991626739502, -0.0014794468879699707, -0.0014289021492004395, -0.0013783574104309082, -0.001327812671661377, -0.0012772679328918457, -0.0012267231941223145, -0.0011761784553527832, -0.001125633716583252, -0.0010750889778137207, -0.0010245442390441895, -0.0009739995002746582, -0.000923454761505127, -0.0008729100227355957, -0.0008223652839660645, -0.0007718205451965332, -0.000721275806427002, -0.0006707310676574707, -0.0006201863288879395, -0.0005696415901184082, -0.000519096851348877, -0.0004685521125793457, -0.00041800737380981445, -0.0003674626350402832, -0.00031691789627075195, -0.0002663731575012207, -0.00021582841873168945, -0.0001652836799621582, -0.00011473894119262695, -6.41942024230957e-05, -1.3649463653564453e-05, 3.68952751159668e-05, 8.744001388549805e-05, 0.0001379847526550293, 0.00018852949142456055, 0.0002390742301940918, 0.00028961896896362305, 0.0003401637077331543, 0.00039070844650268555, 0.0004412531852722168, 0.000491797924041748, 0.0005423426628112793, 0.0005928874015808105, 0.0006434321403503418, 0.000693976879119873, 0.0007445216178894043, 0.0007950663566589355, 0.0008456110954284668, 0.000896155834197998, 0.0009467005729675293, 0.0009972453117370605, 0.0010477900505065918, 0.001098334789276123, 0.0011488795280456543, 0.0011994242668151855, 0.0012499690055847168, 0.001300513744354248, 0.0013510584831237793, 0.0014016032218933105, 0.0014521479606628418, 0.001502692699432373]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 11.0, 10.0, 9.0, 16.0, 11.0, 13.0, 26.0, 27.0, 25.0, 30.0, 29.0, 33.0, 32.0, 47.0, 34.0, 30.0, 38.0, 46.0, 47.0, 28.0, 48.0, 31.0, 35.0, 41.0, 37.0, 33.0, 34.0, 19.0, 16.0, 25.0, 20.0, 19.0, 14.0, 12.0, 15.0, 12.0, 11.0, 4.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-17.859375, -17.325927734375, -16.79248046875, -16.259033203125, -15.7255859375, -15.192138671875, -14.65869140625, -14.125244140625, -13.591796875, -13.058349609375, -12.52490234375, -11.991455078125, -11.4580078125, -10.924560546875, -10.39111328125, -9.857666015625, -9.32421875, -8.790771484375, -8.25732421875, -7.723876953125, -7.1904296875, -6.656982421875, -6.12353515625, -5.590087890625, -5.056640625, -4.523193359375, -3.98974609375, -3.456298828125, -2.9228515625, -2.389404296875, -1.85595703125, -1.322509765625, -0.7890625, -0.255615234375, 0.27783203125, 0.811279296875, 1.3447265625, 1.878173828125, 2.41162109375, 2.945068359375, 3.478515625, 4.011962890625, 4.54541015625, 5.078857421875, 5.6123046875, 6.145751953125, 6.67919921875, 7.212646484375, 7.74609375, 8.279541015625, 8.81298828125, 9.346435546875, 9.8798828125, 10.413330078125, 10.94677734375, 11.480224609375, 12.013671875, 12.547119140625, 13.08056640625, 13.614013671875, 14.1474609375, 14.680908203125, 15.21435546875, 15.747802734375, 16.28125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 13.0, 12.0, 13.0, 23.0, 20.0, 23.0, 44.0, 53.0, 44.0, 85.0, 125.0, 151.0, 247.0, 406.0, 790.0, 2386.0, 13831.0, 121453.0, 743460.0, 144227.0, 16346.0, 2657.0, 805.0, 431.0, 256.0, 166.0, 125.0, 69.0, 52.0, 36.0, 44.0, 33.0, 21.0, 18.0, 16.0, 13.0, 13.0, 5.0, 6.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-34.78125, -33.744140625, -32.70703125, -31.669921875, -30.6328125, -29.595703125, -28.55859375, -27.521484375, -26.484375, -25.447265625, -24.41015625, -23.373046875, -22.3359375, -21.298828125, -20.26171875, -19.224609375, -18.1875, -17.150390625, -16.11328125, -15.076171875, -14.0390625, -13.001953125, -11.96484375, -10.927734375, -9.890625, -8.853515625, -7.81640625, -6.779296875, -5.7421875, -4.705078125, -3.66796875, -2.630859375, -1.59375, -0.556640625, 0.48046875, 1.517578125, 2.5546875, 3.591796875, 4.62890625, 5.666015625, 6.703125, 7.740234375, 8.77734375, 9.814453125, 10.8515625, 11.888671875, 12.92578125, 13.962890625, 15.0, 16.037109375, 17.07421875, 18.111328125, 19.1484375, 20.185546875, 21.22265625, 22.259765625, 23.296875, 24.333984375, 25.37109375, 26.408203125, 27.4453125, 28.482421875, 29.51953125, 30.556640625, 31.59375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 3.0, 8.0, 3.0, 8.0, 10.0, 8.0, 15.0, 14.0, 15.0, 24.0, 24.0, 29.0, 36.0, 47.0, 52.0, 53.0, 64.0, 93.0, 309.0, 1713.0, 114.0, 50.0, 44.0, 37.0, 43.0, 47.0, 38.0, 29.0, 27.0, 16.0, 15.0, 16.0, 15.0, 9.0, 12.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.53125, -52.45458984375, -50.3779296875, -48.30126953125, -46.224609375, -44.14794921875, -42.0712890625, -39.99462890625, -37.91796875, -35.84130859375, -33.7646484375, -31.68798828125, -29.611328125, -27.53466796875, -25.4580078125, -23.38134765625, -21.3046875, -19.22802734375, -17.1513671875, -15.07470703125, -12.998046875, -10.92138671875, -8.8447265625, -6.76806640625, -4.69140625, -2.61474609375, -0.5380859375, 1.53857421875, 3.615234375, 5.69189453125, 7.7685546875, 9.84521484375, 11.921875, 13.99853515625, 16.0751953125, 18.15185546875, 20.228515625, 22.30517578125, 24.3818359375, 26.45849609375, 28.53515625, 30.61181640625, 32.6884765625, 34.76513671875, 36.841796875, 38.91845703125, 40.9951171875, 43.07177734375, 45.1484375, 47.22509765625, 49.3017578125, 51.37841796875, 53.455078125, 55.53173828125, 57.6083984375, 59.68505859375, 61.76171875, 63.83837890625, 65.9150390625, 67.99169921875, 70.068359375, 72.14501953125, 74.2216796875, 76.29833984375, 78.375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 11.0, 12.0, 20.0, 12.0, 21.0, 28.0, 41.0, 38.0, 63.0, 122.0, 133.0, 307.0, 746.0, 6549.0, 3116716.0, 18825.0, 1083.0, 348.0, 200.0, 117.0, 79.0, 63.0, 41.0, 25.0, 18.0, 15.0, 15.0, 14.0, 10.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.125, -175.892578125, -170.66015625, -165.427734375, -160.1953125, -154.962890625, -149.73046875, -144.498046875, -139.265625, -134.033203125, -128.80078125, -123.568359375, -118.3359375, -113.103515625, -107.87109375, -102.638671875, -97.40625, -92.173828125, -86.94140625, -81.708984375, -76.4765625, -71.244140625, -66.01171875, -60.779296875, -55.546875, -50.314453125, -45.08203125, -39.849609375, -34.6171875, -29.384765625, -24.15234375, -18.919921875, -13.6875, -8.455078125, -3.22265625, 2.009765625, 7.2421875, 12.474609375, 17.70703125, 22.939453125, 28.171875, 33.404296875, 38.63671875, 43.869140625, 49.1015625, 54.333984375, 59.56640625, 64.798828125, 70.03125, 75.263671875, 80.49609375, 85.728515625, 90.9609375, 96.193359375, 101.42578125, 106.658203125, 111.890625, 117.123046875, 122.35546875, 127.587890625, 132.8203125, 138.052734375, 143.28515625, 148.517578125, 153.75]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 29.0, 666.0, 300.0, 19.0], "bins": [-805.7527465820312, -792.7086181640625, -779.66455078125, -766.6204223632812, -753.5762939453125, -740.5322265625, -727.4880981445312, -714.4439697265625, -701.39990234375, -688.3557739257812, -675.3117065429688, -662.267578125, -649.2234497070312, -636.1793823242188, -623.13525390625, -610.0911254882812, -597.0469970703125, -584.0028686523438, -570.9588012695312, -557.9146728515625, -544.8705444335938, -531.8264770507812, -518.7823486328125, -505.7382507324219, -492.69415283203125, -479.6500549316406, -466.6059265136719, -453.56182861328125, -440.5177307128906, -427.4736328125, -414.42950439453125, -401.3854064941406, -388.34130859375, -375.2972106933594, -362.2530822753906, -349.208984375, -336.1648864746094, -323.12078857421875, -310.07666015625, -297.0325622558594, -283.98846435546875, -270.9443664550781, -257.9002380371094, -244.85614013671875, -231.81204223632812, -218.76792907714844, -205.72381591796875, -192.67971801757812, -179.63558959960938, -166.5914764404297, -153.54737854003906, -140.50326538085938, -127.45915985107422, -114.41505432128906, -101.37094116210938, -88.32683563232422, -75.2827377319336, -62.23863220214844, -49.194522857666016, -36.150413513183594, -23.106307983398438, -10.062202453613281, 2.9819107055664062, 16.026016235351562, 29.07012176513672]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 10.0, 11.0, 17.0, 9.0, 12.0, 19.0, 16.0, 14.0, 21.0, 20.0, 32.0, 30.0, 29.0, 43.0, 37.0, 43.0, 45.0, 44.0, 47.0, 54.0, 53.0, 46.0, 43.0, 30.0, 32.0, 28.0, 24.0, 38.0, 14.0, 20.0, 19.0, 14.0, 18.0, 5.0, 14.0, 10.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-156.918701171875, -152.21511840820312, -147.5115203857422, -142.8079376220703, -138.10433959960938, -133.4007568359375, -128.69715881347656, -123.99357604980469, -119.28998565673828, -114.58639526367188, -109.88280487060547, -105.17921447753906, -100.47563171386719, -95.77203369140625, -91.06845092773438, -86.36486053466797, -81.66127014160156, -76.95767974853516, -72.25408935546875, -67.55049896240234, -62.8469123840332, -58.1433219909668, -53.439735412597656, -48.73614501953125, -44.032554626464844, -39.32896423339844, -34.62537384033203, -29.92178726196289, -25.218196868896484, -20.514606475830078, -15.811017990112305, -11.107429504394531, -6.403839111328125, -1.7002496719360352, 3.0033397674560547, 7.7069292068481445, 12.410518646240234, 17.11410903930664, 21.817697525024414, 26.521286010742188, 31.224876403808594, 35.928466796875, 40.632057189941406, 45.33564376831055, 50.03923416137695, 54.74282455444336, 59.4464111328125, 64.1500015258789, 68.85359191894531, 73.55718231201172, 78.26077270507812, 82.96436309814453, 87.66795349121094, 92.37153625488281, 97.07512664794922, 101.77871704101562, 106.48230743408203, 111.18589782714844, 115.88948822021484, 120.59307861328125, 125.29666137695312, 130.00025939941406, 134.70384216308594, 139.40744018554688, 144.11102294921875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 1.0, 10.0, 12.0, 10.0, 5.0, 10.0, 10.0, 21.0, 24.0, 21.0, 27.0, 28.0, 35.0, 33.0, 35.0, 32.0, 34.0, 38.0, 39.0, 37.0, 41.0, 43.0, 39.0, 39.0, 31.0, 39.0, 35.0, 30.0, 29.0, 29.0, 28.0, 17.0, 20.0, 17.0, 15.0, 13.0, 7.0, 8.0, 11.0, 8.0, 10.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0], "bins": [-18.75, -18.2060546875, -17.662109375, -17.1181640625, -16.57421875, -16.0302734375, -15.486328125, -14.9423828125, -14.3984375, -13.8544921875, -13.310546875, -12.7666015625, -12.22265625, -11.6787109375, -11.134765625, -10.5908203125, -10.046875, -9.5029296875, -8.958984375, -8.4150390625, -7.87109375, -7.3271484375, -6.783203125, -6.2392578125, -5.6953125, -5.1513671875, -4.607421875, -4.0634765625, -3.51953125, -2.9755859375, -2.431640625, -1.8876953125, -1.34375, -0.7998046875, -0.255859375, 0.2880859375, 0.83203125, 1.3759765625, 1.919921875, 2.4638671875, 3.0078125, 3.5517578125, 4.095703125, 4.6396484375, 5.18359375, 5.7275390625, 6.271484375, 6.8154296875, 7.359375, 7.9033203125, 8.447265625, 8.9912109375, 9.53515625, 10.0791015625, 10.623046875, 11.1669921875, 11.7109375, 12.2548828125, 12.798828125, 13.3427734375, 13.88671875, 14.4306640625, 14.974609375, 15.5185546875, 16.0625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 6.0, 4.0, 8.0, 9.0, 6.0, 16.0, 16.0, 20.0, 24.0, 29.0, 40.0, 45.0, 59.0, 84.0, 104.0, 131.0, 182.0, 278.0, 601.0, 1954.0, 15571.0, 627584.0, 3267788.0, 268435.0, 8492.0, 1330.0, 472.0, 262.0, 148.0, 127.0, 92.0, 70.0, 55.0, 51.0, 30.0, 18.0, 25.0, 24.0, 12.0, 22.0, 12.0, 4.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-48.3125, -46.72265625, -45.1328125, -43.54296875, -41.953125, -40.36328125, -38.7734375, -37.18359375, -35.59375, -34.00390625, -32.4140625, -30.82421875, -29.234375, -27.64453125, -26.0546875, -24.46484375, -22.875, -21.28515625, -19.6953125, -18.10546875, -16.515625, -14.92578125, -13.3359375, -11.74609375, -10.15625, -8.56640625, -6.9765625, -5.38671875, -3.796875, -2.20703125, -0.6171875, 0.97265625, 2.5625, 4.15234375, 5.7421875, 7.33203125, 8.921875, 10.51171875, 12.1015625, 13.69140625, 15.28125, 16.87109375, 18.4609375, 20.05078125, 21.640625, 23.23046875, 24.8203125, 26.41015625, 28.0, 29.58984375, 31.1796875, 32.76953125, 34.359375, 35.94921875, 37.5390625, 39.12890625, 40.71875, 42.30859375, 43.8984375, 45.48828125, 47.078125, 48.66796875, 50.2578125, 51.84765625, 53.4375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 2.0, 14.0, 6.0, 8.0, 22.0, 26.0, 36.0, 51.0, 75.0, 104.0, 134.0, 214.0, 346.0, 503.0, 650.0, 584.0, 490.0, 303.0, 160.0, 113.0, 75.0, 58.0, 35.0, 22.0, 16.0, 5.0, 7.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.74609375, -33.3984375, -32.05078125, -30.703125, -29.35546875, -28.0078125, -26.66015625, -25.3125, -23.96484375, -22.6171875, -21.26953125, -19.921875, -18.57421875, -17.2265625, -15.87890625, -14.53125, -13.18359375, -11.8359375, -10.48828125, -9.140625, -7.79296875, -6.4453125, -5.09765625, -3.75, -2.40234375, -1.0546875, 0.29296875, 1.640625, 2.98828125, 4.3359375, 5.68359375, 7.03125, 8.37890625, 9.7265625, 11.07421875, 12.421875, 13.76953125, 15.1171875, 16.46484375, 17.8125, 19.16015625, 20.5078125, 21.85546875, 23.203125, 24.55078125, 25.8984375, 27.24609375, 28.59375, 29.94140625, 31.2890625, 32.63671875, 33.984375, 35.33203125, 36.6796875, 38.02734375, 39.375, 40.72265625, 42.0703125, 43.41796875, 44.765625, 46.11328125, 47.4609375, 48.80859375, 50.15625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 7.0, 2.0, 6.0, 4.0, 9.0, 13.0, 19.0, 16.0, 24.0, 32.0, 45.0, 42.0, 57.0, 72.0, 102.0, 147.0, 185.0, 328.0, 662.0, 2906.0, 3475372.0, 710415.0, 2080.0, 587.0, 293.0, 192.0, 155.0, 106.0, 76.0, 58.0, 61.0, 35.0, 34.0, 31.0, 28.0, 18.0, 15.0, 9.0, 13.0, 10.0, 11.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-163.625, -157.548828125, -151.47265625, -145.396484375, -139.3203125, -133.244140625, -127.16796875, -121.091796875, -115.015625, -108.939453125, -102.86328125, -96.787109375, -90.7109375, -84.634765625, -78.55859375, -72.482421875, -66.40625, -60.330078125, -54.25390625, -48.177734375, -42.1015625, -36.025390625, -29.94921875, -23.873046875, -17.796875, -11.720703125, -5.64453125, 0.431640625, 6.5078125, 12.583984375, 18.66015625, 24.736328125, 30.8125, 36.888671875, 42.96484375, 49.041015625, 55.1171875, 61.193359375, 67.26953125, 73.345703125, 79.421875, 85.498046875, 91.57421875, 97.650390625, 103.7265625, 109.802734375, 115.87890625, 121.955078125, 128.03125, 134.107421875, 140.18359375, 146.259765625, 152.3359375, 158.412109375, 164.48828125, 170.564453125, 176.640625, 182.716796875, 188.79296875, 194.869140625, 200.9453125, 207.021484375, 213.09765625, 219.173828125, 225.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 62.0, 824.0, 125.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-935.62939453125, -912.601806640625, -889.5742797851562, -866.5466918945312, -843.5191650390625, -820.4915771484375, -797.4639892578125, -774.4364013671875, -751.4088745117188, -728.3812866210938, -705.353759765625, -682.326171875, -659.298583984375, -636.2710571289062, -613.2434692382812, -590.2159423828125, -567.1883544921875, -544.1607666015625, -521.1332397460938, -498.10565185546875, -475.0780944824219, -452.050537109375, -429.02294921875, -405.9953918457031, -382.96783447265625, -359.9402770996094, -336.9127197265625, -313.8851318359375, -290.8575744628906, -267.83001708984375, -244.8024444580078, -221.77487182617188, -198.74737548828125, -175.71981811523438, -152.69224548339844, -129.6646728515625, -106.63711547851562, -83.60955047607422, -60.58198547363281, -37.554412841796875, -14.52685546875, 8.500709533691406, 31.528274536132812, 54.55583953857422, 77.58340454101562, 100.61096954345703, 123.63853454589844, 146.66610717773438, 169.69366455078125, 192.72122192382812, 215.74879455566406, 238.7763671875, 261.8039245605469, 284.83148193359375, 307.85906982421875, 330.8866271972656, 353.9141845703125, 376.9417419433594, 399.96929931640625, 422.99688720703125, 446.0244445800781, 469.052001953125, 492.07958984375, 515.107177734375, 538.1347045898438]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 10.0, 9.0, 9.0, 15.0, 12.0, 12.0, 15.0, 24.0, 26.0, 25.0, 34.0, 35.0, 32.0, 38.0, 41.0, 39.0, 35.0, 49.0, 44.0, 54.0, 50.0, 43.0, 39.0, 30.0, 34.0, 34.0, 19.0, 29.0, 31.0, 25.0, 16.0, 16.0, 15.0, 16.0, 8.0, 8.0, 10.0, 8.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-136.6962890625, -132.9898223876953, -129.28334045410156, -125.57687377929688, -121.87039947509766, -118.16392517089844, -114.45745849609375, -110.75098419189453, -107.04450988769531, -103.3380355834961, -99.6315689086914, -95.92509460449219, -92.21862030029297, -88.51214599609375, -84.80567932128906, -81.09920501708984, -77.39273834228516, -73.68626403808594, -69.97979736328125, -66.27332305908203, -62.56684875488281, -58.86037826538086, -55.153907775878906, -51.44743347167969, -47.740962982177734, -44.03449249267578, -40.32801818847656, -36.62154769897461, -32.915077209472656, -29.208602905273438, -25.502132415771484, -21.7956600189209, -18.089187622070312, -14.382715225219727, -10.676243782043457, -6.9697723388671875, -3.2632999420166016, 0.4431724548339844, 4.1496429443359375, 7.856115341186523, 11.56258773803711, 15.269060134887695, 18.97553253173828, 22.682003021240234, 26.38847541809082, 30.094947814941406, 33.80141830444336, 37.50788879394531, 41.21436309814453, 44.920833587646484, 48.6273078918457, 52.333778381347656, 56.040252685546875, 59.74672317504883, 63.45319366455078, 67.15966796875, 70.86613464355469, 74.5726089477539, 78.2790756225586, 81.98554992675781, 85.69202423095703, 89.39849853515625, 93.10496520996094, 96.81143951416016, 100.51791381835938]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 5.0, 7.0, 7.0, 17.0, 20.0, 14.0, 15.0, 23.0, 16.0, 36.0, 26.0, 33.0, 33.0, 40.0, 32.0, 44.0, 47.0, 43.0, 41.0, 59.0, 37.0, 40.0, 43.0, 41.0, 36.0, 34.0, 26.0, 23.0, 33.0, 25.0, 22.0, 18.0, 12.0, 11.0, 11.0, 9.0, 7.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.76904296875, -19.1474609375, -18.52587890625, -17.904296875, -17.28271484375, -16.6611328125, -16.03955078125, -15.41796875, -14.79638671875, -14.1748046875, -13.55322265625, -12.931640625, -12.31005859375, -11.6884765625, -11.06689453125, -10.4453125, -9.82373046875, -9.2021484375, -8.58056640625, -7.958984375, -7.33740234375, -6.7158203125, -6.09423828125, -5.47265625, -4.85107421875, -4.2294921875, -3.60791015625, -2.986328125, -2.36474609375, -1.7431640625, -1.12158203125, -0.5, 0.12158203125, 0.7431640625, 1.36474609375, 1.986328125, 2.60791015625, 3.2294921875, 3.85107421875, 4.47265625, 5.09423828125, 5.7158203125, 6.33740234375, 6.958984375, 7.58056640625, 8.2021484375, 8.82373046875, 9.4453125, 10.06689453125, 10.6884765625, 11.31005859375, 11.931640625, 12.55322265625, 13.1748046875, 13.79638671875, 14.41796875, 15.03955078125, 15.6611328125, 16.28271484375, 16.904296875, 17.52587890625, 18.1474609375, 18.76904296875, 19.390625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 11.0, 17.0, 11.0, 22.0, 33.0, 38.0, 80.0, 120.0, 164.0, 266.0, 377.0, 603.0, 828.0, 1317.0, 2039.0, 3345.0, 5418.0, 8617.0, 13936.0, 22849.0, 38767.0, 68080.0, 128338.0, 342013.0, 192782.0, 91582.0, 50252.0, 29720.0, 17786.0, 10813.0, 6621.0, 4222.0, 2697.0, 1626.0, 1118.0, 692.0, 459.0, 278.0, 184.0, 154.0, 88.0, 59.0, 46.0, 24.0, 24.0, 13.0, 5.0, 11.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.339599609375, -5.17138671875, -5.003173828125, -4.8349609375, -4.666748046875, -4.49853515625, -4.330322265625, -4.162109375, -3.993896484375, -3.82568359375, -3.657470703125, -3.4892578125, -3.321044921875, -3.15283203125, -2.984619140625, -2.81640625, -2.648193359375, -2.47998046875, -2.311767578125, -2.1435546875, -1.975341796875, -1.80712890625, -1.638916015625, -1.470703125, -1.302490234375, -1.13427734375, -0.966064453125, -0.7978515625, -0.629638671875, -0.46142578125, -0.293212890625, -0.125, 0.043212890625, 0.21142578125, 0.379638671875, 0.5478515625, 0.716064453125, 0.88427734375, 1.052490234375, 1.220703125, 1.388916015625, 1.55712890625, 1.725341796875, 1.8935546875, 2.061767578125, 2.22998046875, 2.398193359375, 2.56640625, 2.734619140625, 2.90283203125, 3.071044921875, 3.2392578125, 3.407470703125, 3.57568359375, 3.743896484375, 3.912109375, 4.080322265625, 4.24853515625, 4.416748046875, 4.5849609375, 4.753173828125, 4.92138671875, 5.089599609375, 5.2578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 2.0, 2.0, 7.0, 5.0, 9.0, 9.0, 15.0, 22.0, 14.0, 13.0, 31.0, 22.0, 30.0, 38.0, 34.0, 28.0, 43.0, 41.0, 41.0, 48.0, 51.0, 1060.0, 30.0, 36.0, 42.0, 40.0, 44.0, 35.0, 38.0, 30.0, 17.0, 25.0, 21.0, 19.0, 15.0, 14.0, 9.0, 11.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.046875, -11.6595458984375, -11.272216796875, -10.8848876953125, -10.49755859375, -10.1102294921875, -9.722900390625, -9.3355712890625, -8.9482421875, -8.5609130859375, -8.173583984375, -7.7862548828125, -7.39892578125, -7.0115966796875, -6.624267578125, -6.2369384765625, -5.849609375, -5.4622802734375, -5.074951171875, -4.6876220703125, -4.30029296875, -3.9129638671875, -3.525634765625, -3.1383056640625, -2.7509765625, -2.3636474609375, -1.976318359375, -1.5889892578125, -1.20166015625, -0.8143310546875, -0.427001953125, -0.0396728515625, 0.34765625, 0.7349853515625, 1.122314453125, 1.5096435546875, 1.89697265625, 2.2843017578125, 2.671630859375, 3.0589599609375, 3.4462890625, 3.8336181640625, 4.220947265625, 4.6082763671875, 4.99560546875, 5.3829345703125, 5.770263671875, 6.1575927734375, 6.544921875, 6.9322509765625, 7.319580078125, 7.7069091796875, 8.09423828125, 8.4815673828125, 8.868896484375, 9.2562255859375, 9.6435546875, 10.0308837890625, 10.418212890625, 10.8055419921875, 11.19287109375, 11.5802001953125, 11.967529296875, 12.3548583984375, 12.7421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 16.0, 17.0, 26.0, 48.0, 44.0, 72.0, 102.0, 160.0, 219.0, 360.0, 449.0, 713.0, 1077.0, 1670.0, 2582.0, 3803.0, 6149.0, 9782.0, 15770.0, 25676.0, 43346.0, 74537.0, 138482.0, 1386455.0, 169360.0, 87740.0, 49952.0, 29498.0, 18058.0, 11195.0, 6952.0, 4415.0, 2889.0, 1847.0, 1144.0, 774.0, 551.0, 366.0, 271.0, 173.0, 110.0, 83.0, 68.0, 32.0, 29.0, 26.0, 15.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-4.99609375, -4.843017578125, -4.68994140625, -4.536865234375, -4.3837890625, -4.230712890625, -4.07763671875, -3.924560546875, -3.771484375, -3.618408203125, -3.46533203125, -3.312255859375, -3.1591796875, -3.006103515625, -2.85302734375, -2.699951171875, -2.546875, -2.393798828125, -2.24072265625, -2.087646484375, -1.9345703125, -1.781494140625, -1.62841796875, -1.475341796875, -1.322265625, -1.169189453125, -1.01611328125, -0.863037109375, -0.7099609375, -0.556884765625, -0.40380859375, -0.250732421875, -0.09765625, 0.055419921875, 0.20849609375, 0.361572265625, 0.5146484375, 0.667724609375, 0.82080078125, 0.973876953125, 1.126953125, 1.280029296875, 1.43310546875, 1.586181640625, 1.7392578125, 1.892333984375, 2.04541015625, 2.198486328125, 2.3515625, 2.504638671875, 2.65771484375, 2.810791015625, 2.9638671875, 3.116943359375, 3.27001953125, 3.423095703125, 3.576171875, 3.729248046875, 3.88232421875, 4.035400390625, 4.1884765625, 4.341552734375, 4.49462890625, 4.647705078125, 4.80078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 7.0, 9.0, 9.0, 14.0, 12.0, 18.0, 17.0, 22.0, 34.0, 38.0, 40.0, 46.0, 71.0, 73.0, 69.0, 72.0, 75.0, 66.0, 54.0, 42.0, 35.0, 29.0, 21.0, 16.0, 26.0, 10.0, 14.0, 12.0, 12.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003406524658203125, -0.0033034682273864746, -0.0032004117965698242, -0.003097355365753174, -0.0029942989349365234, -0.002891242504119873, -0.0027881860733032227, -0.0026851296424865723, -0.002582073211669922, -0.0024790167808532715, -0.002375960350036621, -0.0022729039192199707, -0.0021698474884033203, -0.00206679105758667, -0.0019637346267700195, -0.0018606781959533691, -0.0017576217651367188, -0.0016545653343200684, -0.001551508903503418, -0.0014484524726867676, -0.0013453960418701172, -0.0012423396110534668, -0.0011392831802368164, -0.001036226749420166, -0.0009331703186035156, -0.0008301138877868652, -0.0007270574569702148, -0.0006240010261535645, -0.0005209445953369141, -0.00041788816452026367, -0.0003148317337036133, -0.0002117753028869629, -0.0001087188720703125, -5.662441253662109e-06, 9.739398956298828e-05, 0.00020045042037963867, 0.00030350685119628906, 0.00040656328201293945, 0.0005096197128295898, 0.0006126761436462402, 0.0007157325744628906, 0.000818789005279541, 0.0009218454360961914, 0.0010249018669128418, 0.0011279582977294922, 0.0012310147285461426, 0.001334071159362793, 0.0014371275901794434, 0.0015401840209960938, 0.0016432404518127441, 0.0017462968826293945, 0.001849353313446045, 0.0019524097442626953, 0.0020554661750793457, 0.002158522605895996, 0.0022615790367126465, 0.002364635467529297, 0.0024676918983459473, 0.0025707483291625977, 0.002673804759979248, 0.0027768611907958984, 0.002879917621612549, 0.0029829740524291992, 0.0030860304832458496, 0.0031890869140625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 6.0, 16.0, 15.0, 25.0, 19.0, 29.0, 36.0, 48.0, 54.0, 67.0, 140.0, 276.0, 645.0, 5441.0, 1038427.0, 2015.0, 540.0, 249.0, 122.0, 93.0, 54.0, 41.0, 41.0, 21.0, 21.0, 18.0, 17.0, 9.0, 8.0, 10.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.077392578125, -0.07500362396240234, -0.07261466979980469, -0.07022571563720703, -0.06783676147460938, -0.06544780731201172, -0.06305885314941406, -0.060669898986816406, -0.05828094482421875, -0.055891990661621094, -0.05350303649902344, -0.05111408233642578, -0.048725128173828125, -0.04633617401123047, -0.04394721984863281, -0.041558265686035156, -0.0391693115234375, -0.036780357360839844, -0.03439140319824219, -0.03200244903564453, -0.029613494873046875, -0.02722454071044922, -0.024835586547851562, -0.022446632385253906, -0.02005767822265625, -0.017668724060058594, -0.015279769897460938, -0.012890815734863281, -0.010501861572265625, -0.008112907409667969, -0.0057239532470703125, -0.0033349990844726562, -0.000946044921875, 0.0014429092407226562, 0.0038318634033203125, 0.006220817565917969, 0.008609771728515625, 0.010998725891113281, 0.013387680053710938, 0.015776634216308594, 0.01816558837890625, 0.020554542541503906, 0.022943496704101562, 0.02533245086669922, 0.027721405029296875, 0.03011035919189453, 0.03249931335449219, 0.034888267517089844, 0.0372772216796875, 0.039666175842285156, 0.04205513000488281, 0.04444408416748047, 0.046833038330078125, 0.04922199249267578, 0.05161094665527344, 0.053999900817871094, 0.05638885498046875, 0.058777809143066406, 0.06116676330566406, 0.06355571746826172, 0.06594467163085938, 0.06833362579345703, 0.07072257995605469, 0.07311153411865234, 0.07550048828125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 86.0, 865.0, 64.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005491413176059723, -0.0050827511586248875, -0.004674088675528765, -0.004265426658093929, -0.00385676440782845, -0.003448102157562971, -0.0030394401401281357, -0.0026307778898626566, -0.0022221156395971775, -0.0018134533893316984, -0.0014047912554815412, -0.000996129121631384, -0.0005874668713659048, -0.00017880462110042572, 0.00022985739633440971, 0.0006385196465998888, 0.0010471818968653679, 0.001455844147130847, 0.0018645062809810042, 0.0022731684148311615, 0.0026818306650966406, 0.0030904929153621197, 0.003499154932796955, 0.003907817415893078, 0.004316479433327913, 0.004725141450762749, 0.0051338039338588715, 0.005542465951293707, 0.005951127968728542, 0.006359790451824665, 0.0067684524692595005, 0.007177114486694336, 0.007585776969790459, 0.007994439452886581, 0.00840310100466013, 0.008811763487756252, 0.009220425970852375, 0.009629087522625923, 0.010037750005722046, 0.010446412488818169, 0.010855074971914291, 0.011263737455010414, 0.011672399006783962, 0.012081061489880085, 0.012489723972976208, 0.012898385524749756, 0.013307048007845879, 0.013715710490942001, 0.01412437204271555, 0.014533034525811672, 0.01494169607758522, 0.015350358560681343, 0.015759021043777466, 0.01616768352687359, 0.01657634600996971, 0.016985006630420685, 0.017393669113516808, 0.01780233159661293, 0.018210994079709053, 0.018619656562805176, 0.01902831718325615, 0.019436979666352272, 0.019845642149448395, 0.020254304632544518, 0.02066296711564064]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 13.0, 10.0, 11.0, 19.0, 25.0, 18.0, 27.0, 48.0, 27.0, 28.0, 35.0, 41.0, 45.0, 51.0, 43.0, 42.0, 37.0, 65.0, 41.0, 46.0, 42.0, 38.0, 33.0, 25.0, 16.0, 24.0, 20.0, 22.0, 17.0, 15.0, 14.0, 12.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015761852264404297, -0.001519310288131237, -0.0014624353498220444, -0.0014055604115128517, -0.001348685473203659, -0.0012918105348944664, -0.0012349355965852737, -0.001178060658276081, -0.0011211857199668884, -0.0010643107816576958, -0.0010074358433485031, -0.0009505609050393105, -0.0008936859667301178, -0.0008368110284209251, -0.0007799360901117325, -0.0007230611518025398, -0.0006661862134933472, -0.0006093112751841545, -0.0005524363368749619, -0.0004955613985657692, -0.00043868646025657654, -0.0003818115219473839, -0.0003249365836381912, -0.00026806164532899857, -0.0002111867070198059, -0.00015431176871061325, -9.74368304014206e-05, -4.0561892092227936e-05, 1.631304621696472e-05, 7.318798452615738e-05, 0.00013006292283535004, 0.0001869378611445427, 0.00024381279945373535, 0.000300687737762928, 0.00035756267607212067, 0.0004144376143813133, 0.000471312552690506, 0.0005281874909996986, 0.0005850624293088913, 0.000641937367618084, 0.0006988123059272766, 0.0007556872442364693, 0.0008125621825456619, 0.0008694371208548546, 0.0009263120591640472, 0.00098318699747324, 0.0010400619357824326, 0.0010969368740916252, 0.0011538118124008179, 0.0012106867507100105, 0.0012675616890192032, 0.0013244366273283958, 0.0013813115656375885, 0.0014381865039467812, 0.0014950614422559738, 0.0015519363805651665, 0.0016088113188743591, 0.0016656862571835518, 0.0017225611954927444, 0.001779436133801937, 0.0018363110721111298, 0.0018931860104203224, 0.001950060948729515, 0.0020069358870387077, 0.0020638108253479004]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 5.0, 7.0, 7.0, 17.0, 20.0, 14.0, 15.0, 23.0, 16.0, 36.0, 26.0, 33.0, 33.0, 40.0, 32.0, 44.0, 47.0, 43.0, 41.0, 59.0, 37.0, 40.0, 43.0, 41.0, 36.0, 34.0, 26.0, 23.0, 33.0, 25.0, 22.0, 18.0, 12.0, 11.0, 11.0, 9.0, 7.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.76904296875, -19.1474609375, -18.52587890625, -17.904296875, -17.28271484375, -16.6611328125, -16.03955078125, -15.41796875, -14.79638671875, -14.1748046875, -13.55322265625, -12.931640625, -12.31005859375, -11.6884765625, -11.06689453125, -10.4453125, -9.82373046875, -9.2021484375, -8.58056640625, -7.958984375, -7.33740234375, -6.7158203125, -6.09423828125, -5.47265625, -4.85107421875, -4.2294921875, -3.60791015625, -2.986328125, -2.36474609375, -1.7431640625, -1.12158203125, -0.5, 0.12158203125, 0.7431640625, 1.36474609375, 1.986328125, 2.60791015625, 3.2294921875, 3.85107421875, 4.47265625, 5.09423828125, 5.7158203125, 6.33740234375, 6.958984375, 7.58056640625, 8.2021484375, 8.82373046875, 9.4453125, 10.06689453125, 10.6884765625, 11.31005859375, 11.931640625, 12.55322265625, 13.1748046875, 13.79638671875, 14.41796875, 15.03955078125, 15.6611328125, 16.28271484375, 16.904296875, 17.52587890625, 18.1474609375, 18.76904296875, 19.390625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 10.0, 10.0, 24.0, 32.0, 45.0, 40.0, 53.0, 69.0, 88.0, 132.0, 193.0, 236.0, 344.0, 484.0, 694.0, 1064.0, 3328.0, 32002.0, 860367.0, 136536.0, 8298.0, 1587.0, 836.0, 580.0, 410.0, 276.0, 212.0, 135.0, 113.0, 94.0, 58.0, 41.0, 30.0, 29.0, 19.0, 22.0, 15.0, 5.0, 12.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-51.3125, -49.74462890625, -48.1767578125, -46.60888671875, -45.041015625, -43.47314453125, -41.9052734375, -40.33740234375, -38.76953125, -37.20166015625, -35.6337890625, -34.06591796875, -32.498046875, -30.93017578125, -29.3623046875, -27.79443359375, -26.2265625, -24.65869140625, -23.0908203125, -21.52294921875, -19.955078125, -18.38720703125, -16.8193359375, -15.25146484375, -13.68359375, -12.11572265625, -10.5478515625, -8.97998046875, -7.412109375, -5.84423828125, -4.2763671875, -2.70849609375, -1.140625, 0.42724609375, 1.9951171875, 3.56298828125, 5.130859375, 6.69873046875, 8.2666015625, 9.83447265625, 11.40234375, 12.97021484375, 14.5380859375, 16.10595703125, 17.673828125, 19.24169921875, 20.8095703125, 22.37744140625, 23.9453125, 25.51318359375, 27.0810546875, 28.64892578125, 30.216796875, 31.78466796875, 33.3525390625, 34.92041015625, 36.48828125, 38.05615234375, 39.6240234375, 41.19189453125, 42.759765625, 44.32763671875, 45.8955078125, 47.46337890625, 49.03125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 6.0, 8.0, 7.0, 16.0, 20.0, 16.0, 20.0, 22.0, 33.0, 35.0, 29.0, 39.0, 41.0, 37.0, 42.0, 48.0, 74.0, 1527.0, 489.0, 83.0, 56.0, 40.0, 43.0, 38.0, 37.0, 37.0, 27.0, 32.0, 23.0, 26.0, 17.0, 11.0, 10.0, 12.0, 7.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 4.0, 5.0, 1.0, 3.0, 1.0], "bins": [-61.8125, -60.09521484375, -58.3779296875, -56.66064453125, -54.943359375, -53.22607421875, -51.5087890625, -49.79150390625, -48.07421875, -46.35693359375, -44.6396484375, -42.92236328125, -41.205078125, -39.48779296875, -37.7705078125, -36.05322265625, -34.3359375, -32.61865234375, -30.9013671875, -29.18408203125, -27.466796875, -25.74951171875, -24.0322265625, -22.31494140625, -20.59765625, -18.88037109375, -17.1630859375, -15.44580078125, -13.728515625, -12.01123046875, -10.2939453125, -8.57666015625, -6.859375, -5.14208984375, -3.4248046875, -1.70751953125, 0.009765625, 1.72705078125, 3.4443359375, 5.16162109375, 6.87890625, 8.59619140625, 10.3134765625, 12.03076171875, 13.748046875, 15.46533203125, 17.1826171875, 18.89990234375, 20.6171875, 22.33447265625, 24.0517578125, 25.76904296875, 27.486328125, 29.20361328125, 30.9208984375, 32.63818359375, 34.35546875, 36.07275390625, 37.7900390625, 39.50732421875, 41.224609375, 42.94189453125, 44.6591796875, 46.37646484375, 48.09375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 6.0, 0.0, 1.0, 4.0, 3.0, 7.0, 5.0, 8.0, 9.0, 12.0, 15.0, 16.0, 24.0, 29.0, 30.0, 33.0, 43.0, 55.0, 62.0, 109.0, 189.0, 390.0, 1411.0, 805861.0, 2334767.0, 1506.0, 435.0, 191.0, 110.0, 72.0, 60.0, 32.0, 39.0, 34.0, 31.0, 15.0, 19.0, 20.0, 13.0, 9.0, 10.0, 5.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.125, -131.267578125, -126.41015625, -121.552734375, -116.6953125, -111.837890625, -106.98046875, -102.123046875, -97.265625, -92.408203125, -87.55078125, -82.693359375, -77.8359375, -72.978515625, -68.12109375, -63.263671875, -58.40625, -53.548828125, -48.69140625, -43.833984375, -38.9765625, -34.119140625, -29.26171875, -24.404296875, -19.546875, -14.689453125, -9.83203125, -4.974609375, -0.1171875, 4.740234375, 9.59765625, 14.455078125, 19.3125, 24.169921875, 29.02734375, 33.884765625, 38.7421875, 43.599609375, 48.45703125, 53.314453125, 58.171875, 63.029296875, 67.88671875, 72.744140625, 77.6015625, 82.458984375, 87.31640625, 92.173828125, 97.03125, 101.888671875, 106.74609375, 111.603515625, 116.4609375, 121.318359375, 126.17578125, 131.033203125, 135.890625, 140.748046875, 145.60546875, 150.462890625, 155.3203125, 160.177734375, 165.03515625, 169.892578125, 174.75]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 65.0, 224.0, 358.0, 241.0, 91.0, 22.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.87594604492188, -116.76344299316406, -113.65093994140625, -110.53843688964844, -107.4259262084961, -104.31342315673828, -101.20092010498047, -98.08841705322266, -94.97590637207031, -91.8634033203125, -88.75090026855469, -85.63839721679688, -82.52588653564453, -79.41338348388672, -76.3008804321289, -73.1883773803711, -70.07587432861328, -66.96337127685547, -63.85086441040039, -60.73836135864258, -57.6258544921875, -54.51335144042969, -51.400848388671875, -48.28834533691406, -45.175838470458984, -42.06333541870117, -38.950828552246094, -35.83832550048828, -32.72582244873047, -29.61331558227539, -26.500812530517578, -23.388307571411133, -20.275802612304688, -17.163297653198242, -14.050793647766113, -10.938289642333984, -7.825784683227539, -4.713279724121094, -1.6007766723632812, 1.511728286743164, 4.624233245849609, 7.7367377281188965, 10.849242210388184, 13.961746215820312, 17.074251174926758, 20.186756134033203, 23.299259185791016, 26.41176414489746, 29.524269104003906, 32.63677215576172, 35.7492790222168, 38.86178207397461, 41.97428894042969, 45.0867919921875, 48.19929504394531, 51.311798095703125, 54.4243049621582, 57.536808013916016, 60.649314880371094, 63.761817932128906, 66.87432098388672, 69.98683166503906, 73.09933471679688, 76.21183776855469, 79.3243408203125]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 14.0, 13.0, 12.0, 14.0, 22.0, 15.0, 11.0, 27.0, 26.0, 32.0, 41.0, 41.0, 31.0, 22.0, 46.0, 44.0, 42.0, 39.0, 32.0, 30.0, 52.0, 38.0, 33.0, 34.0, 32.0, 37.0, 29.0, 26.0, 13.0, 17.0, 23.0, 15.0, 11.0, 13.0, 12.0, 8.0, 9.0, 4.0, 4.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-133.93182373046875, -129.73294067382812, -125.5340576171875, -121.33516693115234, -117.13628387451172, -112.9374008178711, -108.73851013183594, -104.53962707519531, -100.34074401855469, -96.14186096191406, -91.94297790527344, -87.74408721923828, -83.54520416259766, -79.34632110595703, -75.14743041992188, -70.94854736328125, -66.74966430664062, -62.55078125, -58.35189437866211, -54.15300750732422, -49.954124450683594, -45.75524139404297, -41.55635452270508, -37.35746765136719, -33.15858459472656, -28.959699630737305, -24.760814666748047, -20.56192970275879, -16.36304473876953, -12.164159774780273, -7.965274810791016, -3.766389846801758, 0.4324798583984375, 4.631364822387695, 8.830249786376953, 13.029134750366211, 17.22801971435547, 21.426904678344727, 25.625789642333984, 29.824674606323242, 34.0235595703125, 38.222442626953125, 42.421329498291016, 46.620216369628906, 50.81909942626953, 55.017982482910156, 59.21686935424805, 63.41575622558594, 67.61463928222656, 71.81352233886719, 76.01240539550781, 80.21129608154297, 84.4101791381836, 88.60906219482422, 92.80795288085938, 97.0068359375, 101.20571899414062, 105.40460205078125, 109.60348510742188, 113.80237579345703, 118.00125885009766, 122.20014190673828, 126.39903259277344, 130.59791564941406, 134.7967987060547]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 11.0, 14.0, 15.0, 15.0, 15.0, 16.0, 26.0, 21.0, 22.0, 34.0, 39.0, 31.0, 34.0, 39.0, 47.0, 40.0, 40.0, 33.0, 51.0, 53.0, 38.0, 37.0, 40.0, 34.0, 38.0, 28.0, 24.0, 25.0, 29.0, 16.0, 15.0, 15.0, 9.0, 15.0, 5.0, 4.0, 5.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.453125, -19.84228515625, -19.2314453125, -18.62060546875, -18.009765625, -17.39892578125, -16.7880859375, -16.17724609375, -15.56640625, -14.95556640625, -14.3447265625, -13.73388671875, -13.123046875, -12.51220703125, -11.9013671875, -11.29052734375, -10.6796875, -10.06884765625, -9.4580078125, -8.84716796875, -8.236328125, -7.62548828125, -7.0146484375, -6.40380859375, -5.79296875, -5.18212890625, -4.5712890625, -3.96044921875, -3.349609375, -2.73876953125, -2.1279296875, -1.51708984375, -0.90625, -0.29541015625, 0.3154296875, 0.92626953125, 1.537109375, 2.14794921875, 2.7587890625, 3.36962890625, 3.98046875, 4.59130859375, 5.2021484375, 5.81298828125, 6.423828125, 7.03466796875, 7.6455078125, 8.25634765625, 8.8671875, 9.47802734375, 10.0888671875, 10.69970703125, 11.310546875, 11.92138671875, 12.5322265625, 13.14306640625, 13.75390625, 14.36474609375, 14.9755859375, 15.58642578125, 16.197265625, 16.80810546875, 17.4189453125, 18.02978515625, 18.640625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 3.0, 9.0, 9.0, 12.0, 13.0, 20.0, 20.0, 25.0, 39.0, 42.0, 59.0, 72.0, 96.0, 134.0, 167.0, 228.0, 376.0, 581.0, 984.0, 2566.0, 14602.0, 533111.0, 3296838.0, 328752.0, 10610.0, 2150.0, 956.0, 568.0, 326.0, 225.0, 148.0, 122.0, 83.0, 86.0, 52.0, 32.0, 36.0, 13.0, 26.0, 22.0, 13.0, 9.0, 11.0, 5.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.5, -48.8935546875, -47.287109375, -45.6806640625, -44.07421875, -42.4677734375, -40.861328125, -39.2548828125, -37.6484375, -36.0419921875, -34.435546875, -32.8291015625, -31.22265625, -29.6162109375, -28.009765625, -26.4033203125, -24.796875, -23.1904296875, -21.583984375, -19.9775390625, -18.37109375, -16.7646484375, -15.158203125, -13.5517578125, -11.9453125, -10.3388671875, -8.732421875, -7.1259765625, -5.51953125, -3.9130859375, -2.306640625, -0.7001953125, 0.90625, 2.5126953125, 4.119140625, 5.7255859375, 7.33203125, 8.9384765625, 10.544921875, 12.1513671875, 13.7578125, 15.3642578125, 16.970703125, 18.5771484375, 20.18359375, 21.7900390625, 23.396484375, 25.0029296875, 26.609375, 28.2158203125, 29.822265625, 31.4287109375, 33.03515625, 34.6416015625, 36.248046875, 37.8544921875, 39.4609375, 41.0673828125, 42.673828125, 44.2802734375, 45.88671875, 47.4931640625, 49.099609375, 50.7060546875, 52.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 12.0, 22.0, 25.0, 31.0, 37.0, 68.0, 114.0, 203.0, 321.0, 549.0, 825.0, 767.0, 485.0, 261.0, 136.0, 71.0, 52.0, 43.0, 22.0, 13.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-58.28125, -56.69580078125, -55.1103515625, -53.52490234375, -51.939453125, -50.35400390625, -48.7685546875, -47.18310546875, -45.59765625, -44.01220703125, -42.4267578125, -40.84130859375, -39.255859375, -37.67041015625, -36.0849609375, -34.49951171875, -32.9140625, -31.32861328125, -29.7431640625, -28.15771484375, -26.572265625, -24.98681640625, -23.4013671875, -21.81591796875, -20.23046875, -18.64501953125, -17.0595703125, -15.47412109375, -13.888671875, -12.30322265625, -10.7177734375, -9.13232421875, -7.546875, -5.96142578125, -4.3759765625, -2.79052734375, -1.205078125, 0.38037109375, 1.9658203125, 3.55126953125, 5.13671875, 6.72216796875, 8.3076171875, 9.89306640625, 11.478515625, 13.06396484375, 14.6494140625, 16.23486328125, 17.8203125, 19.40576171875, 20.9912109375, 22.57666015625, 24.162109375, 25.74755859375, 27.3330078125, 28.91845703125, 30.50390625, 32.08935546875, 33.6748046875, 35.26025390625, 36.845703125, 38.43115234375, 40.0166015625, 41.60205078125, 43.1875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 9.0, 6.0, 10.0, 11.0, 7.0, 14.0, 18.0, 32.0, 47.0, 69.0, 92.0, 123.0, 169.0, 262.0, 503.0, 1324.0, 15680.0, 4159750.0, 13564.0, 1248.0, 450.0, 218.0, 187.0, 113.0, 89.0, 56.0, 61.0, 31.0, 34.0, 27.0, 18.0, 15.0, 10.0, 7.0, 8.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-152.0, -146.26171875, -140.5234375, -134.78515625, -129.046875, -123.30859375, -117.5703125, -111.83203125, -106.09375, -100.35546875, -94.6171875, -88.87890625, -83.140625, -77.40234375, -71.6640625, -65.92578125, -60.1875, -54.44921875, -48.7109375, -42.97265625, -37.234375, -31.49609375, -25.7578125, -20.01953125, -14.28125, -8.54296875, -2.8046875, 2.93359375, 8.671875, 14.41015625, 20.1484375, 25.88671875, 31.625, 37.36328125, 43.1015625, 48.83984375, 54.578125, 60.31640625, 66.0546875, 71.79296875, 77.53125, 83.26953125, 89.0078125, 94.74609375, 100.484375, 106.22265625, 111.9609375, 117.69921875, 123.4375, 129.17578125, 134.9140625, 140.65234375, 146.390625, 152.12890625, 157.8671875, 163.60546875, 169.34375, 175.08203125, 180.8203125, 186.55859375, 192.296875, 198.03515625, 203.7734375, 209.51171875, 215.25]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 63.0, 336.0, 483.0, 112.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-384.0484313964844, -373.1363830566406, -362.2243347167969, -351.3122863769531, -340.4002380371094, -329.4881896972656, -318.57611083984375, -307.6640625, -296.75201416015625, -285.8399658203125, -274.92791748046875, -264.015869140625, -253.10382080078125, -242.1917724609375, -231.2797088623047, -220.36766052246094, -209.45562744140625, -198.5435791015625, -187.63153076171875, -176.719482421875, -165.80743408203125, -154.8953857421875, -143.9833221435547, -133.07127380371094, -122.15922546386719, -111.24717712402344, -100.33512878417969, -89.4230728149414, -78.51102447509766, -67.5989761352539, -56.686920166015625, -45.774871826171875, -34.86279296875, -23.950742721557617, -13.038692474365234, -2.1266403198242188, 8.785408020019531, 19.69745635986328, 30.609512329101562, 41.52156066894531, 52.43360900878906, 63.34565734863281, 74.25770568847656, 85.16976165771484, 96.0818099975586, 106.99385833740234, 117.90591430664062, 128.81796264648438, 139.73001098632812, 150.64205932617188, 161.55410766601562, 172.46615600585938, 183.37820434570312, 194.29025268554688, 205.2023162841797, 216.11436462402344, 227.0264129638672, 237.93846130371094, 248.8505096435547, 259.7625732421875, 270.67462158203125, 281.586669921875, 292.49871826171875, 303.4107666015625, 314.32281494140625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 9.0, 9.0, 9.0, 15.0, 18.0, 18.0, 28.0, 25.0, 34.0, 29.0, 29.0, 38.0, 37.0, 56.0, 50.0, 40.0, 56.0, 48.0, 50.0, 49.0, 37.0, 37.0, 32.0, 35.0, 39.0, 22.0, 26.0, 21.0, 16.0, 16.0, 19.0, 8.0, 8.0, 10.0, 5.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.992431640625, -113.92119598388672, -109.84996032714844, -105.77872467041016, -101.70748901367188, -97.6362533569336, -93.56501770019531, -89.49378967285156, -85.42254638671875, -81.35131072998047, -77.28007507324219, -73.2088394165039, -69.13760375976562, -65.06636810302734, -60.99513626098633, -56.92390060424805, -52.85266876220703, -48.78143310546875, -44.71019744873047, -40.63896179199219, -36.567726135253906, -32.496490478515625, -28.42525863647461, -24.354022979736328, -20.282787322998047, -16.211551666259766, -12.1403169631958, -8.069082260131836, -3.9978466033935547, 0.07338905334472656, 4.144622802734375, 8.215858459472656, 12.287094116210938, 16.35832977294922, 20.4295654296875, 24.50079917907715, 28.57203483581543, 32.643272399902344, 36.71450424194336, 40.78573989868164, 44.85697555541992, 48.9282112121582, 52.999446868896484, 57.0706787109375, 61.14191436767578, 65.21315002441406, 69.28438568115234, 73.35562133789062, 77.4268569946289, 81.49809265136719, 85.56932830810547, 89.64056396484375, 93.71179962158203, 97.78303527832031, 101.85426330566406, 105.92550659179688, 109.99673461914062, 114.0679702758789, 118.13920593261719, 122.21044158935547, 126.28167724609375, 130.3529052734375, 134.4241485595703, 138.49537658691406, 142.56661987304688]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 15.0, 9.0, 12.0, 15.0, 16.0, 19.0, 27.0, 21.0, 30.0, 32.0, 31.0, 27.0, 39.0, 44.0, 61.0, 40.0, 48.0, 47.0, 35.0, 47.0, 33.0, 36.0, 44.0, 28.0, 29.0, 30.0, 34.0, 27.0, 22.0, 24.0, 18.0, 7.0, 6.0, 11.0, 7.0, 10.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.453125, -18.829833984375, -18.20654296875, -17.583251953125, -16.9599609375, -16.336669921875, -15.71337890625, -15.090087890625, -14.466796875, -13.843505859375, -13.22021484375, -12.596923828125, -11.9736328125, -11.350341796875, -10.72705078125, -10.103759765625, -9.48046875, -8.857177734375, -8.23388671875, -7.610595703125, -6.9873046875, -6.364013671875, -5.74072265625, -5.117431640625, -4.494140625, -3.870849609375, -3.24755859375, -2.624267578125, -2.0009765625, -1.377685546875, -0.75439453125, -0.131103515625, 0.4921875, 1.115478515625, 1.73876953125, 2.362060546875, 2.9853515625, 3.608642578125, 4.23193359375, 4.855224609375, 5.478515625, 6.101806640625, 6.72509765625, 7.348388671875, 7.9716796875, 8.594970703125, 9.21826171875, 9.841552734375, 10.46484375, 11.088134765625, 11.71142578125, 12.334716796875, 12.9580078125, 13.581298828125, 14.20458984375, 14.827880859375, 15.451171875, 16.074462890625, 16.69775390625, 17.321044921875, 17.9443359375, 18.567626953125, 19.19091796875, 19.814208984375, 20.4375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 14.0, 20.0, 19.0, 35.0, 49.0, 74.0, 109.0, 216.0, 380.0, 574.0, 1010.0, 1751.0, 2948.0, 5311.0, 9210.0, 17149.0, 31401.0, 58492.0, 120446.0, 387429.0, 222274.0, 87923.0, 45587.0, 25039.0, 13673.0, 7486.0, 4169.0, 2372.0, 1345.0, 772.0, 488.0, 290.0, 168.0, 106.0, 79.0, 44.0, 40.0, 21.0, 15.0, 15.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.328369140625, -6.12939453125, -5.930419921875, -5.7314453125, -5.532470703125, -5.33349609375, -5.134521484375, -4.935546875, -4.736572265625, -4.53759765625, -4.338623046875, -4.1396484375, -3.940673828125, -3.74169921875, -3.542724609375, -3.34375, -3.144775390625, -2.94580078125, -2.746826171875, -2.5478515625, -2.348876953125, -2.14990234375, -1.950927734375, -1.751953125, -1.552978515625, -1.35400390625, -1.155029296875, -0.9560546875, -0.757080078125, -0.55810546875, -0.359130859375, -0.16015625, 0.038818359375, 0.23779296875, 0.436767578125, 0.6357421875, 0.834716796875, 1.03369140625, 1.232666015625, 1.431640625, 1.630615234375, 1.82958984375, 2.028564453125, 2.2275390625, 2.426513671875, 2.62548828125, 2.824462890625, 3.0234375, 3.222412109375, 3.42138671875, 3.620361328125, 3.8193359375, 4.018310546875, 4.21728515625, 4.416259765625, 4.615234375, 4.814208984375, 5.01318359375, 5.212158203125, 5.4111328125, 5.610107421875, 5.80908203125, 6.008056640625, 6.20703125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 3.0, 10.0, 8.0, 8.0, 9.0, 15.0, 20.0, 14.0, 26.0, 27.0, 21.0, 35.0, 38.0, 39.0, 45.0, 35.0, 34.0, 40.0, 38.0, 1080.0, 46.0, 44.0, 25.0, 25.0, 41.0, 37.0, 44.0, 28.0, 27.0, 24.0, 18.0, 15.0, 17.0, 15.0, 10.0, 11.0, 6.0, 9.0, 6.0, 7.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.8359375, -11.47314453125, -11.1103515625, -10.74755859375, -10.384765625, -10.02197265625, -9.6591796875, -9.29638671875, -8.93359375, -8.57080078125, -8.2080078125, -7.84521484375, -7.482421875, -7.11962890625, -6.7568359375, -6.39404296875, -6.03125, -5.66845703125, -5.3056640625, -4.94287109375, -4.580078125, -4.21728515625, -3.8544921875, -3.49169921875, -3.12890625, -2.76611328125, -2.4033203125, -2.04052734375, -1.677734375, -1.31494140625, -0.9521484375, -0.58935546875, -0.2265625, 0.13623046875, 0.4990234375, 0.86181640625, 1.224609375, 1.58740234375, 1.9501953125, 2.31298828125, 2.67578125, 3.03857421875, 3.4013671875, 3.76416015625, 4.126953125, 4.48974609375, 4.8525390625, 5.21533203125, 5.578125, 5.94091796875, 6.3037109375, 6.66650390625, 7.029296875, 7.39208984375, 7.7548828125, 8.11767578125, 8.48046875, 8.84326171875, 9.2060546875, 9.56884765625, 9.931640625, 10.29443359375, 10.6572265625, 11.02001953125, 11.3828125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 12.0, 18.0, 31.0, 39.0, 56.0, 76.0, 100.0, 139.0, 204.0, 311.0, 490.0, 593.0, 897.0, 1370.0, 2085.0, 3223.0, 4764.0, 7378.0, 11618.0, 18381.0, 29810.0, 50241.0, 86445.0, 159157.0, 1391748.0, 134091.0, 76208.0, 44215.0, 26549.0, 16596.0, 10410.0, 6728.0, 4338.0, 2915.0, 1905.0, 1228.0, 804.0, 590.0, 446.0, 289.0, 186.0, 124.0, 89.0, 61.0, 54.0, 49.0, 24.0, 13.0, 11.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0], "bins": [-4.45703125, -4.31500244140625, -4.1729736328125, -4.03094482421875, -3.888916015625, -3.74688720703125, -3.6048583984375, -3.46282958984375, -3.32080078125, -3.17877197265625, -3.0367431640625, -2.89471435546875, -2.752685546875, -2.61065673828125, -2.4686279296875, -2.32659912109375, -2.1845703125, -2.04254150390625, -1.9005126953125, -1.75848388671875, -1.616455078125, -1.47442626953125, -1.3323974609375, -1.19036865234375, -1.04833984375, -0.90631103515625, -0.7642822265625, -0.62225341796875, -0.480224609375, -0.33819580078125, -0.1961669921875, -0.05413818359375, 0.087890625, 0.22991943359375, 0.3719482421875, 0.51397705078125, 0.656005859375, 0.79803466796875, 0.9400634765625, 1.08209228515625, 1.22412109375, 1.36614990234375, 1.5081787109375, 1.65020751953125, 1.792236328125, 1.93426513671875, 2.0762939453125, 2.21832275390625, 2.3603515625, 2.50238037109375, 2.6444091796875, 2.78643798828125, 2.928466796875, 3.07049560546875, 3.2125244140625, 3.35455322265625, 3.49658203125, 3.63861083984375, 3.7806396484375, 3.92266845703125, 4.064697265625, 4.20672607421875, 4.3487548828125, 4.49078369140625, 4.6328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 8.0, 3.0, 10.0, 8.0, 10.0, 11.0, 10.0, 19.0, 26.0, 31.0, 26.0, 60.0, 38.0, 70.0, 78.0, 88.0, 113.0, 89.0, 59.0, 47.0, 38.0, 31.0, 30.0, 18.0, 19.0, 14.0, 14.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004182338714599609, -0.004042625427246094, -0.003902912139892578, -0.0037631988525390625, -0.003623485565185547, -0.0034837722778320312, -0.0033440589904785156, -0.003204345703125, -0.0030646324157714844, -0.0029249191284179688, -0.002785205841064453, -0.0026454925537109375, -0.002505779266357422, -0.0023660659790039062, -0.0022263526916503906, -0.002086639404296875, -0.0019469261169433594, -0.0018072128295898438, -0.0016674995422363281, -0.0015277862548828125, -0.0013880729675292969, -0.0012483596801757812, -0.0011086463928222656, -0.00096893310546875, -0.0008292198181152344, -0.0006895065307617188, -0.0005497932434082031, -0.0004100799560546875, -0.0002703666687011719, -0.00013065338134765625, 9.059906005859375e-06, 0.000148773193359375, 0.0002884864807128906, 0.00042819976806640625, 0.0005679130554199219, 0.0007076263427734375, 0.0008473396301269531, 0.0009870529174804688, 0.0011267662048339844, 0.0012664794921875, 0.0014061927795410156, 0.0015459060668945312, 0.0016856193542480469, 0.0018253326416015625, 0.001965045928955078, 0.0021047592163085938, 0.0022444725036621094, 0.002384185791015625, 0.0025238990783691406, 0.0026636123657226562, 0.002803325653076172, 0.0029430389404296875, 0.003082752227783203, 0.0032224655151367188, 0.0033621788024902344, 0.00350189208984375, 0.0036416053771972656, 0.0037813186645507812, 0.003921031951904297, 0.0040607452392578125, 0.004200458526611328, 0.004340171813964844, 0.004479885101318359, 0.004619598388671875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 13.0, 8.0, 10.0, 16.0, 11.0, 29.0, 32.0, 28.0, 46.0, 94.0, 152.0, 310.0, 804.0, 976601.0, 69062.0, 619.0, 266.0, 142.0, 76.0, 60.0, 28.0, 38.0, 33.0, 12.0, 18.0, 16.0, 5.0, 3.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.11214637756347656, -0.10863113403320312, -0.10511589050292969, -0.10160064697265625, -0.09808540344238281, -0.09457015991210938, -0.09105491638183594, -0.0875396728515625, -0.08402442932128906, -0.08050918579101562, -0.07699394226074219, -0.07347869873046875, -0.06996345520019531, -0.06644821166992188, -0.06293296813964844, -0.059417724609375, -0.05590248107910156, -0.052387237548828125, -0.04887199401855469, -0.04535675048828125, -0.04184150695800781, -0.038326263427734375, -0.03481101989746094, -0.0312957763671875, -0.027780532836914062, -0.024265289306640625, -0.020750045776367188, -0.01723480224609375, -0.013719558715820312, -0.010204315185546875, -0.0066890716552734375, -0.003173828125, 0.0003414154052734375, 0.003856658935546875, 0.0073719024658203125, 0.01088714599609375, 0.014402389526367188, 0.017917633056640625, 0.021432876586914062, 0.0249481201171875, 0.028463363647460938, 0.031978607177734375, 0.03549385070800781, 0.03900909423828125, 0.04252433776855469, 0.046039581298828125, 0.04955482482910156, 0.053070068359375, 0.05658531188964844, 0.060100555419921875, 0.06361579895019531, 0.06713104248046875, 0.07064628601074219, 0.07416152954101562, 0.07767677307128906, 0.0811920166015625, 0.08470726013183594, 0.08822250366210938, 0.09173774719238281, 0.09525299072265625, 0.09876823425292969, 0.10228347778320312, 0.10579872131347656, 0.10931396484375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 64.0, 669.0, 277.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015839096158742905, -0.015492979437112808, -0.015146863646805286, -0.01480074692517519, -0.014454631134867668, -0.014108514413237572, -0.013762397691607475, -0.013416281901299953, -0.013070165179669857, -0.01272404845803976, -0.012377932667732239, -0.012031815946102142, -0.01168570015579462, -0.011339583434164524, -0.010993467643857002, -0.010647350922226906, -0.01030123420059681, -0.009955117478966713, -0.009609001688659191, -0.009262884967029095, -0.008916769176721573, -0.008570652455091476, -0.00822453573346138, -0.007878419943153858, -0.007532304152846336, -0.007186187896877527, -0.006840071640908718, -0.006493954919278622, -0.0061478386633098125, -0.005801722407341003, -0.005455606151372194, -0.005109489895403385, -0.004763373639434576, -0.004417257383465767, -0.004071141127496958, -0.003725024638697505, -0.003378908149898052, -0.003032791893929243, -0.002686675637960434, -0.002340559149160981, -0.001994442893192172, -0.001648326520808041, -0.0013022101484239101, -0.000956093892455101, -0.0006099775200709701, -0.0002638611476868391, 8.225510828197002e-05, 0.0004283715970814228, 0.0007744878530502319, 0.0011206042254343629, 0.0014667205978184938, 0.001812836853787303, 0.0021589533425867558, 0.002505069598555565, 0.002851185854524374, 0.003197302343323827, 0.003543418599292636, 0.003889534855261445, 0.004235651344060898, 0.004581767600029707, 0.004927883855998516, 0.0052740005776286125, 0.005620116367936134, 0.005966233089566231, 0.00631234934553504]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 7.0, 11.0, 9.0, 8.0, 12.0, 16.0, 13.0, 13.0, 20.0, 24.0, 24.0, 30.0, 29.0, 25.0, 31.0, 30.0, 35.0, 37.0, 37.0, 35.0, 33.0, 39.0, 42.0, 36.0, 30.0, 34.0, 32.0, 33.0, 36.0, 36.0, 20.0, 20.0, 19.0, 19.0, 13.0, 15.0, 18.0, 20.0, 6.0, 11.0, 4.0, 5.0, 4.0, 4.0, 8.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.0016980171203613281, -0.0016461238265037537, -0.0015942305326461792, -0.0015423372387886047, -0.0014904439449310303, -0.0014385506510734558, -0.0013866573572158813, -0.0013347640633583069, -0.0012828707695007324, -0.001230977475643158, -0.0011790841817855835, -0.001127190887928009, -0.0010752975940704346, -0.00102340430021286, -0.0009715110063552856, -0.0009196177124977112, -0.0008677244186401367, -0.0008158311247825623, -0.0007639378309249878, -0.0007120445370674133, -0.0006601512432098389, -0.0006082579493522644, -0.0005563646554946899, -0.0005044713616371155, -0.000452578067779541, -0.00040068477392196655, -0.0003487914800643921, -0.0002968981862068176, -0.00024500489234924316, -0.0001931115984916687, -0.00014121830463409424, -8.932501077651978e-05, -3.743171691894531e-05, 1.446157693862915e-05, 6.635487079620361e-05, 0.00011824816465377808, 0.00017014145851135254, 0.000222034752368927, 0.00027392804622650146, 0.00032582134008407593, 0.0003777146339416504, 0.00042960792779922485, 0.0004815012216567993, 0.0005333945155143738, 0.0005852878093719482, 0.0006371811032295227, 0.0006890743970870972, 0.0007409676909446716, 0.0007928609848022461, 0.0008447542786598206, 0.000896647572517395, 0.0009485408663749695, 0.001000434160232544, 0.0010523274540901184, 0.0011042207479476929, 0.0011561140418052673, 0.0012080073356628418, 0.0012599006295204163, 0.0013117939233779907, 0.0013636872172355652, 0.0014155805110931396, 0.0014674738049507141, 0.0015193670988082886, 0.001571260392665863, 0.0016231536865234375]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 15.0, 9.0, 12.0, 15.0, 16.0, 19.0, 27.0, 21.0, 30.0, 32.0, 31.0, 27.0, 39.0, 44.0, 61.0, 40.0, 48.0, 47.0, 35.0, 47.0, 34.0, 35.0, 44.0, 28.0, 29.0, 30.0, 34.0, 27.0, 22.0, 24.0, 18.0, 7.0, 6.0, 11.0, 7.0, 10.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.453125, -18.829833984375, -18.20654296875, -17.583251953125, -16.9599609375, -16.336669921875, -15.71337890625, -15.090087890625, -14.466796875, -13.843505859375, -13.22021484375, -12.596923828125, -11.9736328125, -11.350341796875, -10.72705078125, -10.103759765625, -9.48046875, -8.857177734375, -8.23388671875, -7.610595703125, -6.9873046875, -6.364013671875, -5.74072265625, -5.117431640625, -4.494140625, -3.870849609375, -3.24755859375, -2.624267578125, -2.0009765625, -1.377685546875, -0.75439453125, -0.131103515625, 0.4921875, 1.115478515625, 1.73876953125, 2.362060546875, 2.9853515625, 3.608642578125, 4.23193359375, 4.855224609375, 5.478515625, 6.101806640625, 6.72509765625, 7.348388671875, 7.9716796875, 8.594970703125, 9.21826171875, 9.841552734375, 10.46484375, 11.088134765625, 11.71142578125, 12.334716796875, 12.9580078125, 13.581298828125, 14.20458984375, 14.827880859375, 15.451171875, 16.074462890625, 16.69775390625, 17.321044921875, 17.9443359375, 18.567626953125, 19.19091796875, 19.814208984375, 20.4375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 8.0, 17.0, 19.0, 24.0, 34.0, 41.0, 50.0, 61.0, 83.0, 104.0, 144.0, 222.0, 370.0, 784.0, 2010.0, 6000.0, 21760.0, 98790.0, 461666.0, 358625.0, 72895.0, 16630.0, 4830.0, 1590.0, 645.0, 337.0, 227.0, 143.0, 112.0, 79.0, 57.0, 46.0, 42.0, 21.0, 19.0, 13.0, 11.0, 11.0, 8.0, 5.0, 0.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.875, -24.070068359375, -23.26513671875, -22.460205078125, -21.6552734375, -20.850341796875, -20.04541015625, -19.240478515625, -18.435546875, -17.630615234375, -16.82568359375, -16.020751953125, -15.2158203125, -14.410888671875, -13.60595703125, -12.801025390625, -11.99609375, -11.191162109375, -10.38623046875, -9.581298828125, -8.7763671875, -7.971435546875, -7.16650390625, -6.361572265625, -5.556640625, -4.751708984375, -3.94677734375, -3.141845703125, -2.3369140625, -1.531982421875, -0.72705078125, 0.077880859375, 0.8828125, 1.687744140625, 2.49267578125, 3.297607421875, 4.1025390625, 4.907470703125, 5.71240234375, 6.517333984375, 7.322265625, 8.127197265625, 8.93212890625, 9.737060546875, 10.5419921875, 11.346923828125, 12.15185546875, 12.956787109375, 13.76171875, 14.566650390625, 15.37158203125, 16.176513671875, 16.9814453125, 17.786376953125, 18.59130859375, 19.396240234375, 20.201171875, 21.006103515625, 21.81103515625, 22.615966796875, 23.4208984375, 24.225830078125, 25.03076171875, 25.835693359375, 26.640625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 6.0, 1.0, 5.0, 5.0, 5.0, 6.0, 5.0, 7.0, 6.0, 11.0, 24.0, 13.0, 25.0, 31.0, 27.0, 32.0, 32.0, 28.0, 40.0, 42.0, 47.0, 63.0, 95.0, 242.0, 1577.0, 153.0, 75.0, 51.0, 61.0, 42.0, 40.0, 37.0, 27.0, 31.0, 31.0, 28.0, 13.0, 15.0, 22.0, 12.0, 11.0, 8.0, 10.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.96875, -44.34912109375, -42.7294921875, -41.10986328125, -39.490234375, -37.87060546875, -36.2509765625, -34.63134765625, -33.01171875, -31.39208984375, -29.7724609375, -28.15283203125, -26.533203125, -24.91357421875, -23.2939453125, -21.67431640625, -20.0546875, -18.43505859375, -16.8154296875, -15.19580078125, -13.576171875, -11.95654296875, -10.3369140625, -8.71728515625, -7.09765625, -5.47802734375, -3.8583984375, -2.23876953125, -0.619140625, 1.00048828125, 2.6201171875, 4.23974609375, 5.859375, 7.47900390625, 9.0986328125, 10.71826171875, 12.337890625, 13.95751953125, 15.5771484375, 17.19677734375, 18.81640625, 20.43603515625, 22.0556640625, 23.67529296875, 25.294921875, 26.91455078125, 28.5341796875, 30.15380859375, 31.7734375, 33.39306640625, 35.0126953125, 36.63232421875, 38.251953125, 39.87158203125, 41.4912109375, 43.11083984375, 44.73046875, 46.35009765625, 47.9697265625, 49.58935546875, 51.208984375, 52.82861328125, 54.4482421875, 56.06787109375, 57.6875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 12.0, 8.0, 14.0, 22.0, 34.0, 52.0, 67.0, 91.0, 142.0, 208.0, 318.0, 667.0, 2195.0, 72289.0, 3045233.0, 21544.0, 1412.0, 532.0, 265.0, 208.0, 124.0, 75.0, 58.0, 31.0, 32.0, 25.0, 14.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-87.875, -84.666015625, -81.45703125, -78.248046875, -75.0390625, -71.830078125, -68.62109375, -65.412109375, -62.203125, -58.994140625, -55.78515625, -52.576171875, -49.3671875, -46.158203125, -42.94921875, -39.740234375, -36.53125, -33.322265625, -30.11328125, -26.904296875, -23.6953125, -20.486328125, -17.27734375, -14.068359375, -10.859375, -7.650390625, -4.44140625, -1.232421875, 1.9765625, 5.185546875, 8.39453125, 11.603515625, 14.8125, 18.021484375, 21.23046875, 24.439453125, 27.6484375, 30.857421875, 34.06640625, 37.275390625, 40.484375, 43.693359375, 46.90234375, 50.111328125, 53.3203125, 56.529296875, 59.73828125, 62.947265625, 66.15625, 69.365234375, 72.57421875, 75.783203125, 78.9921875, 82.201171875, 85.41015625, 88.619140625, 91.828125, 95.037109375, 98.24609375, 101.455078125, 104.6640625, 107.873046875, 111.08203125, 114.291015625, 117.5]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 44.0, 92.0, 176.0, 241.0, 229.0, 142.0, 55.0, 12.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.9842529296875, -82.12683868408203, -79.26941680908203, -76.41200256347656, -73.5545883178711, -70.69717407226562, -67.83975219726562, -64.98233795166016, -62.12491989135742, -59.26750183105469, -56.41008758544922, -53.552669525146484, -50.69525146484375, -47.83783721923828, -44.98041915893555, -42.12300109863281, -39.265586853027344, -36.40816879272461, -33.55075454711914, -30.693336486816406, -27.835920333862305, -24.978504180908203, -22.12108612060547, -19.263669967651367, -16.406253814697266, -13.548837661743164, -10.691420555114746, -7.834003448486328, -4.976587295532227, -2.119171142578125, 0.7382469177246094, 3.595663070678711, 6.453071594238281, 9.310487747192383, 12.1679048538208, 15.025321960449219, 17.88273811340332, 20.740154266357422, 23.597572326660156, 26.454988479614258, 29.31240463256836, 32.169822692871094, 35.02723693847656, 37.8846549987793, 40.74207305908203, 43.5994873046875, 46.456905364990234, 49.31432342529297, 52.17173767089844, 55.02915573120117, 57.88656997680664, 60.743988037109375, 63.601402282714844, 66.45881652832031, 69.31623840332031, 72.17365264892578, 75.03106689453125, 77.88848114013672, 80.74590301513672, 83.60331726074219, 86.46073150634766, 89.31814575195312, 92.17556762695312, 95.0329818725586, 97.8904037475586]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 12.0, 11.0, 11.0, 15.0, 20.0, 22.0, 30.0, 21.0, 24.0, 32.0, 38.0, 39.0, 50.0, 55.0, 45.0, 36.0, 53.0, 41.0, 43.0, 49.0, 34.0, 38.0, 33.0, 37.0, 32.0, 28.0, 27.0, 23.0, 13.0, 20.0, 14.0, 15.0, 4.0, 6.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 3.0], "bins": [-166.73043823242188, -162.52761840820312, -158.32479858398438, -154.12196350097656, -149.9191436767578, -145.71632385253906, -141.5135040283203, -137.3106689453125, -133.10784912109375, -128.905029296875, -124.70220184326172, -120.49938201904297, -116.29655456542969, -112.09373474121094, -107.89091491699219, -103.6880874633789, -99.48526763916016, -95.2824478149414, -91.07962036132812, -86.87680053710938, -82.6739730834961, -78.47115325927734, -74.26832580566406, -70.06550598144531, -65.86268615722656, -61.65986251831055, -57.45703887939453, -53.25421905517578, -49.0513916015625, -44.84857177734375, -40.645748138427734, -36.44292449951172, -32.24009704589844, -28.037273406982422, -23.834449768066406, -19.631628036499023, -15.428804397583008, -11.225980758666992, -7.023159027099609, -2.8203353881835938, 1.3824882507324219, 5.585311412811279, 9.788134574890137, 13.990957260131836, 18.19378089904785, 22.396604537963867, 26.59942626953125, 30.802249908447266, 35.00507354736328, 39.2078971862793, 43.41072082519531, 47.61354064941406, 51.816368103027344, 56.019187927246094, 60.22201156616211, 64.42483520507812, 68.62765502929688, 72.83047485351562, 77.0333023071289, 81.23612213134766, 85.43894958496094, 89.64176940917969, 93.84458923339844, 98.04741668701172, 102.250244140625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 0.0, 0.0, 5.0, 3.0, 4.0, 8.0, 8.0, 11.0, 14.0, 12.0, 15.0, 25.0, 26.0, 21.0, 27.0, 26.0, 30.0, 38.0, 31.0, 34.0, 42.0, 38.0, 40.0, 35.0, 45.0, 44.0, 39.0, 31.0, 41.0, 38.0, 38.0, 31.0, 25.0, 27.0, 28.0, 24.0, 17.0, 18.0, 12.0, 13.0, 15.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.015625, -17.41552734375, -16.8154296875, -16.21533203125, -15.615234375, -15.01513671875, -14.4150390625, -13.81494140625, -13.21484375, -12.61474609375, -12.0146484375, -11.41455078125, -10.814453125, -10.21435546875, -9.6142578125, -9.01416015625, -8.4140625, -7.81396484375, -7.2138671875, -6.61376953125, -6.013671875, -5.41357421875, -4.8134765625, -4.21337890625, -3.61328125, -3.01318359375, -2.4130859375, -1.81298828125, -1.212890625, -0.61279296875, -0.0126953125, 0.58740234375, 1.1875, 1.78759765625, 2.3876953125, 2.98779296875, 3.587890625, 4.18798828125, 4.7880859375, 5.38818359375, 5.98828125, 6.58837890625, 7.1884765625, 7.78857421875, 8.388671875, 8.98876953125, 9.5888671875, 10.18896484375, 10.7890625, 11.38916015625, 11.9892578125, 12.58935546875, 13.189453125, 13.78955078125, 14.3896484375, 14.98974609375, 15.58984375, 16.18994140625, 16.7900390625, 17.39013671875, 17.990234375, 18.59033203125, 19.1904296875, 19.79052734375, 20.390625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 5.0, 7.0, 7.0, 9.0, 20.0, 11.0, 12.0, 18.0, 16.0, 29.0, 23.0, 25.0, 38.0, 38.0, 51.0, 84.0, 172.0, 375.0, 936.0, 5421.0, 1105601.0, 3063208.0, 15646.0, 1416.0, 445.0, 189.0, 103.0, 70.0, 46.0, 37.0, 37.0, 27.0, 25.0, 18.0, 15.0, 14.0, 11.0, 7.0, 10.0, 11.0, 7.0, 5.0, 8.0, 1.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-86.875, -84.1728515625, -81.470703125, -78.7685546875, -76.06640625, -73.3642578125, -70.662109375, -67.9599609375, -65.2578125, -62.5556640625, -59.853515625, -57.1513671875, -54.44921875, -51.7470703125, -49.044921875, -46.3427734375, -43.640625, -40.9384765625, -38.236328125, -35.5341796875, -32.83203125, -30.1298828125, -27.427734375, -24.7255859375, -22.0234375, -19.3212890625, -16.619140625, -13.9169921875, -11.21484375, -8.5126953125, -5.810546875, -3.1083984375, -0.40625, 2.2958984375, 4.998046875, 7.7001953125, 10.40234375, 13.1044921875, 15.806640625, 18.5087890625, 21.2109375, 23.9130859375, 26.615234375, 29.3173828125, 32.01953125, 34.7216796875, 37.423828125, 40.1259765625, 42.828125, 45.5302734375, 48.232421875, 50.9345703125, 53.63671875, 56.3388671875, 59.041015625, 61.7431640625, 64.4453125, 67.1474609375, 69.849609375, 72.5517578125, 75.25390625, 77.9560546875, 80.658203125, 83.3603515625, 86.0625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 13.0, 9.0, 16.0, 20.0, 42.0, 51.0, 119.0, 196.0, 296.0, 525.0, 727.0, 726.0, 541.0, 315.0, 191.0, 102.0, 59.0, 43.0, 25.0, 19.0, 6.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.296875, -30.134033203125, -28.97119140625, -27.808349609375, -26.6455078125, -25.482666015625, -24.31982421875, -23.156982421875, -21.994140625, -20.831298828125, -19.66845703125, -18.505615234375, -17.3427734375, -16.179931640625, -15.01708984375, -13.854248046875, -12.69140625, -11.528564453125, -10.36572265625, -9.202880859375, -8.0400390625, -6.877197265625, -5.71435546875, -4.551513671875, -3.388671875, -2.225830078125, -1.06298828125, 0.099853515625, 1.2626953125, 2.425537109375, 3.58837890625, 4.751220703125, 5.9140625, 7.076904296875, 8.23974609375, 9.402587890625, 10.5654296875, 11.728271484375, 12.89111328125, 14.053955078125, 15.216796875, 16.379638671875, 17.54248046875, 18.705322265625, 19.8681640625, 21.031005859375, 22.19384765625, 23.356689453125, 24.51953125, 25.682373046875, 26.84521484375, 28.008056640625, 29.1708984375, 30.333740234375, 31.49658203125, 32.659423828125, 33.822265625, 34.985107421875, 36.14794921875, 37.310791015625, 38.4736328125, 39.636474609375, 40.79931640625, 41.962158203125, 43.125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 7.0, 3.0, 7.0, 11.0, 9.0, 20.0, 18.0, 29.0, 34.0, 54.0, 84.0, 134.0, 311.0, 671.0, 1946.0, 30769.0, 4002033.0, 152943.0, 3438.0, 844.0, 374.0, 206.0, 107.0, 53.0, 40.0, 23.0, 32.0, 19.0, 12.0, 6.0, 14.0, 5.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-98.125, -94.81640625, -91.5078125, -88.19921875, -84.890625, -81.58203125, -78.2734375, -74.96484375, -71.65625, -68.34765625, -65.0390625, -61.73046875, -58.421875, -55.11328125, -51.8046875, -48.49609375, -45.1875, -41.87890625, -38.5703125, -35.26171875, -31.953125, -28.64453125, -25.3359375, -22.02734375, -18.71875, -15.41015625, -12.1015625, -8.79296875, -5.484375, -2.17578125, 1.1328125, 4.44140625, 7.75, 11.05859375, 14.3671875, 17.67578125, 20.984375, 24.29296875, 27.6015625, 30.91015625, 34.21875, 37.52734375, 40.8359375, 44.14453125, 47.453125, 50.76171875, 54.0703125, 57.37890625, 60.6875, 63.99609375, 67.3046875, 70.61328125, 73.921875, 77.23046875, 80.5390625, 83.84765625, 87.15625, 90.46484375, 93.7734375, 97.08203125, 100.390625, 103.69921875, 107.0078125, 110.31640625, 113.625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 25.0, 169.0, 473.0, 287.0, 53.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-408.4092712402344, -398.10357666015625, -387.7978515625, -377.4921569824219, -367.1864318847656, -356.8807373046875, -346.57501220703125, -336.2693176269531, -325.963623046875, -315.6579284667969, -305.3522033691406, -295.0465087890625, -284.74078369140625, -274.4350891113281, -264.1293640136719, -253.82366943359375, -243.5179443359375, -233.2122344970703, -222.90652465820312, -212.60081481933594, -202.29510498046875, -191.98941040039062, -181.68370056152344, -171.37799072265625, -161.07228088378906, -150.76657104492188, -140.4608612060547, -130.1551513671875, -119.84944915771484, -109.54373931884766, -99.238037109375, -88.93232727050781, -78.62661743164062, -68.32090759277344, -58.015201568603516, -47.709495544433594, -37.403785705566406, -27.09807586669922, -16.792369842529297, -6.486663818359375, 3.8190460205078125, 14.124753952026367, 24.430461883544922, 34.736167907714844, 45.04187774658203, 55.34758758544922, 65.65328979492188, 75.95899963378906, 86.26470947265625, 96.57041931152344, 106.87612915039062, 117.18183135986328, 127.48754119873047, 137.79324340820312, 148.0989532470703, 158.4046630859375, 168.7103729248047, 179.01608276367188, 189.32179260253906, 199.62750244140625, 209.93319702148438, 220.23892211914062, 230.54461669921875, 240.85032653808594, 251.15603637695312]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 0.0, 4.0, 6.0, 7.0, 9.0, 7.0, 16.0, 13.0, 20.0, 23.0, 19.0, 24.0, 25.0, 42.0, 32.0, 43.0, 47.0, 55.0, 35.0, 52.0, 44.0, 45.0, 42.0, 42.0, 44.0, 35.0, 44.0, 31.0, 31.0, 26.0, 22.0, 21.0, 25.0, 13.0, 12.0, 16.0, 8.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.32467651367188, -92.9963607788086, -89.66804504394531, -86.3397216796875, -83.01140594482422, -79.68309020996094, -76.35476684570312, -73.02645111083984, -69.69813537597656, -66.36981964111328, -63.041500091552734, -59.71318054199219, -56.384864807128906, -53.056549072265625, -49.72822952270508, -46.39990997314453, -43.07159423828125, -39.74327850341797, -36.41495895385742, -33.086639404296875, -29.758323669433594, -26.43000602722168, -23.101688385009766, -19.77337074279785, -16.445053100585938, -13.116735458374023, -9.78841781616211, -6.460100173950195, -3.1317825317382812, 0.1965351104736328, 3.524852752685547, 6.853170394897461, 10.181488037109375, 13.509805679321289, 16.838123321533203, 20.166440963745117, 23.49475860595703, 26.823076248168945, 30.15139389038086, 33.479713439941406, 36.80802917480469, 40.13634490966797, 43.464664459228516, 46.79298400878906, 50.121299743652344, 53.449615478515625, 56.77793502807617, 60.10625457763672, 63.4345703125, 66.76288604736328, 70.09120178222656, 73.41952514648438, 76.74784088134766, 80.07615661621094, 83.40447998046875, 86.73279571533203, 90.06111145019531, 93.3894271850586, 96.71774291992188, 100.04606628417969, 103.37438201904297, 106.70269775390625, 110.03102111816406, 113.35933685302734, 116.68765258789062]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 3.0, 10.0, 9.0, 10.0, 11.0, 12.0, 16.0, 26.0, 30.0, 22.0, 23.0, 31.0, 28.0, 45.0, 41.0, 44.0, 44.0, 34.0, 49.0, 33.0, 51.0, 48.0, 40.0, 40.0, 36.0, 46.0, 32.0, 29.0, 24.0, 22.0, 20.0, 14.0, 14.0, 17.0, 10.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.552978515625, -16.90283203125, -16.252685546875, -15.6025390625, -14.952392578125, -14.30224609375, -13.652099609375, -13.001953125, -12.351806640625, -11.70166015625, -11.051513671875, -10.4013671875, -9.751220703125, -9.10107421875, -8.450927734375, -7.80078125, -7.150634765625, -6.50048828125, -5.850341796875, -5.2001953125, -4.550048828125, -3.89990234375, -3.249755859375, -2.599609375, -1.949462890625, -1.29931640625, -0.649169921875, 0.0009765625, 0.651123046875, 1.30126953125, 1.951416015625, 2.6015625, 3.251708984375, 3.90185546875, 4.552001953125, 5.2021484375, 5.852294921875, 6.50244140625, 7.152587890625, 7.802734375, 8.452880859375, 9.10302734375, 9.753173828125, 10.4033203125, 11.053466796875, 11.70361328125, 12.353759765625, 13.00390625, 13.654052734375, 14.30419921875, 14.954345703125, 15.6044921875, 16.254638671875, 16.90478515625, 17.554931640625, 18.205078125, 18.855224609375, 19.50537109375, 20.155517578125, 20.8056640625, 21.455810546875, 22.10595703125, 22.756103515625, 23.40625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 4.0, 4.0, 10.0, 28.0, 29.0, 37.0, 49.0, 89.0, 160.0, 211.0, 332.0, 594.0, 820.0, 1254.0, 1828.0, 2839.0, 4475.0, 6936.0, 10994.0, 17989.0, 29282.0, 50793.0, 91573.0, 200215.0, 336755.0, 126333.0, 66068.0, 38215.0, 22545.0, 13781.0, 8672.0, 5393.0, 3605.0, 2290.0, 1537.0, 923.0, 663.0, 422.0, 249.0, 186.0, 144.0, 81.0, 38.0, 35.0, 40.0, 11.0, 10.0, 2.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.7869873046875, -4.628662109375, -4.4703369140625, -4.31201171875, -4.1536865234375, -3.995361328125, -3.8370361328125, -3.6787109375, -3.5203857421875, -3.362060546875, -3.2037353515625, -3.04541015625, -2.8870849609375, -2.728759765625, -2.5704345703125, -2.412109375, -2.2537841796875, -2.095458984375, -1.9371337890625, -1.77880859375, -1.6204833984375, -1.462158203125, -1.3038330078125, -1.1455078125, -0.9871826171875, -0.828857421875, -0.6705322265625, -0.51220703125, -0.3538818359375, -0.195556640625, -0.0372314453125, 0.12109375, 0.2794189453125, 0.437744140625, 0.5960693359375, 0.75439453125, 0.9127197265625, 1.071044921875, 1.2293701171875, 1.3876953125, 1.5460205078125, 1.704345703125, 1.8626708984375, 2.02099609375, 2.1793212890625, 2.337646484375, 2.4959716796875, 2.654296875, 2.8126220703125, 2.970947265625, 3.1292724609375, 3.28759765625, 3.4459228515625, 3.604248046875, 3.7625732421875, 3.9208984375, 4.0792236328125, 4.237548828125, 4.3958740234375, 4.55419921875, 4.7125244140625, 4.870849609375, 5.0291748046875, 5.1875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 5.0, 9.0, 4.0, 25.0, 13.0, 13.0, 18.0, 23.0, 34.0, 24.0, 27.0, 36.0, 41.0, 40.0, 57.0, 29.0, 37.0, 42.0, 1067.0, 48.0, 43.0, 41.0, 43.0, 30.0, 34.0, 36.0, 31.0, 23.0, 22.0, 26.0, 22.0, 16.0, 20.0, 10.0, 9.0, 6.0, 2.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.6171875, -12.2119140625, -11.806640625, -11.4013671875, -10.99609375, -10.5908203125, -10.185546875, -9.7802734375, -9.375, -8.9697265625, -8.564453125, -8.1591796875, -7.75390625, -7.3486328125, -6.943359375, -6.5380859375, -6.1328125, -5.7275390625, -5.322265625, -4.9169921875, -4.51171875, -4.1064453125, -3.701171875, -3.2958984375, -2.890625, -2.4853515625, -2.080078125, -1.6748046875, -1.26953125, -0.8642578125, -0.458984375, -0.0537109375, 0.3515625, 0.7568359375, 1.162109375, 1.5673828125, 1.97265625, 2.3779296875, 2.783203125, 3.1884765625, 3.59375, 3.9990234375, 4.404296875, 4.8095703125, 5.21484375, 5.6201171875, 6.025390625, 6.4306640625, 6.8359375, 7.2412109375, 7.646484375, 8.0517578125, 8.45703125, 8.8623046875, 9.267578125, 9.6728515625, 10.078125, 10.4833984375, 10.888671875, 11.2939453125, 11.69921875, 12.1044921875, 12.509765625, 12.9150390625, 13.3203125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 5.0, 0.0, 7.0, 6.0, 8.0, 9.0, 20.0, 22.0, 47.0, 42.0, 65.0, 99.0, 116.0, 186.0, 294.0, 413.0, 613.0, 934.0, 1410.0, 2230.0, 3374.0, 5574.0, 9107.0, 14725.0, 24769.0, 41250.0, 71407.0, 133371.0, 1386452.0, 180568.0, 90938.0, 51024.0, 30332.0, 18149.0, 11019.0, 6732.0, 4043.0, 2614.0, 1724.0, 1090.0, 736.0, 506.0, 351.0, 243.0, 156.0, 104.0, 58.0, 61.0, 37.0, 32.0, 20.0, 16.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 4.0], "bins": [-5.203125, -5.04400634765625, -4.8848876953125, -4.72576904296875, -4.566650390625, -4.40753173828125, -4.2484130859375, -4.08929443359375, -3.93017578125, -3.77105712890625, -3.6119384765625, -3.45281982421875, -3.293701171875, -3.13458251953125, -2.9754638671875, -2.81634521484375, -2.6572265625, -2.49810791015625, -2.3389892578125, -2.17987060546875, -2.020751953125, -1.86163330078125, -1.7025146484375, -1.54339599609375, -1.38427734375, -1.22515869140625, -1.0660400390625, -0.90692138671875, -0.747802734375, -0.58868408203125, -0.4295654296875, -0.27044677734375, -0.111328125, 0.04779052734375, 0.2069091796875, 0.36602783203125, 0.525146484375, 0.68426513671875, 0.8433837890625, 1.00250244140625, 1.16162109375, 1.32073974609375, 1.4798583984375, 1.63897705078125, 1.798095703125, 1.95721435546875, 2.1163330078125, 2.27545166015625, 2.4345703125, 2.59368896484375, 2.7528076171875, 2.91192626953125, 3.071044921875, 3.23016357421875, 3.3892822265625, 3.54840087890625, 3.70751953125, 3.86663818359375, 4.0257568359375, 4.18487548828125, 4.343994140625, 4.50311279296875, 4.6622314453125, 4.82135009765625, 4.98046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 4.0, 0.0, 3.0, 6.0, 11.0, 6.0, 8.0, 13.0, 12.0, 25.0, 18.0, 28.0, 46.0, 33.0, 52.0, 76.0, 112.0, 123.0, 108.0, 67.0, 49.0, 41.0, 25.0, 25.0, 20.0, 19.0, 16.0, 9.0, 5.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004314422607421875, -0.004176199436187744, -0.004037976264953613, -0.0038997530937194824, -0.0037615299224853516, -0.0036233067512512207, -0.00348508358001709, -0.003346860408782959, -0.003208637237548828, -0.0030704140663146973, -0.0029321908950805664, -0.0027939677238464355, -0.0026557445526123047, -0.002517521381378174, -0.002379298210144043, -0.002241075038909912, -0.0021028518676757812, -0.0019646286964416504, -0.0018264055252075195, -0.0016881823539733887, -0.0015499591827392578, -0.001411736011505127, -0.001273512840270996, -0.0011352896690368652, -0.0009970664978027344, -0.0008588433265686035, -0.0007206201553344727, -0.0005823969841003418, -0.00044417381286621094, -0.0003059506416320801, -0.00016772747039794922, -2.950429916381836e-05, 0.0001087188720703125, 0.00024694204330444336, 0.0003851652145385742, 0.0005233883857727051, 0.0006616115570068359, 0.0007998347282409668, 0.0009380578994750977, 0.0010762810707092285, 0.0012145042419433594, 0.0013527274131774902, 0.001490950584411621, 0.001629173755645752, 0.0017673969268798828, 0.0019056200981140137, 0.0020438432693481445, 0.0021820664405822754, 0.0023202896118164062, 0.002458512783050537, 0.002596735954284668, 0.002734959125518799, 0.0028731822967529297, 0.0030114054679870605, 0.0031496286392211914, 0.0032878518104553223, 0.003426074981689453, 0.003564298152923584, 0.003702521324157715, 0.0038407444953918457, 0.0039789676666259766, 0.004117190837860107, 0.004255414009094238, 0.004393637180328369, 0.0045318603515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 6.0, 6.0, 6.0, 5.0, 12.0, 11.0, 20.0, 20.0, 23.0, 47.0, 46.0, 70.0, 115.0, 193.0, 455.0, 1622.0, 1041587.0, 3126.0, 553.0, 217.0, 117.0, 81.0, 52.0, 40.0, 18.0, 17.0, 15.0, 15.0, 12.0, 11.0, 8.0, 6.0, 5.0, 0.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09722614288330078, -0.09404945373535156, -0.09087276458740234, -0.08769607543945312, -0.0845193862915039, -0.08134269714355469, -0.07816600799560547, -0.07498931884765625, -0.07181262969970703, -0.06863594055175781, -0.0654592514038086, -0.062282562255859375, -0.059105873107910156, -0.05592918395996094, -0.05275249481201172, -0.0495758056640625, -0.04639911651611328, -0.04322242736816406, -0.040045738220214844, -0.036869049072265625, -0.033692359924316406, -0.030515670776367188, -0.02733898162841797, -0.02416229248046875, -0.02098560333251953, -0.017808914184570312, -0.014632225036621094, -0.011455535888671875, -0.008278846740722656, -0.0051021575927734375, -0.0019254684448242188, 0.001251220703125, 0.004427909851074219, 0.0076045989990234375, 0.010781288146972656, 0.013957977294921875, 0.017134666442871094, 0.020311355590820312, 0.02348804473876953, 0.02666473388671875, 0.02984142303466797, 0.03301811218261719, 0.036194801330566406, 0.039371490478515625, 0.042548179626464844, 0.04572486877441406, 0.04890155792236328, 0.0520782470703125, 0.05525493621826172, 0.05843162536621094, 0.061608314514160156, 0.06478500366210938, 0.0679616928100586, 0.07113838195800781, 0.07431507110595703, 0.07749176025390625, 0.08066844940185547, 0.08384513854980469, 0.0870218276977539, 0.09019851684570312, 0.09337520599365234, 0.09655189514160156, 0.09972858428955078, 0.1029052734375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 17.0, 81.0, 241.0, 416.0, 195.0, 47.0, 12.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009025088511407375, -0.0007608350133523345, -0.0006191612337715924, -0.0004774874250870198, -0.0003358136164024472, -0.0001941397786140442, -5.246599903330207e-05, 8.920778054744005e-05, 0.00023088161833584309, 0.00037255542702041566, 0.0005142292357049882, 0.0006559030152857304, 0.0007975768530741334, 0.0009392506908625364, 0.0010809244122356176, 0.0012225982500240207, 0.0013642720878124237, 0.0015059459256008267, 0.0016476197633892298, 0.001789293484762311, 0.001930967322550714, 0.002072641160339117, 0.0022143148817121983, 0.0023559886030852795, 0.0024976625572890043, 0.0026393362786620855, 0.0027810102328658104, 0.0029226839542388916, 0.003064357675611973, 0.0032060316298156977, 0.003347705351188779, 0.0034893793053925037, 0.0036310534924268723, 0.0037727272137999535, 0.003914400935173035, 0.004056075122207403, 0.004197748843580484, 0.004339422564953566, 0.004481096286326647, 0.004622770007699728, 0.0047644441947340965, 0.004906117916107178, 0.005047791637480259, 0.0051894658245146275, 0.005331139545887709, 0.00547281326726079, 0.005614486988633871, 0.005756160710006952, 0.0058978344313800335, 0.006039508152753115, 0.006181181874126196, 0.006322856061160564, 0.006464529782533646, 0.006606203503906727, 0.006747877225279808, 0.006889550946652889, 0.0070312246680259705, 0.007172898389399052, 0.007314572110772133, 0.007456246297806501, 0.007597920019179583, 0.007739593740552664, 0.007881267927587032, 0.008022941648960114, 0.008164615370333195]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 16.0, 7.0, 8.0, 14.0, 8.0, 18.0, 17.0, 20.0, 27.0, 27.0, 27.0, 24.0, 32.0, 38.0, 36.0, 31.0, 34.0, 45.0, 51.0, 39.0, 51.0, 39.0, 35.0, 32.0, 36.0, 33.0, 23.0, 34.0, 26.0, 18.0, 26.0, 24.0, 20.0, 18.0, 14.0, 8.0, 4.0, 9.0, 8.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001797020435333252, -0.0017392486333847046, -0.0016814768314361572, -0.0016237050294876099, -0.0015659332275390625, -0.0015081614255905151, -0.0014503896236419678, -0.0013926178216934204, -0.001334846019744873, -0.0012770742177963257, -0.0012193024158477783, -0.001161530613899231, -0.0011037588119506836, -0.0010459870100021362, -0.0009882152080535889, -0.0009304434061050415, -0.0008726716041564941, -0.0008148998022079468, -0.0007571280002593994, -0.000699356198310852, -0.0006415843963623047, -0.0005838125944137573, -0.00052604079246521, -0.0004682689905166626, -0.00041049718856811523, -0.00035272538661956787, -0.0002949535846710205, -0.00023718178272247314, -0.00017940998077392578, -0.00012163817882537842, -6.386637687683105e-05, -6.094574928283691e-06, 5.167722702026367e-05, 0.00010944902896881104, 0.0001672208309173584, 0.00022499263286590576, 0.0002827644348144531, 0.0003405362367630005, 0.00039830803871154785, 0.0004560798406600952, 0.0005138516426086426, 0.0005716234445571899, 0.0006293952465057373, 0.0006871670484542847, 0.000744938850402832, 0.0008027106523513794, 0.0008604824542999268, 0.0009182542562484741, 0.0009760260581970215, 0.0010337978601455688, 0.0010915696620941162, 0.0011493414640426636, 0.001207113265991211, 0.0012648850679397583, 0.0013226568698883057, 0.001380428671836853, 0.0014382004737854004, 0.0014959722757339478, 0.0015537440776824951, 0.0016115158796310425, 0.0016692876815795898, 0.0017270594835281372, 0.0017848312854766846, 0.001842603087425232, 0.0019003748893737793]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 3.0, 10.0, 9.0, 10.0, 11.0, 12.0, 16.0, 26.0, 30.0, 22.0, 23.0, 31.0, 28.0, 45.0, 41.0, 44.0, 44.0, 34.0, 49.0, 33.0, 51.0, 48.0, 40.0, 40.0, 36.0, 46.0, 32.0, 29.0, 24.0, 22.0, 20.0, 14.0, 14.0, 17.0, 10.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.552978515625, -16.90283203125, -16.252685546875, -15.6025390625, -14.952392578125, -14.30224609375, -13.652099609375, -13.001953125, -12.351806640625, -11.70166015625, -11.051513671875, -10.4013671875, -9.751220703125, -9.10107421875, -8.450927734375, -7.80078125, -7.150634765625, -6.50048828125, -5.850341796875, -5.2001953125, -4.550048828125, -3.89990234375, -3.249755859375, -2.599609375, -1.949462890625, -1.29931640625, -0.649169921875, 0.0009765625, 0.651123046875, 1.30126953125, 1.951416015625, 2.6015625, 3.251708984375, 3.90185546875, 4.552001953125, 5.2021484375, 5.852294921875, 6.50244140625, 7.152587890625, 7.802734375, 8.452880859375, 9.10302734375, 9.753173828125, 10.4033203125, 11.053466796875, 11.70361328125, 12.353759765625, 13.00390625, 13.654052734375, 14.30419921875, 14.954345703125, 15.6044921875, 16.254638671875, 16.90478515625, 17.554931640625, 18.205078125, 18.855224609375, 19.50537109375, 20.155517578125, 20.8056640625, 21.455810546875, 22.10595703125, 22.756103515625, 23.40625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 11.0, 11.0, 12.0, 21.0, 37.0, 46.0, 55.0, 77.0, 125.0, 145.0, 201.0, 330.0, 425.0, 693.0, 1144.0, 2465.0, 6970.0, 27853.0, 136964.0, 487145.0, 298887.0, 62665.0, 13854.0, 4113.0, 1606.0, 837.0, 575.0, 351.0, 267.0, 196.0, 143.0, 90.0, 75.0, 41.0, 41.0, 22.0, 21.0, 13.0, 14.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.608154296875, -23.85693359375, -23.105712890625, -22.3544921875, -21.603271484375, -20.85205078125, -20.100830078125, -19.349609375, -18.598388671875, -17.84716796875, -17.095947265625, -16.3447265625, -15.593505859375, -14.84228515625, -14.091064453125, -13.33984375, -12.588623046875, -11.83740234375, -11.086181640625, -10.3349609375, -9.583740234375, -8.83251953125, -8.081298828125, -7.330078125, -6.578857421875, -5.82763671875, -5.076416015625, -4.3251953125, -3.573974609375, -2.82275390625, -2.071533203125, -1.3203125, -0.569091796875, 0.18212890625, 0.933349609375, 1.6845703125, 2.435791015625, 3.18701171875, 3.938232421875, 4.689453125, 5.440673828125, 6.19189453125, 6.943115234375, 7.6943359375, 8.445556640625, 9.19677734375, 9.947998046875, 10.69921875, 11.450439453125, 12.20166015625, 12.952880859375, 13.7041015625, 14.455322265625, 15.20654296875, 15.957763671875, 16.708984375, 17.460205078125, 18.21142578125, 18.962646484375, 19.7138671875, 20.465087890625, 21.21630859375, 21.967529296875, 22.71875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 6.0, 8.0, 11.0, 12.0, 18.0, 19.0, 24.0, 21.0, 33.0, 36.0, 44.0, 42.0, 68.0, 59.0, 115.0, 419.0, 1585.0, 126.0, 65.0, 64.0, 42.0, 41.0, 36.0, 33.0, 25.0, 25.0, 19.0, 11.0, 12.0, 8.0, 3.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.3125, -74.13671875, -71.9609375, -69.78515625, -67.609375, -65.43359375, -63.2578125, -61.08203125, -58.90625, -56.73046875, -54.5546875, -52.37890625, -50.203125, -48.02734375, -45.8515625, -43.67578125, -41.5, -39.32421875, -37.1484375, -34.97265625, -32.796875, -30.62109375, -28.4453125, -26.26953125, -24.09375, -21.91796875, -19.7421875, -17.56640625, -15.390625, -13.21484375, -11.0390625, -8.86328125, -6.6875, -4.51171875, -2.3359375, -0.16015625, 2.015625, 4.19140625, 6.3671875, 8.54296875, 10.71875, 12.89453125, 15.0703125, 17.24609375, 19.421875, 21.59765625, 23.7734375, 25.94921875, 28.125, 30.30078125, 32.4765625, 34.65234375, 36.828125, 39.00390625, 41.1796875, 43.35546875, 45.53125, 47.70703125, 49.8828125, 52.05859375, 54.234375, 56.41015625, 58.5859375, 60.76171875, 62.9375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 11.0, 9.0, 4.0, 10.0, 17.0, 30.0, 37.0, 47.0, 61.0, 88.0, 115.0, 146.0, 232.0, 415.0, 845.0, 4301.0, 2116383.0, 1017412.0, 3465.0, 768.0, 413.0, 251.0, 161.0, 115.0, 90.0, 78.0, 47.0, 33.0, 40.0, 19.0, 21.0, 16.0, 5.0, 8.0, 7.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-85.3125, -82.3671875, -79.421875, -76.4765625, -73.53125, -70.5859375, -67.640625, -64.6953125, -61.75, -58.8046875, -55.859375, -52.9140625, -49.96875, -47.0234375, -44.078125, -41.1328125, -38.1875, -35.2421875, -32.296875, -29.3515625, -26.40625, -23.4609375, -20.515625, -17.5703125, -14.625, -11.6796875, -8.734375, -5.7890625, -2.84375, 0.1015625, 3.046875, 5.9921875, 8.9375, 11.8828125, 14.828125, 17.7734375, 20.71875, 23.6640625, 26.609375, 29.5546875, 32.5, 35.4453125, 38.390625, 41.3359375, 44.28125, 47.2265625, 50.171875, 53.1171875, 56.0625, 59.0078125, 61.953125, 64.8984375, 67.84375, 70.7890625, 73.734375, 76.6796875, 79.625, 82.5703125, 85.515625, 88.4609375, 91.40625, 94.3515625, 97.296875, 100.2421875, 103.1875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 63.0, 600.0, 342.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.21719360351562, -145.96815490722656, -136.71913146972656, -127.4700927734375, -118.22106170654297, -108.97203063964844, -99.72299194335938, -90.47396087646484, -81.22492980957031, -71.97589874267578, -62.726863861083984, -53.47782897949219, -44.228797912597656, -34.979766845703125, -25.730731964111328, -16.48169708251953, -7.232666015625, 2.016366958618164, 11.265399932861328, 20.514432907104492, 29.763465881347656, 39.01249694824219, 48.261531829833984, 57.51056671142578, 66.75959777832031, 76.00862884521484, 85.25765991210938, 94.50669860839844, 103.75572967529297, 113.0047607421875, 122.25379943847656, 131.50283813476562, 140.7518310546875, 150.00086975097656, 159.24989318847656, 168.49893188476562, 177.74795532226562, 186.9969940185547, 196.24603271484375, 205.49505615234375, 214.7440948486328, 223.99313354492188, 233.24215698242188, 242.49119567871094, 251.740234375, 260.9892578125, 270.23828125, 279.4873352050781, 288.7363586425781, 297.9853820800781, 307.23443603515625, 316.48345947265625, 325.73248291015625, 334.98150634765625, 344.2305603027344, 353.4795837402344, 362.7286376953125, 371.9776611328125, 381.2267150878906, 390.4757385253906, 399.7247619628906, 408.97381591796875, 418.22283935546875, 427.47186279296875, 436.72088623046875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 7.0, 15.0, 13.0, 16.0, 35.0, 23.0, 33.0, 27.0, 37.0, 27.0, 49.0, 41.0, 45.0, 44.0, 63.0, 40.0, 51.0, 45.0, 50.0, 36.0, 32.0, 32.0, 28.0, 30.0, 22.0, 29.0, 23.0, 15.0, 12.0, 10.0, 14.0, 11.0, 10.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-164.99261474609375, -160.4075927734375, -155.8225555419922, -151.23751831054688, -146.65249633789062, -142.06747436523438, -137.48243713378906, -132.89739990234375, -128.3123779296875, -123.72734832763672, -119.14231872558594, -114.55728912353516, -109.97225952148438, -105.3872299194336, -100.80220031738281, -96.21717071533203, -91.63214111328125, -87.04711151123047, -82.46208190917969, -77.8770523071289, -73.29202270507812, -68.70699310302734, -64.12196350097656, -59.53693389892578, -54.951904296875, -50.36687469482422, -45.78184509277344, -41.196815490722656, -36.611785888671875, -32.026756286621094, -27.441726684570312, -22.85669708251953, -18.271652221679688, -13.686622619628906, -9.101593017578125, -4.516563415527344, 0.0684661865234375, 4.653495788574219, 9.238525390625, 13.823554992675781, 18.408584594726562, 22.993614196777344, 27.578643798828125, 32.163673400878906, 36.74870300292969, 41.33373260498047, 45.91876220703125, 50.50379180908203, 55.08882141113281, 59.673851013183594, 64.25888061523438, 68.84391021728516, 73.42893981933594, 78.01396942138672, 82.5989990234375, 87.18402862548828, 91.76905822753906, 96.35408782958984, 100.93911743164062, 105.5241470336914, 110.10917663574219, 114.69420623779297, 119.27923583984375, 123.86426544189453, 128.4492950439453]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 6.0, 9.0, 9.0, 17.0, 11.0, 10.0, 15.0, 21.0, 29.0, 13.0, 21.0, 35.0, 22.0, 31.0, 26.0, 42.0, 36.0, 47.0, 43.0, 38.0, 47.0, 41.0, 45.0, 53.0, 40.0, 42.0, 22.0, 26.0, 26.0, 32.0, 19.0, 25.0, 13.0, 15.0, 17.0, 15.0, 11.0, 6.0, 7.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.19580078125, -16.5791015625, -15.96240234375, -15.345703125, -14.72900390625, -14.1123046875, -13.49560546875, -12.87890625, -12.26220703125, -11.6455078125, -11.02880859375, -10.412109375, -9.79541015625, -9.1787109375, -8.56201171875, -7.9453125, -7.32861328125, -6.7119140625, -6.09521484375, -5.478515625, -4.86181640625, -4.2451171875, -3.62841796875, -3.01171875, -2.39501953125, -1.7783203125, -1.16162109375, -0.544921875, 0.07177734375, 0.6884765625, 1.30517578125, 1.921875, 2.53857421875, 3.1552734375, 3.77197265625, 4.388671875, 5.00537109375, 5.6220703125, 6.23876953125, 6.85546875, 7.47216796875, 8.0888671875, 8.70556640625, 9.322265625, 9.93896484375, 10.5556640625, 11.17236328125, 11.7890625, 12.40576171875, 13.0224609375, 13.63916015625, 14.255859375, 14.87255859375, 15.4892578125, 16.10595703125, 16.72265625, 17.33935546875, 17.9560546875, 18.57275390625, 19.189453125, 19.80615234375, 20.4228515625, 21.03955078125, 21.65625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 8.0, 1.0, 5.0, 12.0, 6.0, 18.0, 15.0, 14.0, 30.0, 24.0, 40.0, 33.0, 56.0, 68.0, 87.0, 117.0, 160.0, 212.0, 280.0, 309.0, 420.0, 1244.0, 4187377.0, 1756.0, 448.0, 337.0, 275.0, 187.0, 159.0, 136.0, 88.0, 65.0, 65.0, 44.0, 34.0, 24.0, 19.0, 21.0, 14.0, 13.0, 13.0, 10.0, 6.0, 8.0, 2.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-719.5, -696.7109375, -673.921875, -651.1328125, -628.34375, -605.5546875, -582.765625, -559.9765625, -537.1875, -514.3984375, -491.609375, -468.8203125, -446.03125, -423.2421875, -400.453125, -377.6640625, -354.875, -332.0859375, -309.296875, -286.5078125, -263.71875, -240.9296875, -218.140625, -195.3515625, -172.5625, -149.7734375, -126.984375, -104.1953125, -81.40625, -58.6171875, -35.828125, -13.0390625, 9.75, 32.5390625, 55.328125, 78.1171875, 100.90625, 123.6953125, 146.484375, 169.2734375, 192.0625, 214.8515625, 237.640625, 260.4296875, 283.21875, 306.0078125, 328.796875, 351.5859375, 374.375, 397.1640625, 419.953125, 442.7421875, 465.53125, 488.3203125, 511.109375, 533.8984375, 556.6875, 579.4765625, 602.265625, 625.0546875, 647.84375, 670.6328125, 693.421875, 716.2109375, 739.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 5.0, 6.0, 7.0, 13.0, 17.0, 26.0, 30.0, 42.0, 52.0, 66.0, 118.0, 130.0, 259.0, 419.0, 672.0, 770.0, 560.0, 296.0, 157.0, 133.0, 87.0, 56.0, 40.0, 22.0, 17.0, 17.0, 12.0, 15.0, 5.0, 12.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.9375, -35.7900390625, -34.642578125, -33.4951171875, -32.34765625, -31.2001953125, -30.052734375, -28.9052734375, -27.7578125, -26.6103515625, -25.462890625, -24.3154296875, -23.16796875, -22.0205078125, -20.873046875, -19.7255859375, -18.578125, -17.4306640625, -16.283203125, -15.1357421875, -13.98828125, -12.8408203125, -11.693359375, -10.5458984375, -9.3984375, -8.2509765625, -7.103515625, -5.9560546875, -4.80859375, -3.6611328125, -2.513671875, -1.3662109375, -0.21875, 0.9287109375, 2.076171875, 3.2236328125, 4.37109375, 5.5185546875, 6.666015625, 7.8134765625, 8.9609375, 10.1083984375, 11.255859375, 12.4033203125, 13.55078125, 14.6982421875, 15.845703125, 16.9931640625, 18.140625, 19.2880859375, 20.435546875, 21.5830078125, 22.73046875, 23.8779296875, 25.025390625, 26.1728515625, 27.3203125, 28.4677734375, 29.615234375, 30.7626953125, 31.91015625, 33.0576171875, 34.205078125, 35.3525390625, 36.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 9.0, 5.0, 7.0, 10.0, 7.0, 20.0, 14.0, 25.0, 32.0, 37.0, 49.0, 55.0, 75.0, 68.0, 175.0, 784.0, 4185804.0, 6349.0, 260.0, 115.0, 81.0, 47.0, 48.0, 39.0, 49.0, 26.0, 15.0, 13.0, 14.0, 17.0, 12.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-548.0, -533.46484375, -518.9296875, -504.39453125, -489.859375, -475.32421875, -460.7890625, -446.25390625, -431.71875, -417.18359375, -402.6484375, -388.11328125, -373.578125, -359.04296875, -344.5078125, -329.97265625, -315.4375, -300.90234375, -286.3671875, -271.83203125, -257.296875, -242.76171875, -228.2265625, -213.69140625, -199.15625, -184.62109375, -170.0859375, -155.55078125, -141.015625, -126.48046875, -111.9453125, -97.41015625, -82.875, -68.33984375, -53.8046875, -39.26953125, -24.734375, -10.19921875, 4.3359375, 18.87109375, 33.40625, 47.94140625, 62.4765625, 77.01171875, 91.546875, 106.08203125, 120.6171875, 135.15234375, 149.6875, 164.22265625, 178.7578125, 193.29296875, 207.828125, 222.36328125, 236.8984375, 251.43359375, 265.96875, 280.50390625, 295.0390625, 309.57421875, 324.109375, 338.64453125, 353.1796875, 367.71484375, 382.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 781.0, 229.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1926.530029296875, -1891.3984375, -1856.266845703125, -1821.1353759765625, -1786.0037841796875, -1750.8721923828125, -1715.74072265625, -1680.609130859375, -1645.4775390625, -1610.345947265625, -1575.21435546875, -1540.0828857421875, -1504.9512939453125, -1469.8197021484375, -1434.688232421875, -1399.556640625, -1364.425048828125, -1329.29345703125, -1294.161865234375, -1259.0303955078125, -1223.8988037109375, -1188.7672119140625, -1153.6357421875, -1118.504150390625, -1083.37255859375, -1048.240966796875, -1013.1094360351562, -977.9779052734375, -942.8463134765625, -907.7147216796875, -872.5831909179688, -837.45166015625, -802.3201904296875, -767.1885986328125, -732.0570678710938, -696.925537109375, -661.7939453125, -626.662353515625, -591.5308227539062, -556.3992919921875, -521.2677001953125, -486.1361389160156, -451.00457763671875, -415.8730163574219, -380.741455078125, -345.6098937988281, -310.47833251953125, -275.3467712402344, -240.21517944335938, -205.0836181640625, -169.95205688476562, -134.82049560546875, -99.68893432617188, -64.557373046875, -29.425811767578125, 5.70574951171875, 40.837310791015625, 75.9688720703125, 111.10043334960938, 146.23199462890625, 181.36355590820312, 216.4951171875, 251.62667846679688, 286.75823974609375, 321.8898010253906]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 12.0, 10.0, 7.0, 15.0, 13.0, 24.0, 19.0, 21.0, 24.0, 28.0, 33.0, 32.0, 34.0, 41.0, 25.0, 32.0, 41.0, 37.0, 37.0, 50.0, 41.0, 37.0, 33.0, 44.0, 24.0, 37.0, 29.0, 32.0, 21.0, 27.0, 26.0, 16.0, 22.0, 8.0, 5.0, 13.0, 9.0, 6.0, 11.0, 7.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-109.19889831542969, -105.59849548339844, -101.99808502197266, -98.3976821899414, -94.79727935791016, -91.19686889648438, -87.59646606445312, -83.99606323242188, -80.39566040039062, -76.79525756835938, -73.1948471069336, -69.59444427490234, -65.9940414428711, -62.39363479614258, -58.79322814941406, -55.19282531738281, -51.5924186706543, -47.99201202392578, -44.39160919189453, -40.791202545166016, -37.190799713134766, -33.59039306640625, -29.989988327026367, -26.389583587646484, -22.7891788482666, -19.18877410888672, -15.588369369506836, -11.987963676452637, -8.387558937072754, -4.787153244018555, -1.1867485046386719, 2.413656234741211, 6.014060974121094, 9.614465713500977, 13.21487045288086, 16.815277099609375, 20.415679931640625, 24.01608657836914, 27.616491317749023, 31.216896057128906, 34.817298889160156, 38.41770553588867, 42.01810836791992, 45.61851501464844, 49.21891784667969, 52.8193244934082, 56.41973114013672, 60.02013397216797, 63.620540618896484, 67.220947265625, 70.82135009765625, 74.4217529296875, 78.02216339111328, 81.62256622314453, 85.22296905517578, 88.82337951660156, 92.42378234863281, 96.02418518066406, 99.62459564208984, 103.2249984741211, 106.82540130615234, 110.42581176757812, 114.02621459960938, 117.62661743164062, 121.22702026367188]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 9.0, 6.0, 7.0, 7.0, 12.0, 15.0, 20.0, 17.0, 26.0, 23.0, 24.0, 24.0, 25.0, 31.0, 37.0, 41.0, 39.0, 43.0, 43.0, 35.0, 59.0, 46.0, 52.0, 35.0, 36.0, 23.0, 35.0, 25.0, 38.0, 29.0, 23.0, 23.0, 16.0, 17.0, 12.0, 8.0, 9.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.40625, -17.7666015625, -17.126953125, -16.4873046875, -15.84765625, -15.2080078125, -14.568359375, -13.9287109375, -13.2890625, -12.6494140625, -12.009765625, -11.3701171875, -10.73046875, -10.0908203125, -9.451171875, -8.8115234375, -8.171875, -7.5322265625, -6.892578125, -6.2529296875, -5.61328125, -4.9736328125, -4.333984375, -3.6943359375, -3.0546875, -2.4150390625, -1.775390625, -1.1357421875, -0.49609375, 0.1435546875, 0.783203125, 1.4228515625, 2.0625, 2.7021484375, 3.341796875, 3.9814453125, 4.62109375, 5.2607421875, 5.900390625, 6.5400390625, 7.1796875, 7.8193359375, 8.458984375, 9.0986328125, 9.73828125, 10.3779296875, 11.017578125, 11.6572265625, 12.296875, 12.9365234375, 13.576171875, 14.2158203125, 14.85546875, 15.4951171875, 16.134765625, 16.7744140625, 17.4140625, 18.0537109375, 18.693359375, 19.3330078125, 19.97265625, 20.6123046875, 21.251953125, 21.8916015625, 22.53125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 4.0, 8.0, 3.0, 7.0, 14.0, 15.0, 24.0, 39.0, 42.0, 61.0, 86.0, 155.0, 192.0, 318.0, 438.0, 691.0, 1019.0, 1532.0, 2378.0, 3625.0, 5555.0, 8874.0, 13742.0, 21304.0, 33654.0, 56547.0, 104699.0, 258083.0, 273884.0, 107494.0, 58261.0, 34796.0, 21599.0, 13911.0, 8830.0, 5717.0, 3698.0, 2380.0, 1616.0, 1079.0, 694.0, 477.0, 326.0, 213.0, 161.0, 107.0, 73.0, 51.0, 25.0, 25.0, 15.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.9609375, -4.801025390625, -4.64111328125, -4.481201171875, -4.3212890625, -4.161376953125, -4.00146484375, -3.841552734375, -3.681640625, -3.521728515625, -3.36181640625, -3.201904296875, -3.0419921875, -2.882080078125, -2.72216796875, -2.562255859375, -2.40234375, -2.242431640625, -2.08251953125, -1.922607421875, -1.7626953125, -1.602783203125, -1.44287109375, -1.282958984375, -1.123046875, -0.963134765625, -0.80322265625, -0.643310546875, -0.4833984375, -0.323486328125, -0.16357421875, -0.003662109375, 0.15625, 0.316162109375, 0.47607421875, 0.635986328125, 0.7958984375, 0.955810546875, 1.11572265625, 1.275634765625, 1.435546875, 1.595458984375, 1.75537109375, 1.915283203125, 2.0751953125, 2.235107421875, 2.39501953125, 2.554931640625, 2.71484375, 2.874755859375, 3.03466796875, 3.194580078125, 3.3544921875, 3.514404296875, 3.67431640625, 3.834228515625, 3.994140625, 4.154052734375, 4.31396484375, 4.473876953125, 4.6337890625, 4.793701171875, 4.95361328125, 5.113525390625, 5.2734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 12.0, 13.0, 7.0, 17.0, 10.0, 19.0, 23.0, 23.0, 25.0, 36.0, 26.0, 27.0, 37.0, 58.0, 44.0, 43.0, 43.0, 1059.0, 38.0, 48.0, 43.0, 41.0, 32.0, 30.0, 26.0, 23.0, 24.0, 24.0, 26.0, 25.0, 25.0, 17.0, 8.0, 10.0, 12.0, 6.0, 9.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.609375, -13.214599609375, -12.81982421875, -12.425048828125, -12.0302734375, -11.635498046875, -11.24072265625, -10.845947265625, -10.451171875, -10.056396484375, -9.66162109375, -9.266845703125, -8.8720703125, -8.477294921875, -8.08251953125, -7.687744140625, -7.29296875, -6.898193359375, -6.50341796875, -6.108642578125, -5.7138671875, -5.319091796875, -4.92431640625, -4.529541015625, -4.134765625, -3.739990234375, -3.34521484375, -2.950439453125, -2.5556640625, -2.160888671875, -1.76611328125, -1.371337890625, -0.9765625, -0.581787109375, -0.18701171875, 0.207763671875, 0.6025390625, 0.997314453125, 1.39208984375, 1.786865234375, 2.181640625, 2.576416015625, 2.97119140625, 3.365966796875, 3.7607421875, 4.155517578125, 4.55029296875, 4.945068359375, 5.33984375, 5.734619140625, 6.12939453125, 6.524169921875, 6.9189453125, 7.313720703125, 7.70849609375, 8.103271484375, 8.498046875, 8.892822265625, 9.28759765625, 9.682373046875, 10.0771484375, 10.471923828125, 10.86669921875, 11.261474609375, 11.65625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 12.0, 25.0, 28.0, 35.0, 51.0, 80.0, 118.0, 171.0, 263.0, 351.0, 532.0, 808.0, 1252.0, 1831.0, 2861.0, 4611.0, 7144.0, 11425.0, 18492.0, 30241.0, 49848.0, 88510.0, 191000.0, 1386723.0, 129951.0, 66820.0, 39256.0, 24335.0, 14913.0, 9022.0, 5871.0, 3677.0, 2248.0, 1502.0, 967.0, 669.0, 449.0, 317.0, 216.0, 141.0, 95.0, 83.0, 45.0, 45.0, 27.0, 19.0, 11.0, 5.0, 6.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.109375, -4.94598388671875, -4.7825927734375, -4.61920166015625, -4.455810546875, -4.29241943359375, -4.1290283203125, -3.96563720703125, -3.80224609375, -3.63885498046875, -3.4754638671875, -3.31207275390625, -3.148681640625, -2.98529052734375, -2.8218994140625, -2.65850830078125, -2.4951171875, -2.33172607421875, -2.1683349609375, -2.00494384765625, -1.841552734375, -1.67816162109375, -1.5147705078125, -1.35137939453125, -1.18798828125, -1.02459716796875, -0.8612060546875, -0.69781494140625, -0.534423828125, -0.37103271484375, -0.2076416015625, -0.04425048828125, 0.119140625, 0.28253173828125, 0.4459228515625, 0.60931396484375, 0.772705078125, 0.93609619140625, 1.0994873046875, 1.26287841796875, 1.42626953125, 1.58966064453125, 1.7530517578125, 1.91644287109375, 2.079833984375, 2.24322509765625, 2.4066162109375, 2.57000732421875, 2.7333984375, 2.89678955078125, 3.0601806640625, 3.22357177734375, 3.386962890625, 3.55035400390625, 3.7137451171875, 3.87713623046875, 4.04052734375, 4.20391845703125, 4.3673095703125, 4.53070068359375, 4.694091796875, 4.85748291015625, 5.0208740234375, 5.18426513671875, 5.34765625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 1.0, 5.0, 9.0, 8.0, 13.0, 13.0, 25.0, 18.0, 21.0, 38.0, 35.0, 41.0, 55.0, 77.0, 91.0, 86.0, 78.0, 59.0, 60.0, 47.0, 45.0, 30.0, 17.0, 21.0, 25.0, 12.0, 12.0, 4.0, 5.0, 6.0, 4.0, 6.0, 5.0, 2.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002590179443359375, -0.002496868371963501, -0.002403557300567627, -0.002310246229171753, -0.002216935157775879, -0.002123624086380005, -0.002030313014984131, -0.0019370019435882568, -0.0018436908721923828, -0.0017503798007965088, -0.0016570687294006348, -0.0015637576580047607, -0.0014704465866088867, -0.0013771355152130127, -0.0012838244438171387, -0.0011905133724212646, -0.0010972023010253906, -0.0010038912296295166, -0.0009105801582336426, -0.0008172690868377686, -0.0007239580154418945, -0.0006306469440460205, -0.0005373358726501465, -0.00044402480125427246, -0.00035071372985839844, -0.0002574026584625244, -0.0001640915870666504, -7.078051567077637e-05, 2.2530555725097656e-05, 0.00011584162712097168, 0.0002091526985168457, 0.0003024637699127197, 0.00039577484130859375, 0.0004890859127044678, 0.0005823969841003418, 0.0006757080554962158, 0.0007690191268920898, 0.0008623301982879639, 0.0009556412696838379, 0.001048952341079712, 0.001142263412475586, 0.00123557448387146, 0.001328885555267334, 0.001422196626663208, 0.001515507698059082, 0.001608818769454956, 0.00170212984085083, 0.001795440912246704, 0.0018887519836425781, 0.001982063055038452, 0.002075374126434326, 0.0021686851978302, 0.0022619962692260742, 0.0023553073406219482, 0.0024486184120178223, 0.0025419294834136963, 0.0026352405548095703, 0.0027285516262054443, 0.0028218626976013184, 0.0029151737689971924, 0.0030084848403930664, 0.0031017959117889404, 0.0031951069831848145, 0.0032884180545806885, 0.0033817291259765625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 3.0, 12.0, 12.0, 7.0, 9.0, 23.0, 14.0, 17.0, 30.0, 37.0, 74.0, 69.0, 106.0, 104.0, 179.0, 294.0, 416.0, 944.0, 63625.0, 978326.0, 2410.0, 623.0, 366.0, 199.0, 153.0, 97.0, 84.0, 72.0, 50.0, 36.0, 32.0, 19.0, 13.0, 19.0, 9.0, 5.0, 6.0, 7.0, 10.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0], "bins": [-0.05828857421875, -0.05667877197265625, -0.0550689697265625, -0.05345916748046875, -0.051849365234375, -0.05023956298828125, -0.0486297607421875, -0.04701995849609375, -0.04541015625, -0.04380035400390625, -0.0421905517578125, -0.04058074951171875, -0.038970947265625, -0.03736114501953125, -0.0357513427734375, -0.03414154052734375, -0.03253173828125, -0.03092193603515625, -0.0293121337890625, -0.02770233154296875, -0.026092529296875, -0.02448272705078125, -0.0228729248046875, -0.02126312255859375, -0.0196533203125, -0.01804351806640625, -0.0164337158203125, -0.01482391357421875, -0.013214111328125, -0.01160430908203125, -0.0099945068359375, -0.00838470458984375, -0.00677490234375, -0.00516510009765625, -0.0035552978515625, -0.00194549560546875, -0.000335693359375, 0.00127410888671875, 0.0028839111328125, 0.00449371337890625, 0.006103515625, 0.00771331787109375, 0.0093231201171875, 0.01093292236328125, 0.012542724609375, 0.01415252685546875, 0.0157623291015625, 0.01737213134765625, 0.01898193359375, 0.02059173583984375, 0.0222015380859375, 0.02381134033203125, 0.025421142578125, 0.02703094482421875, 0.0286407470703125, 0.03025054931640625, 0.0318603515625, 0.03347015380859375, 0.0350799560546875, 0.03668975830078125, 0.038299560546875, 0.03990936279296875, 0.0415191650390625, 0.04312896728515625, 0.04473876953125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 34.0, 603.0, 366.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008557157590985298, -0.008226508274674416, -0.007895859889686108, -0.007565210573375225, -0.00723456172272563, -0.0069039128720760345, -0.006573263555765152, -0.006242614705115557, -0.0059119658544659615, -0.005581317003816366, -0.005250668153166771, -0.004920018836855888, -0.004589369986206293, -0.004258721135556698, -0.003928071819245815, -0.00359742296859622, -0.0032667741179466248, -0.0029361252672970295, -0.0026054761838167906, -0.0022748271003365517, -0.0019441782496869564, -0.0016135292826220393, -0.0012828803155571222, -0.0009522312320768833, -0.0006215823814272881, -0.00029093341436237097, 3.971555270254612e-05, 0.0003703645197674632, 0.0007010134868323803, 0.0010316624538972974, 0.0013623114209622145, 0.0016929605044424534, 0.0020236093550920486, 0.002354258205741644, 0.002684907289221883, 0.0030155563727021217, 0.003346205223351717, 0.0036768540740013123, 0.004007503390312195, 0.00433815224096179, 0.004668801091611385, 0.004999449942260981, 0.005330098792910576, 0.0056607481092214584, 0.005991396959871054, 0.006322045810520649, 0.0066526951268315315, 0.006983343977481127, 0.007313992828130722, 0.007644641678780317, 0.007975290529429913, 0.008305939845740795, 0.008636588230729103, 0.008967237547039986, 0.009297886863350868, 0.00962853617966175, 0.009959184564650059, 0.010289833880960941, 0.01062048226594925, 0.010951131582260132, 0.011281780898571014, 0.011612429283559322, 0.011943078599870205, 0.012273726984858513, 0.012604376301169395]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 8.0, 10.0, 10.0, 15.0, 22.0, 13.0, 17.0, 32.0, 16.0, 24.0, 30.0, 32.0, 35.0, 35.0, 34.0, 34.0, 38.0, 38.0, 56.0, 42.0, 46.0, 44.0, 46.0, 40.0, 36.0, 33.0, 31.0, 22.0, 18.0, 27.0, 23.0, 12.0, 13.0, 14.0, 8.0, 11.0, 2.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015007257461547852, -0.0014536334201693535, -0.0014065410941839218, -0.0013594487681984901, -0.0013123564422130585, -0.0012652641162276268, -0.0012181717902421951, -0.0011710794642567635, -0.0011239871382713318, -0.0010768948122859001, -0.0010298024863004684, -0.0009827101603150368, -0.0009356178343296051, -0.0008885255083441734, -0.0008414331823587418, -0.0007943408563733101, -0.0007472485303878784, -0.0007001562044024467, -0.0006530638784170151, -0.0006059715524315834, -0.0005588792264461517, -0.0005117869004607201, -0.0004646945744752884, -0.0004176022484898567, -0.00037050992250442505, -0.0003234175965189934, -0.0002763252705335617, -0.00022923294454813004, -0.00018214061856269836, -0.0001350482925772667, -8.795596659183502e-05, -4.086364060640335e-05, 6.22868537902832e-06, 5.332101136445999e-05, 0.00010041333734989166, 0.00014750566333532333, 0.000194597989320755, 0.00024169031530618668, 0.00028878264129161835, 0.00033587496727705, 0.0003829672932624817, 0.00043005961924791336, 0.00047715194523334503, 0.0005242442712187767, 0.0005713365972042084, 0.00061842892318964, 0.0006655212491750717, 0.0007126135751605034, 0.0007597059011459351, 0.0008067982271313667, 0.0008538905531167984, 0.0009009828791022301, 0.0009480752050876617, 0.0009951675310730934, 0.001042259857058525, 0.0010893521830439568, 0.0011364445090293884, 0.00118353683501482, 0.0012306291610002518, 0.0012777214869856834, 0.0013248138129711151, 0.0013719061389565468, 0.0014189984649419785, 0.0014660907909274101, 0.0015131831169128418]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 9.0, 6.0, 7.0, 7.0, 12.0, 15.0, 20.0, 17.0, 26.0, 23.0, 24.0, 24.0, 25.0, 31.0, 37.0, 41.0, 39.0, 43.0, 43.0, 35.0, 59.0, 46.0, 51.0, 36.0, 36.0, 23.0, 35.0, 25.0, 38.0, 29.0, 23.0, 23.0, 16.0, 17.0, 12.0, 8.0, 9.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.40625, -17.7666015625, -17.126953125, -16.4873046875, -15.84765625, -15.2080078125, -14.568359375, -13.9287109375, -13.2890625, -12.6494140625, -12.009765625, -11.3701171875, -10.73046875, -10.0908203125, -9.451171875, -8.8115234375, -8.171875, -7.5322265625, -6.892578125, -6.2529296875, -5.61328125, -4.9736328125, -4.333984375, -3.6943359375, -3.0546875, -2.4150390625, -1.775390625, -1.1357421875, -0.49609375, 0.1435546875, 0.783203125, 1.4228515625, 2.0625, 2.7021484375, 3.341796875, 3.9814453125, 4.62109375, 5.2607421875, 5.900390625, 6.5400390625, 7.1796875, 7.8193359375, 8.458984375, 9.0986328125, 9.73828125, 10.3779296875, 11.017578125, 11.6572265625, 12.296875, 12.9365234375, 13.576171875, 14.2158203125, 14.85546875, 15.4951171875, 16.134765625, 16.7744140625, 17.4140625, 18.0537109375, 18.693359375, 19.3330078125, 19.97265625, 20.6123046875, 21.251953125, 21.8916015625, 22.53125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 14.0, 14.0, 22.0, 30.0, 49.0, 61.0, 73.0, 90.0, 157.0, 177.0, 272.0, 346.0, 495.0, 634.0, 821.0, 1012.0, 1496.0, 2768.0, 9117.0, 66735.0, 534497.0, 373951.0, 41375.0, 6594.0, 2347.0, 1309.0, 1017.0, 769.0, 598.0, 466.0, 344.0, 238.0, 171.0, 130.0, 102.0, 67.0, 55.0, 31.0, 34.0, 18.0, 17.0, 7.0, 8.0, 3.0, 6.0, 0.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-32.5625, -31.54150390625, -30.5205078125, -29.49951171875, -28.478515625, -27.45751953125, -26.4365234375, -25.41552734375, -24.39453125, -23.37353515625, -22.3525390625, -21.33154296875, -20.310546875, -19.28955078125, -18.2685546875, -17.24755859375, -16.2265625, -15.20556640625, -14.1845703125, -13.16357421875, -12.142578125, -11.12158203125, -10.1005859375, -9.07958984375, -8.05859375, -7.03759765625, -6.0166015625, -4.99560546875, -3.974609375, -2.95361328125, -1.9326171875, -0.91162109375, 0.109375, 1.13037109375, 2.1513671875, 3.17236328125, 4.193359375, 5.21435546875, 6.2353515625, 7.25634765625, 8.27734375, 9.29833984375, 10.3193359375, 11.34033203125, 12.361328125, 13.38232421875, 14.4033203125, 15.42431640625, 16.4453125, 17.46630859375, 18.4873046875, 19.50830078125, 20.529296875, 21.55029296875, 22.5712890625, 23.59228515625, 24.61328125, 25.63427734375, 26.6552734375, 27.67626953125, 28.697265625, 29.71826171875, 30.7392578125, 31.76025390625, 32.78125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 11.0, 7.0, 10.0, 14.0, 16.0, 13.0, 14.0, 22.0, 28.0, 29.0, 32.0, 29.0, 42.0, 47.0, 49.0, 54.0, 95.0, 352.0, 1648.0, 117.0, 64.0, 45.0, 36.0, 41.0, 37.0, 36.0, 28.0, 20.0, 23.0, 17.0, 12.0, 16.0, 9.0, 5.0, 3.0, 7.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.71875, -56.83203125, -54.9453125, -53.05859375, -51.171875, -49.28515625, -47.3984375, -45.51171875, -43.625, -41.73828125, -39.8515625, -37.96484375, -36.078125, -34.19140625, -32.3046875, -30.41796875, -28.53125, -26.64453125, -24.7578125, -22.87109375, -20.984375, -19.09765625, -17.2109375, -15.32421875, -13.4375, -11.55078125, -9.6640625, -7.77734375, -5.890625, -4.00390625, -2.1171875, -0.23046875, 1.65625, 3.54296875, 5.4296875, 7.31640625, 9.203125, 11.08984375, 12.9765625, 14.86328125, 16.75, 18.63671875, 20.5234375, 22.41015625, 24.296875, 26.18359375, 28.0703125, 29.95703125, 31.84375, 33.73046875, 35.6171875, 37.50390625, 39.390625, 41.27734375, 43.1640625, 45.05078125, 46.9375, 48.82421875, 50.7109375, 52.59765625, 54.484375, 56.37109375, 58.2578125, 60.14453125, 62.03125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 4.0, 8.0, 16.0, 10.0, 14.0, 21.0, 25.0, 27.0, 34.0, 38.0, 49.0, 74.0, 85.0, 123.0, 213.0, 410.0, 926.0, 4828.0, 3129581.0, 6918.0, 999.0, 444.0, 223.0, 151.0, 111.0, 73.0, 59.0, 48.0, 44.0, 38.0, 22.0, 22.0, 16.0, 12.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-168.25, -163.37890625, -158.5078125, -153.63671875, -148.765625, -143.89453125, -139.0234375, -134.15234375, -129.28125, -124.41015625, -119.5390625, -114.66796875, -109.796875, -104.92578125, -100.0546875, -95.18359375, -90.3125, -85.44140625, -80.5703125, -75.69921875, -70.828125, -65.95703125, -61.0859375, -56.21484375, -51.34375, -46.47265625, -41.6015625, -36.73046875, -31.859375, -26.98828125, -22.1171875, -17.24609375, -12.375, -7.50390625, -2.6328125, 2.23828125, 7.109375, 11.98046875, 16.8515625, 21.72265625, 26.59375, 31.46484375, 36.3359375, 41.20703125, 46.078125, 50.94921875, 55.8203125, 60.69140625, 65.5625, 70.43359375, 75.3046875, 80.17578125, 85.046875, 89.91796875, 94.7890625, 99.66015625, 104.53125, 109.40234375, 114.2734375, 119.14453125, 124.015625, 128.88671875, 133.7578125, 138.62890625, 143.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 901.0, 113.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.2674560546875, -287.7272644042969, -263.18707275390625, -238.64686584472656, -214.10667419433594, -189.5664825439453, -165.02627563476562, -140.486083984375, -115.94589233398438, -91.40570068359375, -66.8655014038086, -42.32530212402344, -17.785110473632812, 6.7550811767578125, 31.2952880859375, 55.835479736328125, 80.37567138671875, 104.91586303710938, 129.4560546875, 153.9962615966797, 178.5364532470703, 203.07664489746094, 227.61685180664062, 252.15704345703125, 276.6972351074219, 301.2374267578125, 325.7776184082031, 350.31781005859375, 374.8580322265625, 399.398193359375, 423.93841552734375, 448.4786071777344, 473.018798828125, 497.5589904785156, 522.0991821289062, 546.639404296875, 571.1795654296875, 595.7197875976562, 620.260009765625, 644.8001708984375, 669.34033203125, 693.8805541992188, 718.4207153320312, 742.9609375, 767.5010986328125, 792.0413208007812, 816.58154296875, 841.1217041015625, 865.6619262695312, 890.2021484375, 914.7423095703125, 939.2825317382812, 963.8226928710938, 988.3629150390625, 1012.903076171875, 1037.443359375, 1061.9835205078125, 1086.523681640625, 1111.06396484375, 1135.6041259765625, 1160.144287109375, 1184.6844482421875, 1209.2247314453125, 1233.764892578125, 1258.3050537109375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 7.0, 2.0, 7.0, 17.0, 14.0, 16.0, 15.0, 30.0, 25.0, 21.0, 31.0, 37.0, 41.0, 33.0, 38.0, 49.0, 50.0, 45.0, 43.0, 45.0, 57.0, 38.0, 41.0, 30.0, 28.0, 36.0, 27.0, 19.0, 23.0, 19.0, 22.0, 20.0, 13.0, 10.0, 15.0, 5.0, 4.0, 4.0, 4.0, 1.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.41815185546875, -146.560791015625, -141.70343017578125, -136.8460693359375, -131.98870849609375, -127.13134765625, -122.27399444580078, -117.41663360595703, -112.55927276611328, -107.70191192626953, -102.84455108642578, -97.98719024658203, -93.12983703613281, -88.27247619628906, -83.41511535644531, -78.55775451660156, -73.70039367675781, -68.84303283691406, -63.98567199707031, -59.12831497192383, -54.27095413208008, -49.41359329223633, -44.556236267089844, -39.698875427246094, -34.841514587402344, -29.984153747558594, -25.126794815063477, -20.26943588256836, -15.41207504272461, -10.55471420288086, -5.697355270385742, -0.839996337890625, 4.0173797607421875, 8.874739646911621, 13.732099533081055, 18.589458465576172, 23.446819305419922, 28.304180145263672, 33.161537170410156, 38.018898010253906, 42.876258850097656, 47.733619689941406, 52.590980529785156, 57.44833755493164, 62.30569839477539, 67.16305541992188, 72.02041625976562, 76.87777709960938, 81.73513793945312, 86.59249877929688, 91.44985961914062, 96.30722045898438, 101.16458129882812, 106.02194213867188, 110.8792953491211, 115.73665618896484, 120.5940170288086, 125.45137786865234, 130.30873107910156, 135.1660919189453, 140.02345275878906, 144.8808135986328, 149.73817443847656, 154.5955352783203, 159.45289611816406]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 3.0, 5.0, 11.0, 11.0, 11.0, 8.0, 22.0, 15.0, 19.0, 19.0, 18.0, 25.0, 25.0, 25.0, 29.0, 30.0, 42.0, 41.0, 43.0, 41.0, 45.0, 44.0, 48.0, 37.0, 47.0, 33.0, 36.0, 28.0, 26.0, 28.0, 19.0, 25.0, 24.0, 18.0, 18.0, 12.0, 12.0, 13.0, 12.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-16.59375, -15.99951171875, -15.4052734375, -14.81103515625, -14.216796875, -13.62255859375, -13.0283203125, -12.43408203125, -11.83984375, -11.24560546875, -10.6513671875, -10.05712890625, -9.462890625, -8.86865234375, -8.2744140625, -7.68017578125, -7.0859375, -6.49169921875, -5.8974609375, -5.30322265625, -4.708984375, -4.11474609375, -3.5205078125, -2.92626953125, -2.33203125, -1.73779296875, -1.1435546875, -0.54931640625, 0.044921875, 0.63916015625, 1.2333984375, 1.82763671875, 2.421875, 3.01611328125, 3.6103515625, 4.20458984375, 4.798828125, 5.39306640625, 5.9873046875, 6.58154296875, 7.17578125, 7.77001953125, 8.3642578125, 8.95849609375, 9.552734375, 10.14697265625, 10.7412109375, 11.33544921875, 11.9296875, 12.52392578125, 13.1181640625, 13.71240234375, 14.306640625, 14.90087890625, 15.4951171875, 16.08935546875, 16.68359375, 17.27783203125, 17.8720703125, 18.46630859375, 19.060546875, 19.65478515625, 20.2490234375, 20.84326171875, 21.4375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 7.0, 0.0, 5.0, 5.0, 5.0, 13.0, 3.0, 15.0, 11.0, 26.0, 21.0, 29.0, 38.0, 44.0, 59.0, 71.0, 82.0, 91.0, 105.0, 137.0, 149.0, 194.0, 321.0, 798.0, 3113.0, 41856.0, 2844203.0, 1284106.0, 14762.0, 2066.0, 651.0, 296.0, 186.0, 129.0, 114.0, 94.0, 71.0, 84.0, 60.0, 49.0, 50.0, 28.0, 35.0, 21.0, 16.0, 23.0, 10.0, 5.0, 6.0, 11.0, 7.0, 6.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-72.875, -70.4345703125, -67.994140625, -65.5537109375, -63.11328125, -60.6728515625, -58.232421875, -55.7919921875, -53.3515625, -50.9111328125, -48.470703125, -46.0302734375, -43.58984375, -41.1494140625, -38.708984375, -36.2685546875, -33.828125, -31.3876953125, -28.947265625, -26.5068359375, -24.06640625, -21.6259765625, -19.185546875, -16.7451171875, -14.3046875, -11.8642578125, -9.423828125, -6.9833984375, -4.54296875, -2.1025390625, 0.337890625, 2.7783203125, 5.21875, 7.6591796875, 10.099609375, 12.5400390625, 14.98046875, 17.4208984375, 19.861328125, 22.3017578125, 24.7421875, 27.1826171875, 29.623046875, 32.0634765625, 34.50390625, 36.9443359375, 39.384765625, 41.8251953125, 44.265625, 46.7060546875, 49.146484375, 51.5869140625, 54.02734375, 56.4677734375, 58.908203125, 61.3486328125, 63.7890625, 66.2294921875, 68.669921875, 71.1103515625, 73.55078125, 75.9912109375, 78.431640625, 80.8720703125, 83.3125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 9.0, 10.0, 10.0, 15.0, 13.0, 24.0, 24.0, 48.0, 46.0, 63.0, 82.0, 134.0, 166.0, 235.0, 347.0, 465.0, 553.0, 467.0, 386.0, 245.0, 175.0, 128.0, 85.0, 85.0, 62.0, 47.0, 49.0, 28.0, 15.0, 15.0, 12.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.9375, -28.888671875, -27.83984375, -26.791015625, -25.7421875, -24.693359375, -23.64453125, -22.595703125, -21.546875, -20.498046875, -19.44921875, -18.400390625, -17.3515625, -16.302734375, -15.25390625, -14.205078125, -13.15625, -12.107421875, -11.05859375, -10.009765625, -8.9609375, -7.912109375, -6.86328125, -5.814453125, -4.765625, -3.716796875, -2.66796875, -1.619140625, -0.5703125, 0.478515625, 1.52734375, 2.576171875, 3.625, 4.673828125, 5.72265625, 6.771484375, 7.8203125, 8.869140625, 9.91796875, 10.966796875, 12.015625, 13.064453125, 14.11328125, 15.162109375, 16.2109375, 17.259765625, 18.30859375, 19.357421875, 20.40625, 21.455078125, 22.50390625, 23.552734375, 24.6015625, 25.650390625, 26.69921875, 27.748046875, 28.796875, 29.845703125, 30.89453125, 31.943359375, 32.9921875, 34.041015625, 35.08984375, 36.138671875, 37.1875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 10.0, 13.0, 27.0, 43.0, 45.0, 71.0, 70.0, 134.0, 328.0, 732.0, 4171.0, 3850383.0, 334855.0, 2241.0, 550.0, 210.0, 134.0, 77.0, 42.0, 40.0, 32.0, 24.0, 14.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.625, -199.890625, -194.15625, -188.421875, -182.6875, -176.953125, -171.21875, -165.484375, -159.75, -154.015625, -148.28125, -142.546875, -136.8125, -131.078125, -125.34375, -119.609375, -113.875, -108.140625, -102.40625, -96.671875, -90.9375, -85.203125, -79.46875, -73.734375, -68.0, -62.265625, -56.53125, -50.796875, -45.0625, -39.328125, -33.59375, -27.859375, -22.125, -16.390625, -10.65625, -4.921875, 0.8125, 6.546875, 12.28125, 18.015625, 23.75, 29.484375, 35.21875, 40.953125, 46.6875, 52.421875, 58.15625, 63.890625, 69.625, 75.359375, 81.09375, 86.828125, 92.5625, 98.296875, 104.03125, 109.765625, 115.5, 121.234375, 126.96875, 132.703125, 138.4375, 144.171875, 149.90625, 155.640625, 161.375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 166.0, 666.0, 167.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-939.5484008789062, -921.32373046875, -903.0990600585938, -884.8743896484375, -866.6497192382812, -848.425048828125, -830.2003784179688, -811.9757080078125, -793.7510375976562, -775.5263671875, -757.3016967773438, -739.0770263671875, -720.8523559570312, -702.627685546875, -684.4030151367188, -666.1783447265625, -647.9536743164062, -629.72900390625, -611.5043334960938, -593.2796630859375, -575.0549926757812, -556.830322265625, -538.6056518554688, -520.3809814453125, -502.15631103515625, -483.931640625, -465.70697021484375, -447.4822998046875, -429.25762939453125, -411.032958984375, -392.80828857421875, -374.5836181640625, -356.35894775390625, -338.13427734375, -319.90960693359375, -301.6849365234375, -283.46026611328125, -265.235595703125, -247.01092529296875, -228.7862548828125, -210.56158447265625, -192.3369140625, -174.11224365234375, -155.8875732421875, -137.66290283203125, -119.438232421875, -101.21356201171875, -82.9888916015625, -64.76422119140625, -46.53955078125, -28.31488037109375, -10.0902099609375, 8.13446044921875, 26.359130859375, 44.58380126953125, 62.8084716796875, 81.03314208984375, 99.2578125, 117.48248291015625, 135.7071533203125, 153.93182373046875, 172.156494140625, 190.38116455078125, 208.6058349609375, 226.83050537109375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 7.0, 11.0, 15.0, 12.0, 13.0, 17.0, 18.0, 27.0, 26.0, 34.0, 36.0, 29.0, 42.0, 46.0, 38.0, 39.0, 38.0, 44.0, 37.0, 42.0, 45.0, 35.0, 29.0, 49.0, 37.0, 28.0, 37.0, 36.0, 14.0, 10.0, 14.0, 13.0, 13.0, 13.0, 5.0, 8.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.36776733398438, -124.41398620605469, -120.460205078125, -116.50642395019531, -112.55264282226562, -108.59886169433594, -104.64508056640625, -100.69129943847656, -96.73751831054688, -92.78373718261719, -88.8299560546875, -84.87617492675781, -80.92239379882812, -76.96861267089844, -73.01483154296875, -69.06105041503906, -65.1072769165039, -61.15349578857422, -57.19971466064453, -53.245933532714844, -49.292152404785156, -45.33837127685547, -41.38459396362305, -37.43081283569336, -33.47703170776367, -29.523250579833984, -25.569469451904297, -21.615690231323242, -17.661909103393555, -13.708127975463867, -9.754348754882812, -5.800567626953125, -1.8467864990234375, 2.106994152069092, 6.060774803161621, 10.014554977416992, 13.96833610534668, 17.922117233276367, 21.875896453857422, 25.82967758178711, 29.783458709716797, 33.737239837646484, 37.69102096557617, 41.644798278808594, 45.59857940673828, 49.55236053466797, 53.506141662597656, 57.459922790527344, 61.41370391845703, 65.36748504638672, 69.3212661743164, 73.2750473022461, 77.22882843017578, 81.18260955810547, 85.13638305664062, 89.09016418457031, 93.0439453125, 96.99772644042969, 100.95150756835938, 104.90528869628906, 108.85906982421875, 112.81285095214844, 116.76663208007812, 120.72041320800781, 124.6741943359375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 10.0, 9.0, 9.0, 12.0, 16.0, 27.0, 19.0, 23.0, 31.0, 32.0, 36.0, 31.0, 36.0, 44.0, 37.0, 55.0, 37.0, 40.0, 39.0, 44.0, 41.0, 29.0, 38.0, 40.0, 29.0, 32.0, 19.0, 20.0, 25.0, 22.0, 12.0, 18.0, 13.0, 17.0, 9.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.015625, -14.492431640625, -13.96923828125, -13.446044921875, -12.9228515625, -12.399658203125, -11.87646484375, -11.353271484375, -10.830078125, -10.306884765625, -9.78369140625, -9.260498046875, -8.7373046875, -8.214111328125, -7.69091796875, -7.167724609375, -6.64453125, -6.121337890625, -5.59814453125, -5.074951171875, -4.5517578125, -4.028564453125, -3.50537109375, -2.982177734375, -2.458984375, -1.935791015625, -1.41259765625, -0.889404296875, -0.3662109375, 0.156982421875, 0.68017578125, 1.203369140625, 1.7265625, 2.249755859375, 2.77294921875, 3.296142578125, 3.8193359375, 4.342529296875, 4.86572265625, 5.388916015625, 5.912109375, 6.435302734375, 6.95849609375, 7.481689453125, 8.0048828125, 8.528076171875, 9.05126953125, 9.574462890625, 10.09765625, 10.620849609375, 11.14404296875, 11.667236328125, 12.1904296875, 12.713623046875, 13.23681640625, 13.760009765625, 14.283203125, 14.806396484375, 15.32958984375, 15.852783203125, 16.3759765625, 16.899169921875, 17.42236328125, 17.945556640625, 18.46875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 11.0, 15.0, 32.0, 47.0, 64.0, 82.0, 132.0, 172.0, 278.0, 474.0, 667.0, 955.0, 1496.0, 2398.0, 3567.0, 5414.0, 8607.0, 13479.0, 22053.0, 36298.0, 62411.0, 114014.0, 314254.0, 224145.0, 96828.0, 54737.0, 32256.0, 19398.0, 12185.0, 7730.0, 5015.0, 3222.0, 2014.0, 1396.0, 940.0, 582.0, 352.0, 276.0, 210.0, 113.0, 81.0, 55.0, 24.0, 24.0, 14.0, 18.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -4.01715087890625, -3.8780517578125, -3.73895263671875, -3.599853515625, -3.46075439453125, -3.3216552734375, -3.18255615234375, -3.04345703125, -2.90435791015625, -2.7652587890625, -2.62615966796875, -2.487060546875, -2.34796142578125, -2.2088623046875, -2.06976318359375, -1.9306640625, -1.79156494140625, -1.6524658203125, -1.51336669921875, -1.374267578125, -1.23516845703125, -1.0960693359375, -0.95697021484375, -0.81787109375, -0.67877197265625, -0.5396728515625, -0.40057373046875, -0.261474609375, -0.12237548828125, 0.0167236328125, 0.15582275390625, 0.294921875, 0.43402099609375, 0.5731201171875, 0.71221923828125, 0.851318359375, 0.99041748046875, 1.1295166015625, 1.26861572265625, 1.40771484375, 1.54681396484375, 1.6859130859375, 1.82501220703125, 1.964111328125, 2.10321044921875, 2.2423095703125, 2.38140869140625, 2.5205078125, 2.65960693359375, 2.7987060546875, 2.93780517578125, 3.076904296875, 3.21600341796875, 3.3551025390625, 3.49420166015625, 3.63330078125, 3.77239990234375, 3.9114990234375, 4.05059814453125, 4.189697265625, 4.32879638671875, 4.4678955078125, 4.60699462890625, 4.74609375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 6.0, 15.0, 14.0, 16.0, 19.0, 22.0, 13.0, 30.0, 20.0, 23.0, 25.0, 30.0, 31.0, 35.0, 46.0, 30.0, 40.0, 23.0, 1074.0, 44.0, 31.0, 38.0, 38.0, 32.0, 37.0, 40.0, 29.0, 25.0, 22.0, 32.0, 18.0, 15.0, 15.0, 9.0, 13.0, 7.0, 11.0, 12.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.171875, -9.83984375, -9.5078125, -9.17578125, -8.84375, -8.51171875, -8.1796875, -7.84765625, -7.515625, -7.18359375, -6.8515625, -6.51953125, -6.1875, -5.85546875, -5.5234375, -5.19140625, -4.859375, -4.52734375, -4.1953125, -3.86328125, -3.53125, -3.19921875, -2.8671875, -2.53515625, -2.203125, -1.87109375, -1.5390625, -1.20703125, -0.875, -0.54296875, -0.2109375, 0.12109375, 0.453125, 0.78515625, 1.1171875, 1.44921875, 1.78125, 2.11328125, 2.4453125, 2.77734375, 3.109375, 3.44140625, 3.7734375, 4.10546875, 4.4375, 4.76953125, 5.1015625, 5.43359375, 5.765625, 6.09765625, 6.4296875, 6.76171875, 7.09375, 7.42578125, 7.7578125, 8.08984375, 8.421875, 8.75390625, 9.0859375, 9.41796875, 9.75, 10.08203125, 10.4140625, 10.74609375, 11.078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 5.0, 12.0, 8.0, 19.0, 26.0, 34.0, 50.0, 80.0, 112.0, 150.0, 218.0, 294.0, 396.0, 643.0, 962.0, 1406.0, 2051.0, 3039.0, 4744.0, 7168.0, 11281.0, 17361.0, 27209.0, 43004.0, 71200.0, 127564.0, 1366214.0, 173213.0, 91475.0, 53278.0, 33262.0, 21217.0, 13330.0, 8843.0, 5808.0, 3787.0, 2448.0, 1590.0, 1115.0, 766.0, 538.0, 376.0, 231.0, 193.0, 117.0, 92.0, 57.0, 48.0, 31.0, 17.0, 17.0, 14.0, 7.0, 8.0, 2.0, 1.0, 2.0, 3.0], "bins": [-4.34375, -4.21099853515625, -4.0782470703125, -3.94549560546875, -3.812744140625, -3.67999267578125, -3.5472412109375, -3.41448974609375, -3.28173828125, -3.14898681640625, -3.0162353515625, -2.88348388671875, -2.750732421875, -2.61798095703125, -2.4852294921875, -2.35247802734375, -2.2197265625, -2.08697509765625, -1.9542236328125, -1.82147216796875, -1.688720703125, -1.55596923828125, -1.4232177734375, -1.29046630859375, -1.15771484375, -1.02496337890625, -0.8922119140625, -0.75946044921875, -0.626708984375, -0.49395751953125, -0.3612060546875, -0.22845458984375, -0.095703125, 0.03704833984375, 0.1697998046875, 0.30255126953125, 0.435302734375, 0.56805419921875, 0.7008056640625, 0.83355712890625, 0.96630859375, 1.09906005859375, 1.2318115234375, 1.36456298828125, 1.497314453125, 1.63006591796875, 1.7628173828125, 1.89556884765625, 2.0283203125, 2.16107177734375, 2.2938232421875, 2.42657470703125, 2.559326171875, 2.69207763671875, 2.8248291015625, 2.95758056640625, 3.09033203125, 3.22308349609375, 3.3558349609375, 3.48858642578125, 3.621337890625, 3.75408935546875, 3.8868408203125, 4.01959228515625, 4.15234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 8.0, 15.0, 14.0, 12.0, 15.0, 30.0, 28.0, 35.0, 40.0, 59.0, 67.0, 82.0, 86.0, 105.0, 73.0, 62.0, 44.0, 45.0, 32.0, 32.0, 24.0, 17.0, 16.0, 14.0, 13.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0035800933837890625, -0.0034882426261901855, -0.0033963918685913086, -0.0033045411109924316, -0.0032126903533935547, -0.0031208395957946777, -0.0030289888381958008, -0.002937138080596924, -0.002845287322998047, -0.00275343656539917, -0.002661585807800293, -0.002569735050201416, -0.002477884292602539, -0.002386033535003662, -0.002294182777404785, -0.002202332019805908, -0.0021104812622070312, -0.0020186305046081543, -0.0019267797470092773, -0.0018349289894104004, -0.0017430782318115234, -0.0016512274742126465, -0.0015593767166137695, -0.0014675259590148926, -0.0013756752014160156, -0.0012838244438171387, -0.0011919736862182617, -0.0011001229286193848, -0.0010082721710205078, -0.0009164214134216309, -0.0008245706558227539, -0.000732719898223877, -0.000640869140625, -0.000549018383026123, -0.0004571676254272461, -0.00036531686782836914, -0.0002734661102294922, -0.00018161535263061523, -8.976459503173828e-05, 2.086162567138672e-06, 9.393692016601562e-05, 0.00018578767776489258, 0.00027763843536376953, 0.0003694891929626465, 0.00046133995056152344, 0.0005531907081604004, 0.0006450414657592773, 0.0007368922233581543, 0.0008287429809570312, 0.0009205937385559082, 0.0010124444961547852, 0.0011042952537536621, 0.001196146011352539, 0.001287996768951416, 0.001379847526550293, 0.00147169828414917, 0.0015635490417480469, 0.0016553997993469238, 0.0017472505569458008, 0.0018391013145446777, 0.0019309520721435547, 0.0020228028297424316, 0.0021146535873413086, 0.0022065043449401855, 0.0022983551025390625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 11.0, 15.0, 12.0, 30.0, 30.0, 40.0, 51.0, 77.0, 91.0, 139.0, 207.0, 406.0, 747.0, 3497.0, 1035536.0, 5629.0, 741.0, 387.0, 256.0, 187.0, 126.0, 71.0, 54.0, 47.0, 31.0, 28.0, 18.0, 19.0, 10.0, 8.0, 9.0, 4.0, 10.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.045623779296875, -0.04396772384643555, -0.042311668395996094, -0.04065561294555664, -0.03899955749511719, -0.037343502044677734, -0.03568744659423828, -0.03403139114379883, -0.032375335693359375, -0.030719280242919922, -0.02906322479248047, -0.027407169342041016, -0.025751113891601562, -0.02409505844116211, -0.022439002990722656, -0.020782947540283203, -0.01912689208984375, -0.017470836639404297, -0.015814781188964844, -0.01415872573852539, -0.012502670288085938, -0.010846614837646484, -0.009190559387207031, -0.007534503936767578, -0.005878448486328125, -0.004222393035888672, -0.0025663375854492188, -0.0009102821350097656, 0.0007457733154296875, 0.0024018287658691406, 0.004057884216308594, 0.005713939666748047, 0.0073699951171875, 0.009026050567626953, 0.010682106018066406, 0.01233816146850586, 0.013994216918945312, 0.015650272369384766, 0.01730632781982422, 0.018962383270263672, 0.020618438720703125, 0.022274494171142578, 0.02393054962158203, 0.025586605072021484, 0.027242660522460938, 0.02889871597290039, 0.030554771423339844, 0.0322108268737793, 0.03386688232421875, 0.0355229377746582, 0.037178993225097656, 0.03883504867553711, 0.04049110412597656, 0.042147159576416016, 0.04380321502685547, 0.04545927047729492, 0.047115325927734375, 0.04877138137817383, 0.05042743682861328, 0.052083492279052734, 0.05373954772949219, 0.05539560317993164, 0.057051658630371094, 0.05870771408081055, 0.06036376953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 9.0, 170.0, 670.0, 159.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00956297479569912, -0.009348027408123016, -0.009133080020546913, -0.00891813263297081, -0.008703185245394707, -0.008488238789141178, -0.008273291401565075, -0.008058344013988972, -0.007843396626412868, -0.007628449238836765, -0.007413501851260662, -0.007198554929345846, -0.006983607541769743, -0.00676866015419364, -0.006553713232278824, -0.006338765844702721, -0.006123818457126617, -0.005908871069550514, -0.005693923681974411, -0.005478976760059595, -0.005264029372483492, -0.005049081984907389, -0.004834135062992573, -0.00461918767541647, -0.004404240287840366, -0.004189292900264263, -0.00397434551268816, -0.003759398590773344, -0.003544451203197241, -0.0033295038156211376, -0.003114556660875678, -0.0028996095061302185, -0.0026846625842154026, -0.0024697151966392994, -0.00225476804189384, -0.0020398208871483803, -0.001824873499572277, -0.0016099262284114957, -0.0013949789572507143, -0.001180031686089933, -0.0009650844149291515, -0.0007501371437683702, -0.0005351898726075888, -0.0003202426014468074, -0.000105295330286026, 0.00010965194087475538, 0.00032459921203553677, 0.0005395464831963181, 0.0007544937543570995, 0.0009694410255178809, 0.0011843882966786623, 0.0013993355678394437, 0.001614282839000225, 0.0018292301101610065, 0.002044177381321788, 0.0022591245360672474, 0.0024740719236433506, 0.002689019311219454, 0.0029039664659649134, 0.003118913620710373, 0.003333861008286476, 0.0035488083958625793, 0.003763755550608039, 0.0039787027053534985, 0.004193650092929602]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 7.0, 8.0, 12.0, 12.0, 9.0, 18.0, 14.0, 13.0, 23.0, 17.0, 26.0, 21.0, 38.0, 31.0, 30.0, 46.0, 42.0, 35.0, 31.0, 37.0, 38.0, 42.0, 38.0, 57.0, 33.0, 37.0, 39.0, 34.0, 24.0, 17.0, 31.0, 17.0, 15.0, 15.0, 11.0, 16.0, 11.0, 10.0, 9.0, 10.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013030171394348145, -0.0012640319764614105, -0.0012250468134880066, -0.0011860616505146027, -0.0011470764875411987, -0.0011080913245677948, -0.0010691061615943909, -0.001030120998620987, -0.000991135835647583, -0.0009521506726741791, -0.0009131655097007751, -0.0008741803467273712, -0.0008351951837539673, -0.0007962100207805634, -0.0007572248578071594, -0.0007182396948337555, -0.0006792545318603516, -0.0006402693688869476, -0.0006012842059135437, -0.0005622990429401398, -0.0005233138799667358, -0.0004843287169933319, -0.000445343554019928, -0.00040635839104652405, -0.0003673732280731201, -0.0003283880650997162, -0.00028940290212631226, -0.0002504177391529083, -0.0002114325761795044, -0.00017244741320610046, -0.00013346225023269653, -9.44770872592926e-05, -5.549192428588867e-05, -1.650676131248474e-05, 2.247840166091919e-05, 6.146356463432312e-05, 0.00010044872760772705, 0.00013943389058113098, 0.0001784190535545349, 0.00021740421652793884, 0.0002563893795013428, 0.0002953745424747467, 0.00033435970544815063, 0.00037334486842155457, 0.0004123300313949585, 0.0004513151943683624, 0.0004903003573417664, 0.0005292855203151703, 0.0005682706832885742, 0.0006072558462619781, 0.0006462410092353821, 0.000685226172208786, 0.0007242113351821899, 0.0007631964981555939, 0.0008021816611289978, 0.0008411668241024017, 0.0008801519870758057, 0.0009191371500492096, 0.0009581223130226135, 0.0009971074759960175, 0.0010360926389694214, 0.0010750778019428253, 0.0011140629649162292, 0.0011530481278896332, 0.0011920332908630371]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 10.0, 9.0, 9.0, 12.0, 16.0, 27.0, 19.0, 23.0, 31.0, 32.0, 36.0, 31.0, 36.0, 44.0, 37.0, 55.0, 37.0, 40.0, 39.0, 44.0, 41.0, 29.0, 38.0, 40.0, 29.0, 32.0, 19.0, 20.0, 25.0, 22.0, 12.0, 18.0, 13.0, 17.0, 9.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.015625, -14.492431640625, -13.96923828125, -13.446044921875, -12.9228515625, -12.399658203125, -11.87646484375, -11.353271484375, -10.830078125, -10.306884765625, -9.78369140625, -9.260498046875, -8.7373046875, -8.214111328125, -7.69091796875, -7.167724609375, -6.64453125, -6.121337890625, -5.59814453125, -5.074951171875, -4.5517578125, -4.028564453125, -3.50537109375, -2.982177734375, -2.458984375, -1.935791015625, -1.41259765625, -0.889404296875, -0.3662109375, 0.156982421875, 0.68017578125, 1.203369140625, 1.7265625, 2.249755859375, 2.77294921875, 3.296142578125, 3.8193359375, 4.342529296875, 4.86572265625, 5.388916015625, 5.912109375, 6.435302734375, 6.95849609375, 7.481689453125, 8.0048828125, 8.528076171875, 9.05126953125, 9.574462890625, 10.09765625, 10.620849609375, 11.14404296875, 11.667236328125, 12.1904296875, 12.713623046875, 13.23681640625, 13.760009765625, 14.283203125, 14.806396484375, 15.32958984375, 15.852783203125, 16.3759765625, 16.899169921875, 17.42236328125, 17.945556640625, 18.46875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 3.0, 12.0, 11.0, 17.0, 22.0, 28.0, 41.0, 58.0, 77.0, 99.0, 132.0, 214.0, 328.0, 465.0, 684.0, 978.0, 1591.0, 2521.0, 5229.0, 20721.0, 249693.0, 691998.0, 55634.0, 8887.0, 3282.0, 1954.0, 1262.0, 844.0, 539.0, 374.0, 235.0, 186.0, 125.0, 95.0, 58.0, 42.0, 30.0, 21.0, 11.0, 18.0, 12.0, 2.0, 5.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0], "bins": [-47.3125, -45.93017578125, -44.5478515625, -43.16552734375, -41.783203125, -40.40087890625, -39.0185546875, -37.63623046875, -36.25390625, -34.87158203125, -33.4892578125, -32.10693359375, -30.724609375, -29.34228515625, -27.9599609375, -26.57763671875, -25.1953125, -23.81298828125, -22.4306640625, -21.04833984375, -19.666015625, -18.28369140625, -16.9013671875, -15.51904296875, -14.13671875, -12.75439453125, -11.3720703125, -9.98974609375, -8.607421875, -7.22509765625, -5.8427734375, -4.46044921875, -3.078125, -1.69580078125, -0.3134765625, 1.06884765625, 2.451171875, 3.83349609375, 5.2158203125, 6.59814453125, 7.98046875, 9.36279296875, 10.7451171875, 12.12744140625, 13.509765625, 14.89208984375, 16.2744140625, 17.65673828125, 19.0390625, 20.42138671875, 21.8037109375, 23.18603515625, 24.568359375, 25.95068359375, 27.3330078125, 28.71533203125, 30.09765625, 31.47998046875, 32.8623046875, 34.24462890625, 35.626953125, 37.00927734375, 38.3916015625, 39.77392578125, 41.15625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 5.0, 9.0, 10.0, 12.0, 13.0, 22.0, 33.0, 20.0, 47.0, 52.0, 66.0, 58.0, 91.0, 419.0, 1756.0, 82.0, 58.0, 50.0, 42.0, 48.0, 42.0, 26.0, 24.0, 18.0, 17.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0625, -71.75390625, -69.4453125, -67.13671875, -64.828125, -62.51953125, -60.2109375, -57.90234375, -55.59375, -53.28515625, -50.9765625, -48.66796875, -46.359375, -44.05078125, -41.7421875, -39.43359375, -37.125, -34.81640625, -32.5078125, -30.19921875, -27.890625, -25.58203125, -23.2734375, -20.96484375, -18.65625, -16.34765625, -14.0390625, -11.73046875, -9.421875, -7.11328125, -4.8046875, -2.49609375, -0.1875, 2.12109375, 4.4296875, 6.73828125, 9.046875, 11.35546875, 13.6640625, 15.97265625, 18.28125, 20.58984375, 22.8984375, 25.20703125, 27.515625, 29.82421875, 32.1328125, 34.44140625, 36.75, 39.05859375, 41.3671875, 43.67578125, 45.984375, 48.29296875, 50.6015625, 52.91015625, 55.21875, 57.52734375, 59.8359375, 62.14453125, 64.453125, 66.76171875, 69.0703125, 71.37890625, 73.6875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 12.0, 15.0, 20.0, 26.0, 40.0, 61.0, 90.0, 150.0, 214.0, 482.0, 2560.0, 3136547.0, 4147.0, 614.0, 278.0, 147.0, 83.0, 59.0, 52.0, 30.0, 18.0, 10.0, 13.0, 9.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-241.875, -234.451171875, -227.02734375, -219.603515625, -212.1796875, -204.755859375, -197.33203125, -189.908203125, -182.484375, -175.060546875, -167.63671875, -160.212890625, -152.7890625, -145.365234375, -137.94140625, -130.517578125, -123.09375, -115.669921875, -108.24609375, -100.822265625, -93.3984375, -85.974609375, -78.55078125, -71.126953125, -63.703125, -56.279296875, -48.85546875, -41.431640625, -34.0078125, -26.583984375, -19.16015625, -11.736328125, -4.3125, 3.111328125, 10.53515625, 17.958984375, 25.3828125, 32.806640625, 40.23046875, 47.654296875, 55.078125, 62.501953125, 69.92578125, 77.349609375, 84.7734375, 92.197265625, 99.62109375, 107.044921875, 114.46875, 121.892578125, 129.31640625, 136.740234375, 144.1640625, 151.587890625, 159.01171875, 166.435546875, 173.859375, 181.283203125, 188.70703125, 196.130859375, 203.5546875, 210.978515625, 218.40234375, 225.826171875, 233.25]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 12.0, 73.0, 348.0, 458.0, 103.0, 16.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-310.4275207519531, -302.28631591796875, -294.1451416015625, -286.0039367675781, -277.86273193359375, -269.7215270996094, -261.5803527832031, -253.43914794921875, -245.29794311523438, -237.15675354003906, -229.0155487060547, -220.87435913085938, -212.733154296875, -204.5919647216797, -196.45077514648438, -188.3095703125, -180.1683807373047, -172.02719116210938, -163.885986328125, -155.7447967529297, -147.6035919189453, -139.46240234375, -131.32119750976562, -123.18000793457031, -115.03881072998047, -106.89761352539062, -98.75641632080078, -90.61521911621094, -82.47402954101562, -74.33282470703125, -66.19163513183594, -58.050437927246094, -49.90922546386719, -41.768028259277344, -33.6268310546875, -25.485637664794922, -17.344440460205078, -9.203243255615234, -1.0620498657226562, 7.0791473388671875, 15.220344543457031, 23.361541748046875, 31.502737045288086, 39.6439323425293, 47.78512954711914, 55.926326751708984, 64.06752014160156, 72.2087173461914, 80.34991455078125, 88.4911117553711, 96.63230895996094, 104.77349853515625, 112.91470336914062, 121.05589294433594, 129.19708251953125, 137.33828735351562, 145.4794921875, 153.6206817626953, 161.7618865966797, 169.903076171875, 178.04428100585938, 186.1854705810547, 194.32666015625, 202.46786499023438, 210.6090545654297]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 10.0, 6.0, 11.0, 8.0, 15.0, 19.0, 10.0, 33.0, 26.0, 31.0, 32.0, 32.0, 58.0, 38.0, 53.0, 46.0, 49.0, 64.0, 50.0, 47.0, 37.0, 40.0, 35.0, 48.0, 28.0, 33.0, 24.0, 25.0, 15.0, 13.0, 13.0, 11.0, 7.0, 7.0, 1.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.732421875, -178.00909423828125, -172.2857666015625, -166.5624237060547, -160.83909606933594, -155.1157684326172, -149.39242553710938, -143.66909790039062, -137.94577026367188, -132.22244262695312, -126.49910736083984, -120.77577209472656, -115.05244445800781, -109.32911682128906, -103.60578155517578, -97.8824462890625, -92.15911865234375, -86.435791015625, -80.71245574951172, -74.98912048339844, -69.26579284667969, -63.54246139526367, -57.819129943847656, -52.09579849243164, -46.372467041015625, -40.64913558959961, -34.925804138183594, -29.202472686767578, -23.479141235351562, -17.755809783935547, -12.032478332519531, -6.309146881103516, -0.5858154296875, 5.137516021728516, 10.860847473144531, 16.584178924560547, 22.307510375976562, 28.030841827392578, 33.754173278808594, 39.47750473022461, 45.200836181640625, 50.92416763305664, 56.647499084472656, 62.37083053588867, 68.09416198730469, 73.81748962402344, 79.54082489013672, 85.26416015625, 90.98748779296875, 96.7108154296875, 102.43415069580078, 108.15748596191406, 113.88081359863281, 119.60414123535156, 125.32747650146484, 131.05081176757812, 136.77413940429688, 142.49746704101562, 148.22079467773438, 153.9441375732422, 159.66746520996094, 165.3907928466797, 171.1141357421875, 176.83746337890625, 182.560791015625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 12.0, 11.0, 12.0, 12.0, 20.0, 18.0, 26.0, 26.0, 37.0, 35.0, 35.0, 37.0, 43.0, 44.0, 41.0, 49.0, 35.0, 36.0, 34.0, 39.0, 39.0, 38.0, 45.0, 38.0, 36.0, 36.0, 25.0, 25.0, 18.0, 16.0, 8.0, 12.0, 14.0, 8.0, 11.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0625, -16.491943359375, -15.92138671875, -15.350830078125, -14.7802734375, -14.209716796875, -13.63916015625, -13.068603515625, -12.498046875, -11.927490234375, -11.35693359375, -10.786376953125, -10.2158203125, -9.645263671875, -9.07470703125, -8.504150390625, -7.93359375, -7.363037109375, -6.79248046875, -6.221923828125, -5.6513671875, -5.080810546875, -4.51025390625, -3.939697265625, -3.369140625, -2.798583984375, -2.22802734375, -1.657470703125, -1.0869140625, -0.516357421875, 0.05419921875, 0.624755859375, 1.1953125, 1.765869140625, 2.33642578125, 2.906982421875, 3.4775390625, 4.048095703125, 4.61865234375, 5.189208984375, 5.759765625, 6.330322265625, 6.90087890625, 7.471435546875, 8.0419921875, 8.612548828125, 9.18310546875, 9.753662109375, 10.32421875, 10.894775390625, 11.46533203125, 12.035888671875, 12.6064453125, 13.177001953125, 13.74755859375, 14.318115234375, 14.888671875, 15.459228515625, 16.02978515625, 16.600341796875, 17.1708984375, 17.741455078125, 18.31201171875, 18.882568359375, 19.453125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 9.0, 11.0, 7.0, 18.0, 23.0, 34.0, 43.0, 56.0, 82.0, 120.0, 173.0, 215.0, 341.0, 556.0, 863.0, 1592.0, 3026.0, 7011.0, 19091.0, 73102.0, 418454.0, 1755248.0, 1505954.0, 322875.0, 57151.0, 16250.0, 5869.0, 2597.0, 1302.0, 777.0, 428.0, 304.0, 214.0, 158.0, 94.0, 56.0, 57.0, 42.0, 32.0, 21.0, 8.0, 3.0, 7.0, 8.0, 3.0, 3.0], "bins": [-33.53125, -32.69140625, -31.8515625, -31.01171875, -30.171875, -29.33203125, -28.4921875, -27.65234375, -26.8125, -25.97265625, -25.1328125, -24.29296875, -23.453125, -22.61328125, -21.7734375, -20.93359375, -20.09375, -19.25390625, -18.4140625, -17.57421875, -16.734375, -15.89453125, -15.0546875, -14.21484375, -13.375, -12.53515625, -11.6953125, -10.85546875, -10.015625, -9.17578125, -8.3359375, -7.49609375, -6.65625, -5.81640625, -4.9765625, -4.13671875, -3.296875, -2.45703125, -1.6171875, -0.77734375, 0.0625, 0.90234375, 1.7421875, 2.58203125, 3.421875, 4.26171875, 5.1015625, 5.94140625, 6.78125, 7.62109375, 8.4609375, 9.30078125, 10.140625, 10.98046875, 11.8203125, 12.66015625, 13.5, 14.33984375, 15.1796875, 16.01953125, 16.859375, 17.69921875, 18.5390625, 19.37890625, 20.21875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 21.0, 27.0, 42.0, 75.0, 129.0, 161.0, 251.0, 324.0, 564.0, 703.0, 571.0, 379.0, 227.0, 184.0, 120.0, 80.0, 56.0, 31.0, 29.0, 23.0, 10.0, 9.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-49.4375, -48.12451171875, -46.8115234375, -45.49853515625, -44.185546875, -42.87255859375, -41.5595703125, -40.24658203125, -38.93359375, -37.62060546875, -36.3076171875, -34.99462890625, -33.681640625, -32.36865234375, -31.0556640625, -29.74267578125, -28.4296875, -27.11669921875, -25.8037109375, -24.49072265625, -23.177734375, -21.86474609375, -20.5517578125, -19.23876953125, -17.92578125, -16.61279296875, -15.2998046875, -13.98681640625, -12.673828125, -11.36083984375, -10.0478515625, -8.73486328125, -7.421875, -6.10888671875, -4.7958984375, -3.48291015625, -2.169921875, -0.85693359375, 0.4560546875, 1.76904296875, 3.08203125, 4.39501953125, 5.7080078125, 7.02099609375, 8.333984375, 9.64697265625, 10.9599609375, 12.27294921875, 13.5859375, 14.89892578125, 16.2119140625, 17.52490234375, 18.837890625, 20.15087890625, 21.4638671875, 22.77685546875, 24.08984375, 25.40283203125, 26.7158203125, 28.02880859375, 29.341796875, 30.65478515625, 31.9677734375, 33.28076171875, 34.59375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 8.0, 10.0, 12.0, 23.0, 21.0, 46.0, 77.0, 120.0, 208.0, 475.0, 1361.0, 12156.0, 4169807.0, 7856.0, 1156.0, 456.0, 187.0, 132.0, 48.0, 40.0, 25.0, 12.0, 16.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-147.875, -142.0625, -136.25, -130.4375, -124.625, -118.8125, -113.0, -107.1875, -101.375, -95.5625, -89.75, -83.9375, -78.125, -72.3125, -66.5, -60.6875, -54.875, -49.0625, -43.25, -37.4375, -31.625, -25.8125, -20.0, -14.1875, -8.375, -2.5625, 3.25, 9.0625, 14.875, 20.6875, 26.5, 32.3125, 38.125, 43.9375, 49.75, 55.5625, 61.375, 67.1875, 73.0, 78.8125, 84.625, 90.4375, 96.25, 102.0625, 107.875, 113.6875, 119.5, 125.3125, 131.125, 136.9375, 142.75, 148.5625, 154.375, 160.1875, 166.0, 171.8125, 177.625, 183.4375, 189.25, 195.0625, 200.875, 206.6875, 212.5, 218.3125, 224.125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 25.0, 891.0, 98.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1605.8795166015625, -1576.4716796875, -1547.0638427734375, -1517.656005859375, -1488.2481689453125, -1458.84033203125, -1429.4324951171875, -1400.024658203125, -1370.6168212890625, -1341.208984375, -1311.8011474609375, -1282.393310546875, -1252.9854736328125, -1223.57763671875, -1194.1697998046875, -1164.761962890625, -1135.3541259765625, -1105.9462890625, -1076.5384521484375, -1047.130615234375, -1017.7227783203125, -988.31494140625, -958.9071044921875, -929.499267578125, -900.0914916992188, -870.6836547851562, -841.2758178710938, -811.8679809570312, -782.4601440429688, -753.0523071289062, -723.6444702148438, -694.2366333007812, -664.828857421875, -635.4210205078125, -606.01318359375, -576.6053466796875, -547.197509765625, -517.7896728515625, -488.3818359375, -458.9739990234375, -429.566162109375, -400.1583251953125, -370.75048828125, -341.3426513671875, -311.934814453125, -282.5269775390625, -253.11915588378906, -223.71131896972656, -194.303466796875, -164.8956298828125, -135.48779296875, -106.07996368408203, -76.67212677001953, -47.26429748535156, -17.856460571289062, 11.551376342773438, 40.95921325683594, 70.36705017089844, 99.77488708496094, 129.18270874023438, 158.59054565429688, 187.99838256835938, 217.40621948242188, 246.81405639648438, 276.2218933105469]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 5.0, 5.0, 9.0, 10.0, 17.0, 17.0, 24.0, 20.0, 25.0, 23.0, 35.0, 32.0, 31.0, 34.0, 36.0, 31.0, 39.0, 45.0, 28.0, 38.0, 31.0, 31.0, 32.0, 27.0, 29.0, 37.0, 33.0, 37.0, 21.0, 28.0, 25.0, 24.0, 16.0, 14.0, 19.0, 16.0, 13.0, 9.0, 6.0, 10.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.27886962890625, -116.34530639648438, -112.4117431640625, -108.47817993164062, -104.54461669921875, -100.61105346679688, -96.677490234375, -92.74392700195312, -88.81036376953125, -84.87680053710938, -80.9432373046875, -77.00967407226562, -73.07611083984375, -69.14254760742188, -65.208984375, -61.27542495727539, -57.34186553955078, -53.408302307128906, -49.47473907470703, -45.541175842285156, -41.60761260986328, -37.674049377441406, -33.7404899597168, -29.806926727294922, -25.873363494873047, -21.939800262451172, -18.006237030029297, -14.072675704956055, -10.13911247253418, -6.205549240112305, -2.2719879150390625, 1.6615753173828125, 5.5951385498046875, 9.528701782226562, 13.462264060974121, 17.39582633972168, 21.329389572143555, 25.26295280456543, 29.196514129638672, 33.13007736206055, 37.06364059448242, 40.9972038269043, 44.93076705932617, 48.86432647705078, 52.797889709472656, 56.73145294189453, 60.665016174316406, 64.59857940673828, 68.53214263916016, 72.46570587158203, 76.3992691040039, 80.33283233642578, 84.26639556884766, 88.19995880126953, 92.13351440429688, 96.06707763671875, 100.00064086914062, 103.9342041015625, 107.86776733398438, 111.80133056640625, 115.73489379882812, 119.66845703125, 123.60202026367188, 127.53558349609375, 131.46914672851562]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 6.0, 10.0, 5.0, 18.0, 11.0, 20.0, 18.0, 21.0, 38.0, 31.0, 26.0, 43.0, 36.0, 33.0, 33.0, 36.0, 43.0, 40.0, 43.0, 46.0, 40.0, 38.0, 31.0, 26.0, 37.0, 25.0, 27.0, 28.0, 34.0, 19.0, 15.0, 17.0, 15.0, 12.0, 13.0, 11.0, 9.0, 6.0, 4.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.8515625, -14.4068603515625, -13.962158203125, -13.5174560546875, -13.07275390625, -12.6280517578125, -12.183349609375, -11.7386474609375, -11.2939453125, -10.8492431640625, -10.404541015625, -9.9598388671875, -9.51513671875, -9.0704345703125, -8.625732421875, -8.1810302734375, -7.736328125, -7.2916259765625, -6.846923828125, -6.4022216796875, -5.95751953125, -5.5128173828125, -5.068115234375, -4.6234130859375, -4.1787109375, -3.7340087890625, -3.289306640625, -2.8446044921875, -2.39990234375, -1.9552001953125, -1.510498046875, -1.0657958984375, -0.62109375, -0.1763916015625, 0.268310546875, 0.7130126953125, 1.15771484375, 1.6024169921875, 2.047119140625, 2.4918212890625, 2.9365234375, 3.3812255859375, 3.825927734375, 4.2706298828125, 4.71533203125, 5.1600341796875, 5.604736328125, 6.0494384765625, 6.494140625, 6.9388427734375, 7.383544921875, 7.8282470703125, 8.27294921875, 8.7176513671875, 9.162353515625, 9.6070556640625, 10.0517578125, 10.4964599609375, 10.941162109375, 11.3858642578125, 11.83056640625, 12.2752685546875, 12.719970703125, 13.1646728515625, 13.609375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 8.0, 10.0, 13.0, 18.0, 33.0, 36.0, 47.0, 78.0, 101.0, 157.0, 226.0, 302.0, 420.0, 613.0, 841.0, 1220.0, 1694.0, 2405.0, 3275.0, 5025.0, 7349.0, 10295.0, 15571.0, 23003.0, 34849.0, 53355.0, 84900.0, 161762.0, 308315.0, 122307.0, 71286.0, 45286.0, 30314.0, 19840.0, 13299.0, 9231.0, 6391.0, 4354.0, 3069.0, 2041.0, 1530.0, 1099.0, 736.0, 542.0, 403.0, 287.0, 206.0, 124.0, 97.0, 59.0, 44.0, 27.0, 29.0, 15.0, 11.0, 7.0, 8.0, 3.0, 1.0, 2.0], "bins": [-3.228515625, -3.128631591796875, -3.02874755859375, -2.928863525390625, -2.8289794921875, -2.729095458984375, -2.62921142578125, -2.529327392578125, -2.429443359375, -2.329559326171875, -2.22967529296875, -2.129791259765625, -2.0299072265625, -1.930023193359375, -1.83013916015625, -1.730255126953125, -1.63037109375, -1.530487060546875, -1.43060302734375, -1.330718994140625, -1.2308349609375, -1.130950927734375, -1.03106689453125, -0.931182861328125, -0.831298828125, -0.731414794921875, -0.63153076171875, -0.531646728515625, -0.4317626953125, -0.331878662109375, -0.23199462890625, -0.132110595703125, -0.0322265625, 0.067657470703125, 0.16754150390625, 0.267425537109375, 0.3673095703125, 0.467193603515625, 0.56707763671875, 0.666961669921875, 0.766845703125, 0.866729736328125, 0.96661376953125, 1.066497802734375, 1.1663818359375, 1.266265869140625, 1.36614990234375, 1.466033935546875, 1.56591796875, 1.665802001953125, 1.76568603515625, 1.865570068359375, 1.9654541015625, 2.065338134765625, 2.16522216796875, 2.265106201171875, 2.364990234375, 2.464874267578125, 2.56475830078125, 2.664642333984375, 2.7645263671875, 2.864410400390625, 2.96429443359375, 3.064178466796875, 3.1640625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 3.0, 9.0, 10.0, 12.0, 9.0, 16.0, 18.0, 21.0, 21.0, 25.0, 32.0, 24.0, 20.0, 35.0, 33.0, 33.0, 39.0, 40.0, 27.0, 38.0, 1053.0, 33.0, 32.0, 34.0, 52.0, 27.0, 35.0, 34.0, 38.0, 31.0, 23.0, 26.0, 22.0, 18.0, 19.0, 9.0, 11.0, 9.0, 9.0, 16.0, 8.0, 1.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.875, -8.601318359375, -8.32763671875, -8.053955078125, -7.7802734375, -7.506591796875, -7.23291015625, -6.959228515625, -6.685546875, -6.411865234375, -6.13818359375, -5.864501953125, -5.5908203125, -5.317138671875, -5.04345703125, -4.769775390625, -4.49609375, -4.222412109375, -3.94873046875, -3.675048828125, -3.4013671875, -3.127685546875, -2.85400390625, -2.580322265625, -2.306640625, -2.032958984375, -1.75927734375, -1.485595703125, -1.2119140625, -0.938232421875, -0.66455078125, -0.390869140625, -0.1171875, 0.156494140625, 0.43017578125, 0.703857421875, 0.9775390625, 1.251220703125, 1.52490234375, 1.798583984375, 2.072265625, 2.345947265625, 2.61962890625, 2.893310546875, 3.1669921875, 3.440673828125, 3.71435546875, 3.988037109375, 4.26171875, 4.535400390625, 4.80908203125, 5.082763671875, 5.3564453125, 5.630126953125, 5.90380859375, 6.177490234375, 6.451171875, 6.724853515625, 6.99853515625, 7.272216796875, 7.5458984375, 7.819580078125, 8.09326171875, 8.366943359375, 8.640625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 14.0, 16.0, 28.0, 31.0, 42.0, 68.0, 94.0, 135.0, 180.0, 267.0, 337.0, 518.0, 755.0, 1152.0, 1657.0, 2389.0, 3621.0, 5450.0, 8340.0, 12956.0, 20102.0, 31766.0, 49995.0, 82414.0, 147354.0, 1351098.0, 150492.0, 83946.0, 50885.0, 31980.0, 20404.0, 13184.0, 8457.0, 5601.0, 3751.0, 2339.0, 1643.0, 1118.0, 781.0, 483.0, 402.0, 236.0, 182.0, 150.0, 84.0, 63.0, 45.0, 41.0, 22.0, 19.0, 13.0, 8.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0], "bins": [-3.37890625, -3.271697998046875, -3.16448974609375, -3.057281494140625, -2.9500732421875, -2.842864990234375, -2.73565673828125, -2.628448486328125, -2.521240234375, -2.414031982421875, -2.30682373046875, -2.199615478515625, -2.0924072265625, -1.985198974609375, -1.87799072265625, -1.770782470703125, -1.66357421875, -1.556365966796875, -1.44915771484375, -1.341949462890625, -1.2347412109375, -1.127532958984375, -1.02032470703125, -0.913116455078125, -0.805908203125, -0.698699951171875, -0.59149169921875, -0.484283447265625, -0.3770751953125, -0.269866943359375, -0.16265869140625, -0.055450439453125, 0.0517578125, 0.158966064453125, 0.26617431640625, 0.373382568359375, 0.4805908203125, 0.587799072265625, 0.69500732421875, 0.802215576171875, 0.909423828125, 1.016632080078125, 1.12384033203125, 1.231048583984375, 1.3382568359375, 1.445465087890625, 1.55267333984375, 1.659881591796875, 1.76708984375, 1.874298095703125, 1.98150634765625, 2.088714599609375, 2.1959228515625, 2.303131103515625, 2.41033935546875, 2.517547607421875, 2.624755859375, 2.731964111328125, 2.83917236328125, 2.946380615234375, 3.0535888671875, 3.160797119140625, 3.26800537109375, 3.375213623046875, 3.482421875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 8.0, 6.0, 4.0, 7.0, 7.0, 15.0, 12.0, 18.0, 18.0, 17.0, 29.0, 34.0, 29.0, 37.0, 48.0, 66.0, 63.0, 66.0, 77.0, 65.0, 49.0, 51.0, 47.0, 46.0, 32.0, 28.0, 19.0, 18.0, 11.0, 15.0, 9.0, 7.0, 10.0, 10.0, 5.0, 5.0, 4.0, 4.0, 4.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021190643310546875, -0.002045661211013794, -0.0019722580909729004, -0.0018988549709320068, -0.0018254518508911133, -0.0017520487308502197, -0.0016786456108093262, -0.0016052424907684326, -0.001531839370727539, -0.0014584362506866455, -0.001385033130645752, -0.0013116300106048584, -0.0012382268905639648, -0.0011648237705230713, -0.0010914206504821777, -0.0010180175304412842, -0.0009446144104003906, -0.0008712112903594971, -0.0007978081703186035, -0.00072440505027771, -0.0006510019302368164, -0.0005775988101959229, -0.0005041956901550293, -0.00043079257011413574, -0.0003573894500732422, -0.00028398633003234863, -0.00021058320999145508, -0.00013718008995056152, -6.377696990966797e-05, 9.626150131225586e-06, 8.302927017211914e-05, 0.0001564323902130127, 0.00022983551025390625, 0.0003032386302947998, 0.00037664175033569336, 0.0004500448703765869, 0.0005234479904174805, 0.000596851110458374, 0.0006702542304992676, 0.0007436573505401611, 0.0008170604705810547, 0.0008904635906219482, 0.0009638667106628418, 0.0010372698307037354, 0.001110672950744629, 0.0011840760707855225, 0.001257479190826416, 0.0013308823108673096, 0.0014042854309082031, 0.0014776885509490967, 0.0015510916709899902, 0.0016244947910308838, 0.0016978979110717773, 0.001771301031112671, 0.0018447041511535645, 0.001918107271194458, 0.0019915103912353516, 0.002064913511276245, 0.0021383166313171387, 0.0022117197513580322, 0.0022851228713989258, 0.0023585259914398193, 0.002431929111480713, 0.0025053322315216064, 0.0025787353515625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 3.0, 6.0, 18.0, 18.0, 21.0, 28.0, 30.0, 41.0, 44.0, 72.0, 103.0, 144.0, 214.0, 299.0, 575.0, 1172.0, 972154.0, 71247.0, 1002.0, 434.0, 257.0, 206.0, 130.0, 82.0, 71.0, 50.0, 23.0, 31.0, 17.0, 13.0, 8.0, 10.0, 2.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06396484375, -0.062230587005615234, -0.06049633026123047, -0.0587620735168457, -0.05702781677246094, -0.05529356002807617, -0.053559303283691406, -0.05182504653930664, -0.050090789794921875, -0.04835653305053711, -0.046622276306152344, -0.04488801956176758, -0.04315376281738281, -0.04141950607299805, -0.03968524932861328, -0.037950992584228516, -0.03621673583984375, -0.034482479095458984, -0.03274822235107422, -0.031013965606689453, -0.029279708862304688, -0.027545452117919922, -0.025811195373535156, -0.02407693862915039, -0.022342681884765625, -0.02060842514038086, -0.018874168395996094, -0.017139911651611328, -0.015405654907226562, -0.013671398162841797, -0.011937141418457031, -0.010202884674072266, -0.0084686279296875, -0.006734371185302734, -0.005000114440917969, -0.003265857696533203, -0.0015316009521484375, 0.00020265579223632812, 0.0019369125366210938, 0.0036711692810058594, 0.005405426025390625, 0.007139682769775391, 0.008873939514160156, 0.010608196258544922, 0.012342453002929688, 0.014076709747314453, 0.01581096649169922, 0.017545223236083984, 0.01927947998046875, 0.021013736724853516, 0.02274799346923828, 0.024482250213623047, 0.026216506958007812, 0.027950763702392578, 0.029685020446777344, 0.03141927719116211, 0.033153533935546875, 0.03488779067993164, 0.036622047424316406, 0.03835630416870117, 0.04009056091308594, 0.0418248176574707, 0.04355907440185547, 0.045293331146240234, 0.047027587890625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 118.0, 727.0, 160.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005897290073335171, -0.005704463925212622, -0.005511637777090073, -0.005318811628967524, -0.0051259854808449745, -0.0049331593327224255, -0.004740333184599876, -0.004547507036477327, -0.004354680888354778, -0.004161854740232229, -0.00396902859210968, -0.003776202443987131, -0.003583376295864582, -0.003390550147742033, -0.003197723999619484, -0.003004897851496935, -0.002812071703374386, -0.0026192455552518368, -0.0024264194071292877, -0.0022335932590067387, -0.0020407671108841896, -0.0018479409627616405, -0.0016551148146390915, -0.0014622886665165424, -0.0012694625183939934, -0.0010766363702714443, -0.0008838102221488953, -0.0006909840740263462, -0.0004981579259037971, -0.0003053317777812481, -0.00011250562965869904, 8.032051846385002e-05, 0.0002731471322476864, 0.00046597328037023544, 0.0006587994284927845, 0.0008516255766153336, 0.0010444517247378826, 0.0012372778728604317, 0.0014301040209829807, 0.0016229301691055298, 0.0018157563172280788, 0.002008582465350628, 0.002201408613473177, 0.002394234761595726, 0.002587060909718275, 0.002779887057840824, 0.002972713205963373, 0.0031655393540859222, 0.0033583655022084713, 0.0035511916503310204, 0.0037440177984535694, 0.0039368439465761185, 0.0041296700946986675, 0.004322496242821217, 0.004515322390943766, 0.004708148539066315, 0.004900974687188864, 0.005093800835311413, 0.005286626983433962, 0.005479453131556511, 0.00567227927967906, 0.005865105427801609, 0.006057931575924158, 0.006250757724046707, 0.006443583872169256]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 0.0, 5.0, 8.0, 9.0, 13.0, 12.0, 18.0, 17.0, 24.0, 16.0, 15.0, 35.0, 18.0, 31.0, 31.0, 39.0, 27.0, 38.0, 32.0, 49.0, 36.0, 43.0, 29.0, 31.0, 35.0, 42.0, 37.0, 43.0, 28.0, 29.0, 22.0, 15.0, 24.0, 22.0, 18.0, 16.0, 14.0, 16.0, 18.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.001126408576965332, -0.0010908087715506554, -0.0010552089661359787, -0.001019609160721302, -0.0009840093553066254, -0.0009484095498919487, -0.000912809744477272, -0.0008772099390625954, -0.0008416101336479187, -0.000806010328233242, -0.0007704105228185654, -0.0007348107174038887, -0.000699210911989212, -0.0006636111065745354, -0.0006280113011598587, -0.000592411495745182, -0.0005568116903305054, -0.0005212118849158287, -0.00048561207950115204, -0.00045001227408647537, -0.0004144124686717987, -0.00037881266325712204, -0.0003432128578424454, -0.0003076130524277687, -0.00027201324701309204, -0.00023641344159841537, -0.0002008136361837387, -0.00016521383076906204, -0.00012961402535438538, -9.401421993970871e-05, -5.8414414525032043e-05, -2.2814609110355377e-05, 1.2785196304321289e-05, 4.8385001718997955e-05, 8.398480713367462e-05, 0.00011958461254835129, 0.00015518441796302795, 0.00019078422337770462, 0.0002263840287923813, 0.00026198383420705795, 0.0002975836396217346, 0.0003331834450364113, 0.00036878325045108795, 0.0004043830558657646, 0.0004399828612804413, 0.00047558266669511795, 0.0005111824721097946, 0.0005467822775244713, 0.000582382082939148, 0.0006179818883538246, 0.0006535816937685013, 0.000689181499183178, 0.0007247813045978546, 0.0007603811100125313, 0.000795980915427208, 0.0008315807208418846, 0.0008671805262565613, 0.0009027803316712379, 0.0009383801370859146, 0.0009739799425005913, 0.001009579747915268, 0.0010451795533299446, 0.0010807793587446213, 0.001116379164159298, 0.0011519789695739746]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 7.0, 9.0, 5.0, 18.0, 12.0, 20.0, 17.0, 21.0, 39.0, 30.0, 26.0, 43.0, 36.0, 33.0, 33.0, 36.0, 43.0, 42.0, 41.0, 47.0, 39.0, 38.0, 31.0, 27.0, 36.0, 25.0, 27.0, 28.0, 34.0, 19.0, 15.0, 17.0, 15.0, 12.0, 13.0, 10.0, 10.0, 6.0, 4.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-14.84375, -14.399169921875, -13.95458984375, -13.510009765625, -13.0654296875, -12.620849609375, -12.17626953125, -11.731689453125, -11.287109375, -10.842529296875, -10.39794921875, -9.953369140625, -9.5087890625, -9.064208984375, -8.61962890625, -8.175048828125, -7.73046875, -7.285888671875, -6.84130859375, -6.396728515625, -5.9521484375, -5.507568359375, -5.06298828125, -4.618408203125, -4.173828125, -3.729248046875, -3.28466796875, -2.840087890625, -2.3955078125, -1.950927734375, -1.50634765625, -1.061767578125, -0.6171875, -0.172607421875, 0.27197265625, 0.716552734375, 1.1611328125, 1.605712890625, 2.05029296875, 2.494873046875, 2.939453125, 3.384033203125, 3.82861328125, 4.273193359375, 4.7177734375, 5.162353515625, 5.60693359375, 6.051513671875, 6.49609375, 6.940673828125, 7.38525390625, 7.829833984375, 8.2744140625, 8.718994140625, 9.16357421875, 9.608154296875, 10.052734375, 10.497314453125, 10.94189453125, 11.386474609375, 11.8310546875, 12.275634765625, 12.72021484375, 13.164794921875, 13.609375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 11.0, 7.0, 12.0, 15.0, 18.0, 21.0, 20.0, 30.0, 57.0, 63.0, 105.0, 138.0, 184.0, 298.0, 475.0, 684.0, 1167.0, 2142.0, 4431.0, 11084.0, 34463.0, 164895.0, 650627.0, 129585.0, 29226.0, 9671.0, 4042.0, 1956.0, 1098.0, 647.0, 391.0, 269.0, 219.0, 146.0, 75.0, 60.0, 55.0, 29.0, 35.0, 23.0, 13.0, 19.0, 14.0, 5.0, 10.0, 4.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-29.828125, -28.93603515625, -28.0439453125, -27.15185546875, -26.259765625, -25.36767578125, -24.4755859375, -23.58349609375, -22.69140625, -21.79931640625, -20.9072265625, -20.01513671875, -19.123046875, -18.23095703125, -17.3388671875, -16.44677734375, -15.5546875, -14.66259765625, -13.7705078125, -12.87841796875, -11.986328125, -11.09423828125, -10.2021484375, -9.31005859375, -8.41796875, -7.52587890625, -6.6337890625, -5.74169921875, -4.849609375, -3.95751953125, -3.0654296875, -2.17333984375, -1.28125, -0.38916015625, 0.5029296875, 1.39501953125, 2.287109375, 3.17919921875, 4.0712890625, 4.96337890625, 5.85546875, 6.74755859375, 7.6396484375, 8.53173828125, 9.423828125, 10.31591796875, 11.2080078125, 12.10009765625, 12.9921875, 13.88427734375, 14.7763671875, 15.66845703125, 16.560546875, 17.45263671875, 18.3447265625, 19.23681640625, 20.12890625, 21.02099609375, 21.9130859375, 22.80517578125, 23.697265625, 24.58935546875, 25.4814453125, 26.37353515625, 27.265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 6.0, 7.0, 11.0, 9.0, 16.0, 12.0, 25.0, 18.0, 30.0, 29.0, 38.0, 54.0, 39.0, 55.0, 78.0, 160.0, 1752.0, 223.0, 79.0, 75.0, 51.0, 40.0, 45.0, 41.0, 18.0, 22.0, 15.0, 21.0, 15.0, 9.0, 8.0, 12.0, 3.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.59375, -41.203125, -39.8125, -38.421875, -37.03125, -35.640625, -34.25, -32.859375, -31.46875, -30.078125, -28.6875, -27.296875, -25.90625, -24.515625, -23.125, -21.734375, -20.34375, -18.953125, -17.5625, -16.171875, -14.78125, -13.390625, -12.0, -10.609375, -9.21875, -7.828125, -6.4375, -5.046875, -3.65625, -2.265625, -0.875, 0.515625, 1.90625, 3.296875, 4.6875, 6.078125, 7.46875, 8.859375, 10.25, 11.640625, 13.03125, 14.421875, 15.8125, 17.203125, 18.59375, 19.984375, 21.375, 22.765625, 24.15625, 25.546875, 26.9375, 28.328125, 29.71875, 31.109375, 32.5, 33.890625, 35.28125, 36.671875, 38.0625, 39.453125, 40.84375, 42.234375, 43.625, 45.015625, 46.40625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 13.0, 6.0, 13.0, 16.0, 15.0, 20.0, 28.0, 31.0, 52.0, 91.0, 120.0, 225.0, 445.0, 1062.0, 21853.0, 3117515.0, 2615.0, 677.0, 311.0, 191.0, 108.0, 64.0, 50.0, 38.0, 30.0, 10.0, 19.0, 13.0, 10.0, 10.0, 7.0, 4.0, 9.0, 4.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-136.875, -132.634765625, -128.39453125, -124.154296875, -119.9140625, -115.673828125, -111.43359375, -107.193359375, -102.953125, -98.712890625, -94.47265625, -90.232421875, -85.9921875, -81.751953125, -77.51171875, -73.271484375, -69.03125, -64.791015625, -60.55078125, -56.310546875, -52.0703125, -47.830078125, -43.58984375, -39.349609375, -35.109375, -30.869140625, -26.62890625, -22.388671875, -18.1484375, -13.908203125, -9.66796875, -5.427734375, -1.1875, 3.052734375, 7.29296875, 11.533203125, 15.7734375, 20.013671875, 24.25390625, 28.494140625, 32.734375, 36.974609375, 41.21484375, 45.455078125, 49.6953125, 53.935546875, 58.17578125, 62.416015625, 66.65625, 70.896484375, 75.13671875, 79.376953125, 83.6171875, 87.857421875, 92.09765625, 96.337890625, 100.578125, 104.818359375, 109.05859375, 113.298828125, 117.5390625, 121.779296875, 126.01953125, 130.259765625, 134.5]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 33.0, 931.0, 51.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-513.1840209960938, -498.74810791015625, -484.31219482421875, -469.8763122558594, -455.4403991699219, -441.0044860839844, -426.568603515625, -412.1326904296875, -397.69677734375, -383.2608642578125, -368.824951171875, -354.3890686035156, -339.9531555175781, -325.5172424316406, -311.08135986328125, -296.64544677734375, -282.20953369140625, -267.77362060546875, -253.3377227783203, -238.90182495117188, -224.46591186523438, -210.02999877929688, -195.59410095214844, -181.158203125, -166.7222900390625, -152.286376953125, -137.85047912597656, -123.4145736694336, -108.97866821289062, -94.54276275634766, -80.10685729980469, -65.67095184326172, -51.235015869140625, -36.799110412597656, -22.363204956054688, -7.927299499511719, 6.50860595703125, 20.94451141357422, 35.38041687011719, 49.816322326660156, 64.25222778320312, 78.6881332397461, 93.12403869628906, 107.55994415283203, 121.995849609375, 136.4317626953125, 150.86766052246094, 165.30355834960938, 179.73947143554688, 194.17538452148438, 208.6112823486328, 223.04718017578125, 237.48309326171875, 251.91900634765625, 266.35491943359375, 280.7908020019531, 295.2267150878906, 309.6626281738281, 324.0985107421875, 338.534423828125, 352.9703369140625, 367.40625, 381.8421630859375, 396.2780456542969, 410.7139587402344]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 5.0, 11.0, 12.0, 12.0, 12.0, 11.0, 15.0, 16.0, 24.0, 34.0, 26.0, 35.0, 33.0, 30.0, 37.0, 39.0, 35.0, 39.0, 33.0, 46.0, 57.0, 35.0, 41.0, 30.0, 27.0, 46.0, 28.0, 32.0, 21.0, 25.0, 34.0, 17.0, 19.0, 11.0, 9.0, 10.0, 6.0, 6.0, 10.0, 11.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-92.27191925048828, -89.3503646850586, -86.42880249023438, -83.50724792480469, -80.585693359375, -77.66413116455078, -74.7425765991211, -71.82101440429688, -68.89945983886719, -65.9779052734375, -63.05634689331055, -60.134788513183594, -57.21323013305664, -54.29167175292969, -51.3701171875, -48.44855880737305, -45.52700424194336, -42.605445861816406, -39.68389129638672, -36.762332916259766, -33.84077453613281, -30.919218063354492, -27.997661590576172, -25.07610321044922, -22.1545467376709, -19.232990264892578, -16.311431884765625, -13.389875411987305, -10.468317985534668, -7.546760559082031, -4.625204086303711, -1.7036457061767578, 1.2179107666015625, 4.139468193054199, 7.061025142669678, 9.982582092285156, 12.904139518737793, 15.82569694519043, 18.74725341796875, 21.668811798095703, 24.590368270874023, 27.511924743652344, 30.433483123779297, 33.35504150390625, 36.27659606933594, 39.19815444946289, 42.119712829589844, 45.04126739501953, 47.962825775146484, 50.88438415527344, 53.805938720703125, 56.72749710083008, 59.64905548095703, 62.57061004638672, 65.49217224121094, 68.41372680664062, 71.33528137207031, 74.2568359375, 77.17839813232422, 80.0999526977539, 83.0215072631836, 85.94306945800781, 88.8646240234375, 91.78617858886719, 94.7077407836914]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 4.0, 9.0, 4.0, 14.0, 15.0, 15.0, 12.0, 21.0, 13.0, 27.0, 23.0, 27.0, 24.0, 34.0, 36.0, 33.0, 43.0, 47.0, 29.0, 40.0, 34.0, 47.0, 36.0, 42.0, 38.0, 32.0, 30.0, 21.0, 27.0, 24.0, 24.0, 24.0, 16.0, 21.0, 13.0, 13.0, 10.0, 6.0, 15.0, 10.0, 3.0, 11.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.1484375, -14.6536865234375, -14.158935546875, -13.6641845703125, -13.16943359375, -12.6746826171875, -12.179931640625, -11.6851806640625, -11.1904296875, -10.6956787109375, -10.200927734375, -9.7061767578125, -9.21142578125, -8.7166748046875, -8.221923828125, -7.7271728515625, -7.232421875, -6.7376708984375, -6.242919921875, -5.7481689453125, -5.25341796875, -4.7586669921875, -4.263916015625, -3.7691650390625, -3.2744140625, -2.7796630859375, -2.284912109375, -1.7901611328125, -1.29541015625, -0.8006591796875, -0.305908203125, 0.1888427734375, 0.68359375, 1.1783447265625, 1.673095703125, 2.1678466796875, 2.66259765625, 3.1573486328125, 3.652099609375, 4.1468505859375, 4.6416015625, 5.1363525390625, 5.631103515625, 6.1258544921875, 6.62060546875, 7.1153564453125, 7.610107421875, 8.1048583984375, 8.599609375, 9.0943603515625, 9.589111328125, 10.0838623046875, 10.57861328125, 11.0733642578125, 11.568115234375, 12.0628662109375, 12.5576171875, 13.0523681640625, 13.547119140625, 14.0418701171875, 14.53662109375, 15.0313720703125, 15.526123046875, 16.0208740234375, 16.515625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 10.0, 10.0, 15.0, 15.0, 27.0, 39.0, 38.0, 40.0, 51.0, 45.0, 67.0, 93.0, 136.0, 177.0, 301.0, 468.0, 854.0, 2553.0, 41925.0, 4120564.0, 22268.0, 2279.0, 777.0, 450.0, 271.0, 191.0, 123.0, 93.0, 79.0, 66.0, 43.0, 37.0, 38.0, 26.0, 29.0, 19.0, 15.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-149.0, -144.41015625, -139.8203125, -135.23046875, -130.640625, -126.05078125, -121.4609375, -116.87109375, -112.28125, -107.69140625, -103.1015625, -98.51171875, -93.921875, -89.33203125, -84.7421875, -80.15234375, -75.5625, -70.97265625, -66.3828125, -61.79296875, -57.203125, -52.61328125, -48.0234375, -43.43359375, -38.84375, -34.25390625, -29.6640625, -25.07421875, -20.484375, -15.89453125, -11.3046875, -6.71484375, -2.125, 2.46484375, 7.0546875, 11.64453125, 16.234375, 20.82421875, 25.4140625, 30.00390625, 34.59375, 39.18359375, 43.7734375, 48.36328125, 52.953125, 57.54296875, 62.1328125, 66.72265625, 71.3125, 75.90234375, 80.4921875, 85.08203125, 89.671875, 94.26171875, 98.8515625, 103.44140625, 108.03125, 112.62109375, 117.2109375, 121.80078125, 126.390625, 130.98046875, 135.5703125, 140.16015625, 144.75]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 10.0, 17.0, 14.0, 32.0, 36.0, 101.0, 202.0, 430.0, 873.0, 1021.0, 665.0, 337.0, 145.0, 74.0, 42.0, 23.0, 9.0, 13.0, 6.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.1875, -45.72900390625, -44.2705078125, -42.81201171875, -41.353515625, -39.89501953125, -38.4365234375, -36.97802734375, -35.51953125, -34.06103515625, -32.6025390625, -31.14404296875, -29.685546875, -28.22705078125, -26.7685546875, -25.31005859375, -23.8515625, -22.39306640625, -20.9345703125, -19.47607421875, -18.017578125, -16.55908203125, -15.1005859375, -13.64208984375, -12.18359375, -10.72509765625, -9.2666015625, -7.80810546875, -6.349609375, -4.89111328125, -3.4326171875, -1.97412109375, -0.515625, 0.94287109375, 2.4013671875, 3.85986328125, 5.318359375, 6.77685546875, 8.2353515625, 9.69384765625, 11.15234375, 12.61083984375, 14.0693359375, 15.52783203125, 16.986328125, 18.44482421875, 19.9033203125, 21.36181640625, 22.8203125, 24.27880859375, 25.7373046875, 27.19580078125, 28.654296875, 30.11279296875, 31.5712890625, 33.02978515625, 34.48828125, 35.94677734375, 37.4052734375, 38.86376953125, 40.322265625, 41.78076171875, 43.2392578125, 44.69775390625, 46.15625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 8.0, 10.0, 17.0, 38.0, 64.0, 131.0, 310.0, 859.0, 3059.0, 31348.0, 3882538.0, 266717.0, 6812.0, 1491.0, 493.0, 191.0, 77.0, 42.0, 25.0, 11.0, 7.0, 11.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.125, -82.7421875, -80.359375, -77.9765625, -75.59375, -73.2109375, -70.828125, -68.4453125, -66.0625, -63.6796875, -61.296875, -58.9140625, -56.53125, -54.1484375, -51.765625, -49.3828125, -47.0, -44.6171875, -42.234375, -39.8515625, -37.46875, -35.0859375, -32.703125, -30.3203125, -27.9375, -25.5546875, -23.171875, -20.7890625, -18.40625, -16.0234375, -13.640625, -11.2578125, -8.875, -6.4921875, -4.109375, -1.7265625, 0.65625, 3.0390625, 5.421875, 7.8046875, 10.1875, 12.5703125, 14.953125, 17.3359375, 19.71875, 22.1015625, 24.484375, 26.8671875, 29.25, 31.6328125, 34.015625, 36.3984375, 38.78125, 41.1640625, 43.546875, 45.9296875, 48.3125, 50.6953125, 53.078125, 55.4609375, 57.84375, 60.2265625, 62.609375, 64.9921875, 67.375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 21.0, 28.0, 27.0, 43.0, 76.0, 101.0, 129.0, 135.0, 122.0, 97.0, 81.0, 50.0, 25.0, 17.0, 22.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.7713623046875, -149.88424682617188, -143.9971160888672, -138.11000061035156, -132.22286987304688, -126.33575439453125, -120.4486312866211, -114.56150817871094, -108.67438507080078, -102.78726196289062, -96.90013885498047, -91.01301574707031, -85.12590026855469, -79.23876953125, -73.35165405273438, -67.46453094482422, -61.57740783691406, -55.690284729003906, -49.80316162109375, -43.91604232788086, -38.0289192199707, -32.14179611206055, -26.254676818847656, -20.3675537109375, -14.480430603027344, -8.593308448791504, -2.706186294555664, 3.1809349060058594, 9.068058013916016, 14.955181121826172, 20.842300415039062, 26.72942352294922, 32.61653137207031, 38.50365447998047, 44.390777587890625, 50.277896881103516, 56.16501998901367, 62.05214309692383, 67.93926239013672, 73.82638549804688, 79.71350860595703, 85.60063171386719, 91.48775482177734, 97.3748779296875, 103.26199340820312, 109.14912414550781, 115.03623962402344, 120.9233627319336, 126.81048583984375, 132.69760131835938, 138.58473205566406, 144.4718475341797, 150.35897827148438, 156.24609375, 162.13320922851562, 168.0203399658203, 173.907470703125, 179.79458618164062, 185.6817169189453, 191.56883239746094, 197.45596313476562, 203.34307861328125, 209.23019409179688, 215.11732482910156, 221.0044403076172]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 4.0, 18.0, 20.0, 11.0, 10.0, 19.0, 27.0, 18.0, 19.0, 24.0, 39.0, 35.0, 32.0, 32.0, 49.0, 40.0, 38.0, 51.0, 40.0, 29.0, 32.0, 31.0, 36.0, 44.0, 30.0, 29.0, 35.0, 32.0, 17.0, 21.0, 22.0, 14.0, 16.0, 20.0, 13.0, 11.0, 6.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-86.59271240234375, -83.8228759765625, -81.05303955078125, -78.283203125, -75.51336669921875, -72.74353790283203, -69.97370147705078, -67.20386505126953, -64.43402862548828, -61.66419219970703, -58.89435577392578, -56.1245231628418, -53.35468673706055, -50.5848503112793, -47.81501770019531, -45.04518127441406, -42.27534484863281, -39.50550842285156, -36.73567199707031, -33.96583938598633, -31.196002960205078, -28.426166534423828, -25.65633201599121, -22.886497497558594, -20.116661071777344, -17.346824645996094, -14.576990127563477, -11.807154655456543, -9.03731918334961, -6.267483711242676, -3.497648239135742, -0.727813720703125, 2.042022705078125, 4.811858177185059, 7.581693649291992, 10.351529121398926, 13.12136459350586, 15.891200065612793, 18.661035537719727, 21.430870056152344, 24.200706481933594, 26.970542907714844, 29.74037742614746, 32.51021194458008, 35.28004837036133, 38.04988479614258, 40.81971740722656, 43.58955383300781, 46.35939025878906, 49.12922668457031, 51.89906311035156, 54.66889572143555, 57.4387321472168, 60.20856857299805, 62.97840118408203, 65.74823760986328, 68.51807403564453, 71.28791046142578, 74.05774688720703, 76.82758331298828, 79.597412109375, 82.36724853515625, 85.1370849609375, 87.90692138671875, 90.6767578125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 8.0, 9.0, 11.0, 8.0, 19.0, 13.0, 19.0, 26.0, 21.0, 24.0, 30.0, 33.0, 36.0, 36.0, 45.0, 37.0, 45.0, 58.0, 41.0, 45.0, 33.0, 50.0, 44.0, 39.0, 32.0, 30.0, 45.0, 23.0, 22.0, 21.0, 15.0, 18.0, 17.0, 9.0, 4.0, 8.0, 10.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.625, -128.123046875, -123.62109375, -119.119140625, -114.6171875, -110.115234375, -105.61328125, -101.111328125, -96.609375, -92.107421875, -87.60546875, -83.103515625, -78.6015625, -74.099609375, -69.59765625, -65.095703125, -60.59375, -56.091796875, -51.58984375, -47.087890625, -42.5859375, -38.083984375, -33.58203125, -29.080078125, -24.578125, -20.076171875, -15.57421875, -11.072265625, -6.5703125, -2.068359375, 2.43359375, 6.935546875, 11.4375, 15.939453125, 20.44140625, 24.943359375, 29.4453125, 33.947265625, 38.44921875, 42.951171875, 47.453125, 51.955078125, 56.45703125, 60.958984375, 65.4609375, 69.962890625, 74.46484375, 78.966796875, 83.46875, 87.970703125, 92.47265625, 96.974609375, 101.4765625, 105.978515625, 110.48046875, 114.982421875, 119.484375, 123.986328125, 128.48828125, 132.990234375, 137.4921875, 141.994140625, 146.49609375, 150.998046875, 155.5]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 13.0, 25.0, 19.0, 31.0, 59.0, 67.0, 94.0, 122.0, 210.0, 319.0, 447.0, 612.0, 924.0, 1369.0, 1937.0, 2927.0, 4206.0, 6289.0, 9120.0, 13829.0, 20455.0, 31553.0, 49144.0, 82658.0, 158575.0, 323950.0, 133924.0, 73798.0, 44878.0, 28977.0, 18738.0, 12743.0, 8460.0, 5715.0, 3867.0, 2711.0, 1799.0, 1221.0, 858.0, 579.0, 422.0, 276.0, 186.0, 140.0, 88.0, 68.0, 47.0, 30.0, 21.0, 13.0, 16.0, 13.0, 4.0, 2.0, 3.0, 2.0, 1.0], "bins": [-31.265625, -30.300537109375, -29.33544921875, -28.370361328125, -27.4052734375, -26.440185546875, -25.47509765625, -24.510009765625, -23.544921875, -22.579833984375, -21.61474609375, -20.649658203125, -19.6845703125, -18.719482421875, -17.75439453125, -16.789306640625, -15.82421875, -14.859130859375, -13.89404296875, -12.928955078125, -11.9638671875, -10.998779296875, -10.03369140625, -9.068603515625, -8.103515625, -7.138427734375, -6.17333984375, -5.208251953125, -4.2431640625, -3.278076171875, -2.31298828125, -1.347900390625, -0.3828125, 0.582275390625, 1.54736328125, 2.512451171875, 3.4775390625, 4.442626953125, 5.40771484375, 6.372802734375, 7.337890625, 8.302978515625, 9.26806640625, 10.233154296875, 11.1982421875, 12.163330078125, 13.12841796875, 14.093505859375, 15.05859375, 16.023681640625, 16.98876953125, 17.953857421875, 18.9189453125, 19.884033203125, 20.84912109375, 21.814208984375, 22.779296875, 23.744384765625, 24.70947265625, 25.674560546875, 26.6396484375, 27.604736328125, 28.56982421875, 29.534912109375, 30.5]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 10.0, 11.0, 13.0, 12.0, 18.0, 22.0, 19.0, 26.0, 33.0, 36.0, 38.0, 33.0, 32.0, 41.0, 42.0, 34.0, 46.0, 1050.0, 42.0, 39.0, 36.0, 48.0, 55.0, 29.0, 34.0, 30.0, 28.0, 22.0, 24.0, 13.0, 28.0, 13.0, 10.0, 10.0, 7.0, 7.0, 5.0, 3.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-82.25, -79.5556640625, -76.861328125, -74.1669921875, -71.47265625, -68.7783203125, -66.083984375, -63.3896484375, -60.6953125, -58.0009765625, -55.306640625, -52.6123046875, -49.91796875, -47.2236328125, -44.529296875, -41.8349609375, -39.140625, -36.4462890625, -33.751953125, -31.0576171875, -28.36328125, -25.6689453125, -22.974609375, -20.2802734375, -17.5859375, -14.8916015625, -12.197265625, -9.5029296875, -6.80859375, -4.1142578125, -1.419921875, 1.2744140625, 3.96875, 6.6630859375, 9.357421875, 12.0517578125, 14.74609375, 17.4404296875, 20.134765625, 22.8291015625, 25.5234375, 28.2177734375, 30.912109375, 33.6064453125, 36.30078125, 38.9951171875, 41.689453125, 44.3837890625, 47.078125, 49.7724609375, 52.466796875, 55.1611328125, 57.85546875, 60.5498046875, 63.244140625, 65.9384765625, 68.6328125, 71.3271484375, 74.021484375, 76.7158203125, 79.41015625, 82.1044921875, 84.798828125, 87.4931640625, 90.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 4.0, 17.0, 18.0, 23.0, 43.0, 54.0, 78.0, 96.0, 149.0, 204.0, 313.0, 457.0, 679.0, 998.0, 1544.0, 2292.0, 3681.0, 5792.0, 9310.0, 15121.0, 24815.0, 41925.0, 72307.0, 133682.0, 1368701.0, 185624.0, 94379.0, 52786.0, 31401.0, 18913.0, 11619.0, 7026.0, 4520.0, 2858.0, 1883.0, 1207.0, 834.0, 562.0, 364.0, 260.0, 170.0, 126.0, 81.0, 60.0, 47.0, 33.0, 18.0, 16.0, 10.0, 9.0, 6.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-35.375, -34.2939453125, -33.212890625, -32.1318359375, -31.05078125, -29.9697265625, -28.888671875, -27.8076171875, -26.7265625, -25.6455078125, -24.564453125, -23.4833984375, -22.40234375, -21.3212890625, -20.240234375, -19.1591796875, -18.078125, -16.9970703125, -15.916015625, -14.8349609375, -13.75390625, -12.6728515625, -11.591796875, -10.5107421875, -9.4296875, -8.3486328125, -7.267578125, -6.1865234375, -5.10546875, -4.0244140625, -2.943359375, -1.8623046875, -0.78125, 0.2998046875, 1.380859375, 2.4619140625, 3.54296875, 4.6240234375, 5.705078125, 6.7861328125, 7.8671875, 8.9482421875, 10.029296875, 11.1103515625, 12.19140625, 13.2724609375, 14.353515625, 15.4345703125, 16.515625, 17.5966796875, 18.677734375, 19.7587890625, 20.83984375, 21.9208984375, 23.001953125, 24.0830078125, 25.1640625, 26.2451171875, 27.326171875, 28.4072265625, 29.48828125, 30.5693359375, 31.650390625, 32.7314453125, 33.8125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 0.0, 1.0, 10.0, 9.0, 9.0, 9.0, 4.0, 16.0, 23.0, 29.0, 32.0, 39.0, 30.0, 51.0, 72.0, 75.0, 97.0, 84.0, 72.0, 61.0, 43.0, 36.0, 35.0, 26.0, 28.0, 25.0, 13.0, 19.0, 12.0, 13.0, 9.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.02593994140625, -0.025238037109375, -0.0245361328125, -0.023834228515625, -0.02313232421875, -0.022430419921875, -0.021728515625, -0.021026611328125, -0.02032470703125, -0.019622802734375, -0.0189208984375, -0.018218994140625, -0.01751708984375, -0.016815185546875, -0.01611328125, -0.015411376953125, -0.01470947265625, -0.014007568359375, -0.0133056640625, -0.012603759765625, -0.01190185546875, -0.011199951171875, -0.010498046875, -0.009796142578125, -0.00909423828125, -0.008392333984375, -0.0076904296875, -0.006988525390625, -0.00628662109375, -0.005584716796875, -0.0048828125, -0.004180908203125, -0.00347900390625, -0.002777099609375, -0.0020751953125, -0.001373291015625, -0.00067138671875, 3.0517578125e-05, 0.000732421875, 0.001434326171875, 0.00213623046875, 0.002838134765625, 0.0035400390625, 0.004241943359375, 0.00494384765625, 0.005645751953125, 0.00634765625, 0.007049560546875, 0.00775146484375, 0.008453369140625, 0.0091552734375, 0.009857177734375, 0.01055908203125, 0.011260986328125, 0.011962890625, 0.012664794921875, 0.01336669921875, 0.014068603515625, 0.0147705078125, 0.015472412109375, 0.01617431640625, 0.016876220703125, 0.017578125, 0.018280029296875, 0.01898193359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 5.0, 7.0, 7.0, 6.0, 14.0, 18.0, 24.0, 28.0, 39.0, 44.0, 57.0, 99.0, 152.0, 257.0, 481.0, 1223.0, 4731.0, 47368.0, 830884.0, 150323.0, 9476.0, 1762.0, 641.0, 299.0, 189.0, 106.0, 81.0, 56.0, 35.0, 29.0, 16.0, 22.0, 20.0, 18.0, 6.0, 4.0, 10.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2958984375, -0.2871131896972656, -0.27832794189453125, -0.2695426940917969, -0.2607574462890625, -0.2519721984863281, -0.24318695068359375, -0.23440170288085938, -0.225616455078125, -0.21683120727539062, -0.20804595947265625, -0.19926071166992188, -0.1904754638671875, -0.18169021606445312, -0.17290496826171875, -0.16411972045898438, -0.15533447265625, -0.14654922485351562, -0.13776397705078125, -0.12897872924804688, -0.1201934814453125, -0.11140823364257812, -0.10262298583984375, -0.09383773803710938, -0.085052490234375, -0.07626724243164062, -0.06748199462890625, -0.058696746826171875, -0.0499114990234375, -0.041126251220703125, -0.03234100341796875, -0.023555755615234375, -0.0147705078125, -0.005985260009765625, 0.00279998779296875, 0.011585235595703125, 0.0203704833984375, 0.029155731201171875, 0.03794097900390625, 0.046726226806640625, 0.055511474609375, 0.06429672241210938, 0.07308197021484375, 0.08186721801757812, 0.0906524658203125, 0.09943771362304688, 0.10822296142578125, 0.11700820922851562, 0.12579345703125, 0.13457870483398438, 0.14336395263671875, 0.15214920043945312, 0.1609344482421875, 0.16971969604492188, 0.17850494384765625, 0.18729019165039062, 0.196075439453125, 0.20486068725585938, 0.21364593505859375, 0.22243118286132812, 0.2312164306640625, 0.24000167846679688, 0.24878692626953125, 0.2575721740722656, 0.266357421875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 11.0, 23.0, 34.0, 98.0, 206.0, 259.0, 185.0, 111.0, 44.0, 20.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.052733127027750015, -0.05140402913093567, -0.05007493495941162, -0.048745837062597275, -0.04741674289107323, -0.04608764499425888, -0.04475855082273483, -0.043429452925920486, -0.04210035502910614, -0.040771257132291794, -0.039442162960767746, -0.0381130650639534, -0.03678397089242935, -0.035454872995615005, -0.03412577509880066, -0.03279668092727661, -0.031467586755752563, -0.030138490721583366, -0.02880939468741417, -0.027480296790599823, -0.026151202619075775, -0.02482210472226143, -0.023493008688092232, -0.022163912653923035, -0.020834816619753838, -0.01950572058558464, -0.018176624551415443, -0.016847528517246246, -0.015518431551754475, -0.014189335517585278, -0.012860238552093506, -0.011531142517924309, -0.010202042758464813, -0.008872946724295616, -0.007543850224465132, -0.006214753724634647, -0.00488565769046545, -0.003556561656296253, -0.0022274646908044815, -0.0008983686566352844, 0.00043072737753391266, 0.0017598236445337534, 0.003088919911533594, 0.0044180164113640785, 0.005747112445533276, 0.007076208479702473, 0.008405305445194244, 0.009734401479363441, 0.011063497513532639, 0.012392593547701836, 0.013721689581871033, 0.015050786547362804, 0.016379881650209427, 0.017708979547023773, 0.01903807558119297, 0.020367171615362167, 0.021696267649531364, 0.02302536368370056, 0.02435445971786976, 0.025683555752038956, 0.027012653648853302, 0.02834174782037735, 0.029670845717191696, 0.030999941751360893, 0.03232903778553009]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 0.0, 8.0, 6.0, 6.0, 7.0, 18.0, 18.0, 15.0, 23.0, 23.0, 21.0, 22.0, 24.0, 23.0, 32.0, 26.0, 36.0, 27.0, 28.0, 39.0, 38.0, 45.0, 50.0, 37.0, 35.0, 40.0, 31.0, 39.0, 25.0, 39.0, 36.0, 23.0, 27.0, 24.0, 18.0, 19.0, 23.0, 9.0, 5.0, 4.0, 8.0, 9.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00970923900604248, -0.009384767152369022, -0.009060295298695564, -0.008735823445022106, -0.008411351591348648, -0.00808687973767519, -0.007762407884001732, -0.007437936030328274, -0.007113464176654816, -0.006788992322981358, -0.0064645204693078995, -0.006140048615634441, -0.005815576761960983, -0.005491104908287525, -0.005166633054614067, -0.004842161200940609, -0.004517689347267151, -0.004193217493593693, -0.0038687456399202347, -0.0035442737862467766, -0.0032198019325733185, -0.0028953300788998604, -0.0025708582252264023, -0.002246386371552944, -0.001921914517879486, -0.001597442664206028, -0.0012729708105325699, -0.0009484989568591118, -0.0006240271031856537, -0.0002995552495121956, 2.4916604161262512e-05, 0.0003493884578347206, 0.0006738603115081787, 0.0009983321651816368, 0.001322804018855095, 0.001647275872528553, 0.001971747726202011, 0.002296219579875469, 0.0026206914335489273, 0.0029451632872223854, 0.0032696351408958435, 0.0035941069945693016, 0.00391857884824276, 0.004243050701916218, 0.004567522555589676, 0.004891994409263134, 0.005216466262936592, 0.00554093811661005, 0.005865409970283508, 0.006189881823956966, 0.0065143536776304245, 0.006838825531303883, 0.007163297384977341, 0.007487769238650799, 0.007812241092324257, 0.008136712945997715, 0.008461184799671173, 0.008785656653344631, 0.00911012850701809, 0.009434600360691547, 0.009759072214365005, 0.010083544068038464, 0.010408015921711922, 0.01073248777538538, 0.011056959629058838]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 3.0, 8.0, 10.0, 10.0, 9.0, 19.0, 13.0, 19.0, 26.0, 21.0, 24.0, 30.0, 32.0, 34.0, 39.0, 43.0, 39.0, 45.0, 58.0, 40.0, 45.0, 34.0, 50.0, 44.0, 38.0, 33.0, 28.0, 46.0, 24.0, 22.0, 19.0, 16.0, 19.0, 17.0, 9.0, 4.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.75, -128.248046875, -123.74609375, -119.244140625, -114.7421875, -110.240234375, -105.73828125, -101.236328125, -96.734375, -92.232421875, -87.73046875, -83.228515625, -78.7265625, -74.224609375, -69.72265625, -65.220703125, -60.71875, -56.216796875, -51.71484375, -47.212890625, -42.7109375, -38.208984375, -33.70703125, -29.205078125, -24.703125, -20.201171875, -15.69921875, -11.197265625, -6.6953125, -2.193359375, 2.30859375, 6.810546875, 11.3125, 15.814453125, 20.31640625, 24.818359375, 29.3203125, 33.822265625, 38.32421875, 42.826171875, 47.328125, 51.830078125, 56.33203125, 60.833984375, 65.3359375, 69.837890625, 74.33984375, 78.841796875, 83.34375, 87.845703125, 92.34765625, 96.849609375, 101.3515625, 105.853515625, 110.35546875, 114.857421875, 119.359375, 123.861328125, 128.36328125, 132.865234375, 137.3671875, 141.869140625, 146.37109375, 150.873046875, 155.375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 1.0, 7.0, 11.0, 11.0, 8.0, 15.0, 23.0, 27.0, 40.0, 67.0, 73.0, 125.0, 169.0, 253.0, 402.0, 701.0, 1192.0, 2179.0, 4159.0, 9538.0, 28349.0, 136557.0, 628090.0, 181092.0, 34477.0, 10695.0, 4561.0, 2355.0, 1288.0, 714.0, 449.0, 273.0, 204.0, 136.0, 79.0, 64.0, 44.0, 37.0, 27.0, 16.0, 14.0, 10.0, 5.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-40.34375, -39.06591796875, -37.7880859375, -36.51025390625, -35.232421875, -33.95458984375, -32.6767578125, -31.39892578125, -30.12109375, -28.84326171875, -27.5654296875, -26.28759765625, -25.009765625, -23.73193359375, -22.4541015625, -21.17626953125, -19.8984375, -18.62060546875, -17.3427734375, -16.06494140625, -14.787109375, -13.50927734375, -12.2314453125, -10.95361328125, -9.67578125, -8.39794921875, -7.1201171875, -5.84228515625, -4.564453125, -3.28662109375, -2.0087890625, -0.73095703125, 0.546875, 1.82470703125, 3.1025390625, 4.38037109375, 5.658203125, 6.93603515625, 8.2138671875, 9.49169921875, 10.76953125, 12.04736328125, 13.3251953125, 14.60302734375, 15.880859375, 17.15869140625, 18.4365234375, 19.71435546875, 20.9921875, 22.27001953125, 23.5478515625, 24.82568359375, 26.103515625, 27.38134765625, 28.6591796875, 29.93701171875, 31.21484375, 32.49267578125, 33.7705078125, 35.04833984375, 36.326171875, 37.60400390625, 38.8818359375, 40.15966796875, 41.4375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 9.0, 7.0, 8.0, 13.0, 12.0, 20.0, 35.0, 53.0, 52.0, 86.0, 82.0, 92.0, 2124.0, 83.0, 77.0, 86.0, 54.0, 49.0, 36.0, 15.0, 21.0, 13.0, 12.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-461.0, -449.31640625, -437.6328125, -425.94921875, -414.265625, -402.58203125, -390.8984375, -379.21484375, -367.53125, -355.84765625, -344.1640625, -332.48046875, -320.796875, -309.11328125, -297.4296875, -285.74609375, -274.0625, -262.37890625, -250.6953125, -239.01171875, -227.328125, -215.64453125, -203.9609375, -192.27734375, -180.59375, -168.91015625, -157.2265625, -145.54296875, -133.859375, -122.17578125, -110.4921875, -98.80859375, -87.125, -75.44140625, -63.7578125, -52.07421875, -40.390625, -28.70703125, -17.0234375, -5.33984375, 6.34375, 18.02734375, 29.7109375, 41.39453125, 53.078125, 64.76171875, 76.4453125, 88.12890625, 99.8125, 111.49609375, 123.1796875, 134.86328125, 146.546875, 158.23046875, 169.9140625, 181.59765625, 193.28125, 204.96484375, 216.6484375, 228.33203125, 240.015625, 251.69921875, 263.3828125, 275.06640625, 286.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 4.0, 19.0, 30.0, 64.0, 90.0, 178.0, 437.0, 1087.0, 4807.0, 425224.0, 2706102.0, 5670.0, 1118.0, 447.0, 202.0, 87.0, 56.0, 40.0, 11.0, 11.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-145.375, -141.103515625, -136.83203125, -132.560546875, -128.2890625, -124.017578125, -119.74609375, -115.474609375, -111.203125, -106.931640625, -102.66015625, -98.388671875, -94.1171875, -89.845703125, -85.57421875, -81.302734375, -77.03125, -72.759765625, -68.48828125, -64.216796875, -59.9453125, -55.673828125, -51.40234375, -47.130859375, -42.859375, -38.587890625, -34.31640625, -30.044921875, -25.7734375, -21.501953125, -17.23046875, -12.958984375, -8.6875, -4.416015625, -0.14453125, 4.126953125, 8.3984375, 12.669921875, 16.94140625, 21.212890625, 25.484375, 29.755859375, 34.02734375, 38.298828125, 42.5703125, 46.841796875, 51.11328125, 55.384765625, 59.65625, 63.927734375, 68.19921875, 72.470703125, 76.7421875, 81.013671875, 85.28515625, 89.556640625, 93.828125, 98.099609375, 102.37109375, 106.642578125, 110.9140625, 115.185546875, 119.45703125, 123.728515625, 128.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 20.0, 23.0, 63.0, 107.0, 238.0, 234.0, 138.0, 93.0, 29.0, 21.0, 8.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.71250915527344, -237.0719757080078, -221.43145751953125, -205.79092407226562, -190.150390625, -174.50985717773438, -158.86932373046875, -143.2288055419922, -127.58827209472656, -111.94773864746094, -96.30721282958984, -80.66668701171875, -65.02615356445312, -49.3856201171875, -33.745094299316406, -18.104568481445312, -2.4640350341796875, 13.176494598388672, 28.81702423095703, 44.45755386352539, 60.09808349609375, 75.73861694335938, 91.37914276123047, 107.01966857910156, 122.66020202636719, 138.3007354736328, 153.94125366210938, 169.581787109375, 185.22232055664062, 200.86285400390625, 216.50338745117188, 232.14390563964844, 247.784423828125, 263.4249572753906, 279.06549072265625, 294.7060241699219, 310.3465576171875, 325.987060546875, 341.6275939941406, 357.26812744140625, 372.9086608886719, 388.5491943359375, 404.1897277832031, 419.83026123046875, 435.47076416015625, 451.111328125, 466.7518310546875, 482.3923645019531, 498.03289794921875, 513.6734008789062, 529.31396484375, 544.9544677734375, 560.5950317382812, 576.2355346679688, 591.8760986328125, 607.5166015625, 623.1571044921875, 638.797607421875, 654.4381713867188, 670.0786743164062, 685.71923828125, 701.3597412109375, 717.0003051757812, 732.6408081054688, 748.2813720703125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 6.0, 5.0, 7.0, 14.0, 10.0, 11.0, 14.0, 18.0, 22.0, 25.0, 31.0, 31.0, 39.0, 37.0, 42.0, 51.0, 50.0, 49.0, 51.0, 55.0, 40.0, 44.0, 51.0, 39.0, 26.0, 29.0, 31.0, 36.0, 20.0, 16.0, 22.0, 22.0, 11.0, 12.0, 4.0, 1.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-337.32763671875, -327.73046875, -318.1333312988281, -308.5361633300781, -298.9389953613281, -289.34185791015625, -279.74468994140625, -270.14752197265625, -260.55035400390625, -250.9532012939453, -241.3560333251953, -231.75888061523438, -222.16171264648438, -212.56455993652344, -202.9674072265625, -193.3702392578125, -183.77310180664062, -174.1759490966797, -164.5787811279297, -154.98162841796875, -145.38446044921875, -135.7873077392578, -126.19015502929688, -116.5929946899414, -106.99583435058594, -97.39867401123047, -87.801513671875, -78.20436096191406, -68.6072006225586, -59.010040283203125, -49.41288375854492, -39.81572723388672, -30.218536376953125, -20.62137794494629, -11.024219512939453, -1.4270610809326172, 8.170097351074219, 17.767257690429688, 27.36441421508789, 36.961570739746094, 46.55873107910156, 56.15589141845703, 65.7530517578125, 75.35020446777344, 84.9473648071289, 94.54452514648438, 104.14167785644531, 113.73883819580078, 123.33599853515625, 132.9331512451172, 142.5303192138672, 152.12747192382812, 161.72463989257812, 171.32179260253906, 180.9189453125, 190.51611328125, 200.11326599121094, 209.71041870117188, 219.30758666992188, 228.9047393798828, 238.50189208984375, 248.09906005859375, 257.69622802734375, 267.2933654785156, 276.8905334472656]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 3.0, 6.0, 4.0, 14.0, 12.0, 26.0, 32.0, 43.0, 50.0, 79.0, 97.0, 121.0, 192.0, 263.0, 366.0, 559.0, 743.0, 1275.0, 1041330.0, 989.0, 644.0, 471.0, 327.0, 247.0, 162.0, 127.0, 108.0, 61.0, 43.0, 38.0, 17.0, 16.0, 21.0, 14.0, 9.0, 16.0, 2.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-125.7390365600586, -122.27841186523438, -118.81777954101562, -115.3571548461914, -111.89653015136719, -108.43589782714844, -104.97527313232422, -101.5146484375, -98.05401611328125, -94.59339141845703, -91.13275909423828, -87.67213439941406, -84.21150970458984, -80.75088500976562, -77.29025268554688, -73.82962799072266, -70.36900329589844, -66.90837860107422, -63.447750091552734, -59.98712158203125, -56.52649688720703, -53.06586837768555, -49.60523986816406, -46.144615173339844, -42.68398666381836, -39.223358154296875, -35.762733459472656, -32.30210494995117, -28.84147834777832, -25.38085174560547, -21.920223236083984, -18.459596633911133, -14.998970031738281, -11.53834342956543, -8.077715873718262, -4.617088317871094, -1.1564617156982422, 2.3041648864746094, 5.764793395996094, 9.225419998168945, 12.686046600341797, 16.14667320251465, 19.6072998046875, 23.067928314208984, 26.528554916381836, 29.989181518554688, 33.44981002807617, 36.910438537597656, 40.371063232421875, 43.83169174194336, 47.29231643676758, 50.75294494628906, 54.21356964111328, 57.674198150634766, 61.13482666015625, 64.59545135498047, 68.05607604980469, 71.5167007446289, 74.97733306884766, 78.43795776367188, 81.8985824584961, 85.35920715332031, 88.81983947753906, 92.28046417236328, 95.74109649658203]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 9.0, 9.0, 5.0, 8.0, 4.0, 13.0, 13.0, 15.0, 24.0, 50.0, 227.0, 51462156.0, 430.0, 70.0, 26.0, 15.0, 17.0, 8.0, 7.0, 5.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13485.986328125, -12866.3193359375, -12246.6513671875, -11626.984375, -11007.31640625, -10387.6494140625, -9767.982421875, -9148.314453125, -8528.646484375, -7908.97900390625, -7289.3115234375, -6669.64453125, -6049.9765625, -5430.3095703125, -4810.64208984375, -4190.974609375, -3571.3076171875, -2951.64013671875, -2331.97265625, -1712.305419921875, -1092.637939453125, -472.970458984375, 146.69677734375, 766.3642578125, 1386.03173828125, 2005.69921875, 2625.36669921875, 3245.033935546875, 3864.701416015625, 4484.369140625, 5104.0361328125, 5723.70361328125, 6343.37109375, 6963.03857421875, 7582.7060546875, 8202.373046875, 8822.041015625, 9441.7080078125, 10061.375, 10681.04296875, 11300.7109375, 11920.3779296875, 12540.0458984375, 13159.712890625, 13779.380859375, 14399.0478515625, 15018.71484375, 15638.3828125, 16258.0498046875, 16877.716796875, 17497.384765625, 18117.052734375, 18736.71875, 19356.38671875, 19976.0546875, 20595.72265625, 21215.388671875, 21835.056640625, 22454.72265625, 23074.390625, 23694.05859375, 24313.7265625, 24933.392578125, 25553.060546875, 26172.728515625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 16.0, 40.0, 47.0, 69.0, 106.0, 137.0, 252.0, 364.0, 475.0, 701.0, 1090.0, 1565.0, 2250.0, 3257.0, 4673.0, 6849.0, 9702.0, 14014.0, 20077.0, 28282.0, 40835.0, 59264.0, 88928.0, 133632.0, 218055.0, 436426.0, 3647388.0, 794100.0, 281460.0, 165256.0, 105698.0, 69818.0, 47786.0, 33016.0, 23160.0, 15765.0, 11427.0, 7702.0, 5441.0, 3850.0, 2689.0, 1793.0, 1298.0, 932.0, 581.0, 402.0, 276.0, 187.0, 106.0, 61.0, 51.0, 35.0, 19.0, 18.0, 10.0, 4.0, 4.0, 3.0], "bins": [-12.9453125, -12.5496826171875, -12.154052734375, -11.7584228515625, -11.36279296875, -10.9671630859375, -10.571533203125, -10.1759033203125, -9.7802734375, -9.3846435546875, -8.989013671875, -8.5933837890625, -8.19775390625, -7.8021240234375, -7.406494140625, -7.0108642578125, -6.615234375, -6.2196044921875, -5.823974609375, -5.4283447265625, -5.03271484375, -4.6370849609375, -4.241455078125, -3.8458251953125, -3.4501953125, -3.0545654296875, -2.658935546875, -2.2633056640625, -1.86767578125, -1.4720458984375, -1.076416015625, -0.6807861328125, -0.28515625, 0.1104736328125, 0.506103515625, 0.9017333984375, 1.29736328125, 1.6929931640625, 2.088623046875, 2.4842529296875, 2.8798828125, 3.2755126953125, 3.671142578125, 4.0667724609375, 4.46240234375, 4.8580322265625, 5.253662109375, 5.6492919921875, 6.044921875, 6.4405517578125, 6.836181640625, 7.2318115234375, 7.62744140625, 8.0230712890625, 8.418701171875, 8.8143310546875, 9.2099609375, 9.6055908203125, 10.001220703125, 10.3968505859375, 10.79248046875, 11.1881103515625, 11.583740234375, 11.9793701171875, 12.375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 7.0, 11.0, 6.0, 14.0, 19.0, 24.0, 16.0, 27.0, 30.0, 23.0, 17.0, 25.0, 47.0, 30.0, 42.0, 59.0, 99.0, 233.0, 596.0, 190.0, 68.0, 48.0, 39.0, 32.0, 33.0, 46.0, 19.0, 20.0, 21.0, 20.0, 17.0, 18.0, 19.0, 18.0, 14.0, 10.0, 13.0, 5.0, 11.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -27.01611328125, -26.1259765625, -25.23583984375, -24.345703125, -23.45556640625, -22.5654296875, -21.67529296875, -20.78515625, -19.89501953125, -19.0048828125, -18.11474609375, -17.224609375, -16.33447265625, -15.4443359375, -14.55419921875, -13.6640625, -12.77392578125, -11.8837890625, -10.99365234375, -10.103515625, -9.21337890625, -8.3232421875, -7.43310546875, -6.54296875, -5.65283203125, -4.7626953125, -3.87255859375, -2.982421875, -2.09228515625, -1.2021484375, -0.31201171875, 0.578125, 1.46826171875, 2.3583984375, 3.24853515625, 4.138671875, 5.02880859375, 5.9189453125, 6.80908203125, 7.69921875, 8.58935546875, 9.4794921875, 10.36962890625, 11.259765625, 12.14990234375, 13.0400390625, 13.93017578125, 14.8203125, 15.71044921875, 16.6005859375, 17.49072265625, 18.380859375, 19.27099609375, 20.1611328125, 21.05126953125, 21.94140625, 22.83154296875, 23.7216796875, 24.61181640625, 25.501953125, 26.39208984375, 27.2822265625, 28.17236328125, 29.0625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 14.0, 17.0, 12.0, 28.0, 43.0, 63.0, 73.0, 135.0, 207.0, 300.0, 471.0, 665.0, 1054.0, 1687.0, 2603.0, 4207.0, 6650.0, 11053.0, 18449.0, 30572.0, 53078.0, 96567.0, 185941.0, 409939.0, 3680958.0, 1132874.0, 312323.0, 150147.0, 79773.0, 44684.0, 25918.0, 15827.0, 9298.0, 5766.0, 3451.0, 2401.0, 1485.0, 897.0, 613.0, 377.0, 293.0, 180.0, 102.0, 79.0, 63.0, 30.0, 22.0, 21.0, 6.0, 7.0, 8.0, 0.0, 3.0, 4.0, 5.0], "bins": [-17.84375, -17.3165283203125, -16.789306640625, -16.2620849609375, -15.73486328125, -15.2076416015625, -14.680419921875, -14.1531982421875, -13.6259765625, -13.0987548828125, -12.571533203125, -12.0443115234375, -11.51708984375, -10.9898681640625, -10.462646484375, -9.9354248046875, -9.408203125, -8.8809814453125, -8.353759765625, -7.8265380859375, -7.29931640625, -6.7720947265625, -6.244873046875, -5.7176513671875, -5.1904296875, -4.6632080078125, -4.135986328125, -3.6087646484375, -3.08154296875, -2.5543212890625, -2.027099609375, -1.4998779296875, -0.97265625, -0.4454345703125, 0.081787109375, 0.6090087890625, 1.13623046875, 1.6634521484375, 2.190673828125, 2.7178955078125, 3.2451171875, 3.7723388671875, 4.299560546875, 4.8267822265625, 5.35400390625, 5.8812255859375, 6.408447265625, 6.9356689453125, 7.462890625, 7.9901123046875, 8.517333984375, 9.0445556640625, 9.57177734375, 10.0989990234375, 10.626220703125, 11.1534423828125, 11.6806640625, 12.2078857421875, 12.735107421875, 13.2623291015625, 13.78955078125, 14.3167724609375, 14.843994140625, 15.3712158203125, 15.8984375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 5.0, 9.0, 13.0, 17.0, 17.0, 24.0, 23.0, 20.0, 20.0, 32.0, 37.0, 49.0, 52.0, 48.0, 61.0, 134.0, 371.0, 469.0, 150.0, 70.0, 53.0, 45.0, 39.0, 38.0, 35.0, 27.0, 29.0, 24.0, 17.0, 21.0, 16.0, 9.0, 10.0, 6.0, 5.0, 5.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.578125, -20.860107421875, -20.14208984375, -19.424072265625, -18.7060546875, -17.988037109375, -17.27001953125, -16.552001953125, -15.833984375, -15.115966796875, -14.39794921875, -13.679931640625, -12.9619140625, -12.243896484375, -11.52587890625, -10.807861328125, -10.08984375, -9.371826171875, -8.65380859375, -7.935791015625, -7.2177734375, -6.499755859375, -5.78173828125, -5.063720703125, -4.345703125, -3.627685546875, -2.90966796875, -2.191650390625, -1.4736328125, -0.755615234375, -0.03759765625, 0.680419921875, 1.3984375, 2.116455078125, 2.83447265625, 3.552490234375, 4.2705078125, 4.988525390625, 5.70654296875, 6.424560546875, 7.142578125, 7.860595703125, 8.57861328125, 9.296630859375, 10.0146484375, 10.732666015625, 11.45068359375, 12.168701171875, 12.88671875, 13.604736328125, 14.32275390625, 15.040771484375, 15.7587890625, 16.476806640625, 17.19482421875, 17.912841796875, 18.630859375, 19.348876953125, 20.06689453125, 20.784912109375, 21.5029296875, 22.220947265625, 22.93896484375, 23.656982421875, 24.375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 2.0, 1.0, 12.0, 16.0, 37.0, 10.0, 20.0, 29.0, 32.0, 42.0, 59.0, 109.0, 115.0, 121.0, 201.0, 249.0, 341.0, 463.0, 584.0, 740.0, 1262.0, 1755.0, 2761.0, 4830.0, 8913.0, 18778.0, 50505.0, 333083.0, 5755173.0, 63563.0, 22568.0, 10138.0, 5366.0, 2906.0, 1981.0, 1227.0, 836.0, 674.0, 486.0, 328.0, 260.0, 184.0, 180.0, 144.0, 63.0, 61.0, 36.0, 45.0, 29.0, 35.0, 28.0, 20.0, 11.0, 8.0, 9.0, 12.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-42.375, -41.01220703125, -39.6494140625, -38.28662109375, -36.923828125, -35.56103515625, -34.1982421875, -32.83544921875, -31.47265625, -30.10986328125, -28.7470703125, -27.38427734375, -26.021484375, -24.65869140625, -23.2958984375, -21.93310546875, -20.5703125, -19.20751953125, -17.8447265625, -16.48193359375, -15.119140625, -13.75634765625, -12.3935546875, -11.03076171875, -9.66796875, -8.30517578125, -6.9423828125, -5.57958984375, -4.216796875, -2.85400390625, -1.4912109375, -0.12841796875, 1.234375, 2.59716796875, 3.9599609375, 5.32275390625, 6.685546875, 8.04833984375, 9.4111328125, 10.77392578125, 12.13671875, 13.49951171875, 14.8623046875, 16.22509765625, 17.587890625, 18.95068359375, 20.3134765625, 21.67626953125, 23.0390625, 24.40185546875, 25.7646484375, 27.12744140625, 28.490234375, 29.85302734375, 31.2158203125, 32.57861328125, 33.94140625, 35.30419921875, 36.6669921875, 38.02978515625, 39.392578125, 40.75537109375, 42.1181640625, 43.48095703125, 44.84375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 11.0, 9.0, 13.0, 14.0, 16.0, 23.0, 32.0, 23.0, 14.0, 35.0, 32.0, 33.0, 41.0, 66.0, 85.0, 123.0, 303.0, 428.0, 174.0, 108.0, 61.0, 45.0, 36.0, 32.0, 37.0, 43.0, 24.0, 21.0, 23.0, 18.0, 15.0, 14.0, 11.0, 4.0, 8.0, 5.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.59375, -14.125244140625, -13.65673828125, -13.188232421875, -12.7197265625, -12.251220703125, -11.78271484375, -11.314208984375, -10.845703125, -10.377197265625, -9.90869140625, -9.440185546875, -8.9716796875, -8.503173828125, -8.03466796875, -7.566162109375, -7.09765625, -6.629150390625, -6.16064453125, -5.692138671875, -5.2236328125, -4.755126953125, -4.28662109375, -3.818115234375, -3.349609375, -2.881103515625, -2.41259765625, -1.944091796875, -1.4755859375, -1.007080078125, -0.53857421875, -0.070068359375, 0.3984375, 0.866943359375, 1.33544921875, 1.803955078125, 2.2724609375, 2.740966796875, 3.20947265625, 3.677978515625, 4.146484375, 4.614990234375, 5.08349609375, 5.552001953125, 6.0205078125, 6.489013671875, 6.95751953125, 7.426025390625, 7.89453125, 8.363037109375, 8.83154296875, 9.300048828125, 9.7685546875, 10.237060546875, 10.70556640625, 11.174072265625, 11.642578125, 12.111083984375, 12.57958984375, 13.048095703125, 13.5166015625, 13.985107421875, 14.45361328125, 14.922119140625, 15.390625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 14.0, 27.0, 35.0, 66.0, 98.0, 310.0, 229.0, 90.0, 42.0, 29.0, 23.0, 8.0, 7.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-54.848812103271484, -53.179542541503906, -51.51027297973633, -49.84100341796875, -48.17173767089844, -46.50246810913086, -44.83319854736328, -43.1639289855957, -41.494659423828125, -39.82538986206055, -38.15612030029297, -36.486854553222656, -34.81758499145508, -33.1483154296875, -31.479045867919922, -29.809776306152344, -28.1405086517334, -26.47123908996582, -24.801971435546875, -23.132701873779297, -21.46343231201172, -19.79416275024414, -18.124895095825195, -16.455625534057617, -14.786356925964355, -13.117088317871094, -11.447818756103516, -9.778550148010254, -8.109281539916992, -6.440011978149414, -4.770743370056152, -3.101473808288574, -1.4322052001953125, 0.23706376552581787, 1.9063327312469482, 3.575601577758789, 5.244870662689209, 6.914139747619629, 8.58340835571289, 10.252677917480469, 11.92194652557373, 13.591215133666992, 15.26048469543457, 16.929752349853516, 18.599021911621094, 20.268291473388672, 21.93756103515625, 23.606830596923828, 25.276098251342773, 26.94536781311035, 28.614635467529297, 30.283905029296875, 31.953174591064453, 33.62244415283203, 35.291709899902344, 36.96098327636719, 38.6302490234375, 40.29951858520508, 41.968788146972656, 43.63805389404297, 45.30732345581055, 46.976593017578125, 48.6458625793457, 50.31513214111328, 51.98440170288086]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 9.0, 6.0, 7.0, 3.0, 14.0, 19.0, 14.0, 12.0, 17.0, 17.0, 30.0, 26.0, 32.0, 39.0, 33.0, 30.0, 41.0, 44.0, 45.0, 39.0, 30.0, 26.0, 32.0, 40.0, 37.0, 38.0, 35.0, 25.0, 33.0, 24.0, 32.0, 22.0, 23.0, 18.0, 17.0, 18.0, 9.0, 13.0, 6.0, 14.0, 4.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-19.893896102905273, -19.29180145263672, -18.68970489501953, -18.087610244750977, -17.485515594482422, -16.883419036865234, -16.28132438659668, -15.679228782653809, -15.077133178710938, -14.475037574768066, -13.872941970825195, -13.27084732055664, -12.66875171661377, -12.066656112670898, -11.464561462402344, -10.862465858459473, -10.260370254516602, -9.65827465057373, -9.05617904663086, -8.454084396362305, -7.851988792419434, -7.2498931884765625, -6.64779806137085, -6.045702934265137, -5.443607330322266, -4.8415117263793945, -4.239416599273682, -3.6373212337493896, -3.0352258682250977, -2.4331305027008057, -1.8310351371765137, -1.2289400100708008, -0.6268444061279297, -0.024749040603637695, 0.5773463249206543, 1.1794416904449463, 1.7815370559692383, 2.3836324214935303, 2.9857277870178223, 3.587822914123535, 4.189918518066406, 4.792014122009277, 5.39410924911499, 5.996204376220703, 6.598299980163574, 7.200395584106445, 7.802490711212158, 8.404585838317871, 9.006681442260742, 9.608777046203613, 10.210872650146484, 10.812967300415039, 11.41506290435791, 12.017158508300781, 12.619253158569336, 13.221348762512207, 13.823444366455078, 14.42553997039795, 15.02763557434082, 15.629730224609375, 16.231826782226562, 16.833921432495117, 17.436016082763672, 18.03811264038086, 18.640207290649414]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 18.0, 32.0, 30.0, 56.0, 73.0, 102.0, 196.0, 320.0, 504.0, 847.0, 1361.0, 2524.0, 4584.0, 9146.0, 22506.0, 4033760.0, 80575.0, 17740.0, 7877.0, 4305.0, 2541.0, 1605.0, 1069.0, 669.0, 515.0, 349.0, 234.0, 176.0, 145.0, 88.0, 73.0, 57.0, 50.0, 31.0, 12.0, 18.0, 14.0, 15.0, 8.0, 6.0, 3.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.03741455078125, -0.036070823669433594, -0.03472709655761719, -0.03338336944580078, -0.032039642333984375, -0.03069591522216797, -0.029352188110351562, -0.028008460998535156, -0.02666473388671875, -0.025321006774902344, -0.023977279663085938, -0.02263355255126953, -0.021289825439453125, -0.01994609832763672, -0.018602371215820312, -0.017258644104003906, -0.0159149169921875, -0.014571189880371094, -0.013227462768554688, -0.011883735656738281, -0.010540008544921875, -0.009196281433105469, -0.007852554321289062, -0.006508827209472656, -0.00516510009765625, -0.0038213729858398438, -0.0024776458740234375, -0.0011339187622070312, 0.000209808349609375, 0.0015535354614257812, 0.0028972625732421875, 0.004240989685058594, 0.005584716796875, 0.006928443908691406, 0.008272171020507812, 0.009615898132324219, 0.010959625244140625, 0.012303352355957031, 0.013647079467773438, 0.014990806579589844, 0.01633453369140625, 0.017678260803222656, 0.019021987915039062, 0.02036571502685547, 0.021709442138671875, 0.02305316925048828, 0.024396896362304688, 0.025740623474121094, 0.0270843505859375, 0.028428077697753906, 0.029771804809570312, 0.03111553192138672, 0.032459259033203125, 0.03380298614501953, 0.03514671325683594, 0.036490440368652344, 0.03783416748046875, 0.039177894592285156, 0.04052162170410156, 0.04186534881591797, 0.043209075927734375, 0.04455280303955078, 0.04589653015136719, 0.047240257263183594, 0.048583984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 2.0, 9.0, 5.0, 8.0, 6.0, 6.0, 7.0, 14.0, 15.0, 20.0, 766.0, 13.0, 9.0, 15.0, 15.0, 8.0, 14.0, 3.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00222015380859375, -0.0021397173404693604, -0.0020592808723449707, -0.001978844404220581, -0.0018984079360961914, -0.0018179714679718018, -0.0017375349998474121, -0.0016570985317230225, -0.0015766620635986328, -0.0014962255954742432, -0.0014157891273498535, -0.0013353526592254639, -0.0012549161911010742, -0.0011744797229766846, -0.001094043254852295, -0.0010136067867279053, -0.0009331703186035156, -0.000852733850479126, -0.0007722973823547363, -0.0006918609142303467, -0.000611424446105957, -0.0005309879779815674, -0.00045055150985717773, -0.0003701150417327881, -0.00028967857360839844, -0.0002092421054840088, -0.00012880563735961914, -4.836916923522949e-05, 3.2067298889160156e-05, 0.0001125037670135498, 0.00019294023513793945, 0.0002733767032623291, 0.00035381317138671875, 0.0004342496395111084, 0.000514686107635498, 0.0005951225757598877, 0.0006755590438842773, 0.000755995512008667, 0.0008364319801330566, 0.0009168684482574463, 0.000997304916381836, 0.0010777413845062256, 0.0011581778526306152, 0.0012386143207550049, 0.0013190507888793945, 0.0013994872570037842, 0.0014799237251281738, 0.0015603601932525635, 0.0016407966613769531, 0.0017212331295013428, 0.0018016695976257324, 0.001882106065750122, 0.0019625425338745117, 0.0020429790019989014, 0.002123415470123291, 0.0022038519382476807, 0.0022842884063720703, 0.00236472487449646, 0.0024451613426208496, 0.0025255978107452393, 0.002606034278869629, 0.0026864707469940186, 0.002766907215118408, 0.002847343683242798, 0.0029277801513671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 2.0, 8.0, 4.0, 5.0, 5.0, 15.0, 17.0, 24.0, 22.0, 29.0, 63.0, 61.0, 82.0, 122.0, 178.0, 237.0, 349.0, 507.0, 839.0, 1387.0, 2793.0, 6550.0, 23616.0, 290995.0, 3802970.0, 45424.0, 9477.0, 3678.0, 1815.0, 1008.0, 613.0, 408.0, 247.0, 203.0, 142.0, 99.0, 67.0, 51.0, 38.0, 37.0, 23.0, 17.0, 18.0, 7.0, 15.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05938720703125, -0.0574188232421875, -0.055450439453125, -0.0534820556640625, -0.051513671875, -0.0495452880859375, -0.047576904296875, -0.0456085205078125, -0.04364013671875, -0.0416717529296875, -0.039703369140625, -0.0377349853515625, -0.0357666015625, -0.0337982177734375, -0.031829833984375, -0.0298614501953125, -0.02789306640625, -0.0259246826171875, -0.023956298828125, -0.0219879150390625, -0.02001953125, -0.0180511474609375, -0.016082763671875, -0.0141143798828125, -0.01214599609375, -0.0101776123046875, -0.008209228515625, -0.0062408447265625, -0.0042724609375, -0.0023040771484375, -0.000335693359375, 0.0016326904296875, 0.00360107421875, 0.0055694580078125, 0.007537841796875, 0.0095062255859375, 0.011474609375, 0.0134429931640625, 0.015411376953125, 0.0173797607421875, 0.01934814453125, 0.0213165283203125, 0.023284912109375, 0.0252532958984375, 0.0272216796875, 0.0291900634765625, 0.031158447265625, 0.0331268310546875, 0.03509521484375, 0.0370635986328125, 0.039031982421875, 0.0410003662109375, 0.04296875, 0.0449371337890625, 0.046905517578125, 0.0488739013671875, 0.05084228515625, 0.0528106689453125, 0.054779052734375, 0.0567474365234375, 0.0587158203125, 0.0606842041015625, 0.062652587890625, 0.0646209716796875, 0.06658935546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 6.0, 9.0, 7.0, 12.0, 11.0, 27.0, 21.0, 24.0, 28.0, 30.0, 37.0, 63.0, 62.0, 85.0, 138.0, 314.0, 2255.0, 301.0, 161.0, 91.0, 64.0, 47.0, 35.0, 27.0, 26.0, 29.0, 20.0, 21.0, 16.0, 11.0, 17.0, 15.0, 10.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00586700439453125, -0.005668163299560547, -0.005469322204589844, -0.005270481109619141, -0.0050716400146484375, -0.004872798919677734, -0.004673957824707031, -0.004475116729736328, -0.004276275634765625, -0.004077434539794922, -0.0038785934448242188, -0.0036797523498535156, -0.0034809112548828125, -0.0032820701599121094, -0.0030832290649414062, -0.002884387969970703, -0.002685546875, -0.002486705780029297, -0.0022878646850585938, -0.0020890235900878906, -0.0018901824951171875, -0.0016913414001464844, -0.0014925003051757812, -0.0012936592102050781, -0.001094818115234375, -0.0008959770202636719, -0.0006971359252929688, -0.0004982948303222656, -0.0002994537353515625, -0.00010061264038085938, 9.822845458984375e-05, 0.0002970695495605469, 0.00049591064453125, 0.0006947517395019531, 0.0008935928344726562, 0.0010924339294433594, 0.0012912750244140625, 0.0014901161193847656, 0.0016889572143554688, 0.0018877983093261719, 0.002086639404296875, 0.002285480499267578, 0.0024843215942382812, 0.0026831626892089844, 0.0028820037841796875, 0.0030808448791503906, 0.0032796859741210938, 0.003478527069091797, 0.0036773681640625, 0.003876209259033203, 0.004075050354003906, 0.004273891448974609, 0.0044727325439453125, 0.004671573638916016, 0.004870414733886719, 0.005069255828857422, 0.005268096923828125, 0.005466938018798828, 0.005665779113769531, 0.005864620208740234, 0.0060634613037109375, 0.006262302398681641, 0.006461143493652344, 0.006659984588623047, 0.00685882568359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 12.0, 20.0, 48.0, 103.0, 373.0, 286.0, 81.0, 32.0, 15.0, 10.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10142126679420471, -0.09874217957258224, -0.09606309235095978, -0.09338401257991791, -0.09070492535829544, -0.08802583813667297, -0.0853467583656311, -0.08266767114400864, -0.07998858392238617, -0.0773094967007637, -0.07463040947914124, -0.07195132970809937, -0.0692722424864769, -0.06659315526485443, -0.06391407549381256, -0.061234988272190094, -0.05855590105056763, -0.05587681382894516, -0.05319773033261299, -0.05051864683628082, -0.047839559614658356, -0.04516047239303589, -0.04248138889670372, -0.03980230540037155, -0.037123218178749084, -0.03444413095712662, -0.03176504746079445, -0.02908596210181713, -0.026406876742839813, -0.023727791383862495, -0.021048706024885178, -0.01836962066590786, -0.015690535306930542, -0.013011449947953224, -0.010332364588975906, -0.0076532792299985886, -0.004974193871021271, -0.002295108512043953, 0.00038397684693336487, 0.0030630622059106827, 0.0057421475648880005, 0.008421232923865318, 0.011100318282842636, 0.013779403641819954, 0.01645848900079727, 0.01913757435977459, 0.021816659718751907, 0.024495745077729225, 0.027174830436706543, 0.02985391579568386, 0.03253300115466118, 0.03521208465099335, 0.037891171872615814, 0.04057025909423828, 0.04324934259057045, 0.04592842608690262, 0.048607513308525085, 0.05128660053014755, 0.05396568402647972, 0.05664476752281189, 0.05932385474443436, 0.062002941966056824, 0.0646820217370987, 0.06736110895872116, 0.07004019618034363]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 9.0, 4.0, 2.0, 6.0, 8.0, 17.0, 15.0, 20.0, 18.0, 21.0, 30.0, 25.0, 46.0, 42.0, 55.0, 68.0, 56.0, 53.0, 52.0, 49.0, 47.0, 46.0, 40.0, 39.0, 43.0, 32.0, 28.0, 32.0, 18.0, 17.0, 17.0, 9.0, 11.0, 5.0, 2.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024932682514190674, -0.024112656712532043, -0.023292630910873413, -0.022472605109214783, -0.021652579307556152, -0.020832553505897522, -0.02001252770423889, -0.01919250190258026, -0.01837247610092163, -0.017552450299263, -0.01673242449760437, -0.01591239869594574, -0.01509237289428711, -0.014272347092628479, -0.013452321290969849, -0.012632295489311218, -0.011812269687652588, -0.010992243885993958, -0.010172218084335327, -0.009352192282676697, -0.008532166481018066, -0.007712140679359436, -0.006892114877700806, -0.006072089076042175, -0.005252063274383545, -0.0044320374727249146, -0.003612011671066284, -0.002791985869407654, -0.0019719600677490234, -0.001151934266090393, -0.0003319084644317627, 0.0004881173372268677, 0.001308143138885498, 0.0021281689405441284, 0.002948194742202759, 0.003768220543861389, 0.0045882463455200195, 0.00540827214717865, 0.00622829794883728, 0.007048323750495911, 0.007868349552154541, 0.008688375353813171, 0.009508401155471802, 0.010328426957130432, 0.011148452758789062, 0.011968478560447693, 0.012788504362106323, 0.013608530163764954, 0.014428555965423584, 0.015248581767082214, 0.016068607568740845, 0.016888633370399475, 0.017708659172058105, 0.018528684973716736, 0.019348710775375366, 0.020168736577033997, 0.020988762378692627, 0.021808788180351257, 0.022628813982009888, 0.023448839783668518, 0.02426886558532715, 0.02508889138698578, 0.02590891718864441, 0.02672894299030304, 0.02754896879196167]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 2.0, 9.0, 15.0, 11.0, 19.0, 23.0, 24.0, 31.0, 28.0, 58.0, 74.0, 107.0, 116.0, 185.0, 212.0, 354.0, 452.0, 645.0, 861.0, 1350.0, 1991.0, 2881.0, 4619.0, 7645.0, 13601.0, 31032.0, 886126.0, 51566.0, 18494.0, 9360.0, 5476.0, 3554.0, 2210.0, 1515.0, 1091.0, 736.0, 544.0, 379.0, 319.0, 207.0, 143.0, 126.0, 88.0, 67.0, 59.0, 42.0, 26.0, 26.0, 17.0, 10.0, 8.0, 9.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-0.035552978515625, -0.034465789794921875, -0.03337860107421875, -0.032291412353515625, -0.0312042236328125, -0.030117034912109375, -0.02902984619140625, -0.027942657470703125, -0.02685546875, -0.025768280029296875, -0.02468109130859375, -0.023593902587890625, -0.0225067138671875, -0.021419525146484375, -0.02033233642578125, -0.019245147705078125, -0.018157958984375, -0.017070770263671875, -0.01598358154296875, -0.014896392822265625, -0.0138092041015625, -0.012722015380859375, -0.01163482666015625, -0.010547637939453125, -0.00946044921875, -0.008373260498046875, -0.00728607177734375, -0.006198883056640625, -0.0051116943359375, -0.004024505615234375, -0.00293731689453125, -0.001850128173828125, -0.000762939453125, 0.000324249267578125, 0.00141143798828125, 0.002498626708984375, 0.0035858154296875, 0.004673004150390625, 0.00576019287109375, 0.006847381591796875, 0.0079345703125, 0.009021759033203125, 0.01010894775390625, 0.011196136474609375, 0.0122833251953125, 0.013370513916015625, 0.01445770263671875, 0.015544891357421875, 0.016632080078125, 0.017719268798828125, 0.01880645751953125, 0.019893646240234375, 0.0209808349609375, 0.022068023681640625, 0.02315521240234375, 0.024242401123046875, 0.02532958984375, 0.026416778564453125, 0.02750396728515625, 0.028591156005859375, 0.0296783447265625, 0.030765533447265625, 0.03185272216796875, 0.032939910888671875, 0.034027099609375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 8.0, 4.0, 9.0, 4.0, 6.0, 10.0, 14.0, 19.0, 519.0, 264.0, 13.0, 11.0, 15.0, 13.0, 10.0, 7.0, 8.0, 5.0, 3.0, 5.0, 5.0, 2.0, 2.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002288818359375, -0.002207636833190918, -0.002126455307006836, -0.002045273780822754, -0.001964092254638672, -0.0018829107284545898, -0.0018017292022705078, -0.0017205476760864258, -0.0016393661499023438, -0.0015581846237182617, -0.0014770030975341797, -0.0013958215713500977, -0.0013146400451660156, -0.0012334585189819336, -0.0011522769927978516, -0.0010710954666137695, -0.0009899139404296875, -0.0009087324142456055, -0.0008275508880615234, -0.0007463693618774414, -0.0006651878356933594, -0.0005840063095092773, -0.0005028247833251953, -0.0004216432571411133, -0.00034046173095703125, -0.0002592802047729492, -0.0001780986785888672, -9.691715240478516e-05, -1.5735626220703125e-05, 6.54458999633789e-05, 0.00014662742614746094, 0.00022780895233154297, 0.000308990478515625, 0.00039017200469970703, 0.00047135353088378906, 0.0005525350570678711, 0.0006337165832519531, 0.0007148981094360352, 0.0007960796356201172, 0.0008772611618041992, 0.0009584426879882812, 0.0010396242141723633, 0.0011208057403564453, 0.0012019872665405273, 0.0012831687927246094, 0.0013643503189086914, 0.0014455318450927734, 0.0015267133712768555, 0.0016078948974609375, 0.0016890764236450195, 0.0017702579498291016, 0.0018514394760131836, 0.0019326210021972656, 0.0020138025283813477, 0.0020949840545654297, 0.0021761655807495117, 0.0022573471069335938, 0.0023385286331176758, 0.002419710159301758, 0.00250089168548584, 0.002582073211669922, 0.002663254737854004, 0.002744436264038086, 0.002825617790222168, 0.00290679931640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 6.0, 10.0, 15.0, 21.0, 31.0, 40.0, 66.0, 89.0, 134.0, 171.0, 261.0, 455.0, 668.0, 1102.0, 2053.0, 4279.0, 10927.0, 58609.0, 892435.0, 56916.0, 10912.0, 4234.0, 2067.0, 1096.0, 664.0, 416.0, 266.0, 185.0, 127.0, 87.0, 55.0, 42.0, 21.0, 27.0, 12.0, 16.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.07028913497924805, -0.0681905746459961, -0.06609201431274414, -0.06399345397949219, -0.061894893646240234, -0.05979633331298828, -0.05769777297973633, -0.055599212646484375, -0.05350065231323242, -0.05140209197998047, -0.049303531646728516, -0.04720497131347656, -0.04510641098022461, -0.043007850646972656, -0.0409092903137207, -0.03881072998046875, -0.0367121696472168, -0.034613609313964844, -0.03251504898071289, -0.030416488647460938, -0.028317928314208984, -0.02621936798095703, -0.024120807647705078, -0.022022247314453125, -0.019923686981201172, -0.01782512664794922, -0.015726566314697266, -0.013628005981445312, -0.01152944564819336, -0.009430885314941406, -0.007332324981689453, -0.0052337646484375, -0.003135204315185547, -0.0010366439819335938, 0.0010619163513183594, 0.0031604766845703125, 0.005259037017822266, 0.007357597351074219, 0.009456157684326172, 0.011554718017578125, 0.013653278350830078, 0.01575183868408203, 0.017850399017333984, 0.019948959350585938, 0.02204751968383789, 0.024146080017089844, 0.026244640350341797, 0.02834320068359375, 0.030441761016845703, 0.032540321350097656, 0.03463888168334961, 0.03673744201660156, 0.038836002349853516, 0.04093456268310547, 0.04303312301635742, 0.045131683349609375, 0.04723024368286133, 0.04932880401611328, 0.051427364349365234, 0.05352592468261719, 0.05562448501586914, 0.057723045349121094, 0.05982160568237305, 0.061920166015625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 5.0, 17.0, 13.0, 22.0, 17.0, 20.0, 27.0, 25.0, 34.0, 38.0, 42.0, 43.0, 45.0, 41.0, 35.0, 48.0, 50.0, 48.0, 43.0, 54.0, 54.0, 31.0, 37.0, 18.0, 35.0, 30.0, 28.0, 17.0, 17.0, 5.0, 14.0, 6.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0148162841796875, -0.014390110969543457, -0.013963937759399414, -0.013537764549255371, -0.013111591339111328, -0.012685418128967285, -0.012259244918823242, -0.0118330717086792, -0.011406898498535156, -0.010980725288391113, -0.01055455207824707, -0.010128378868103027, -0.009702205657958984, -0.009276032447814941, -0.008849859237670898, -0.008423686027526855, -0.007997512817382812, -0.0075713396072387695, -0.0071451663970947266, -0.006718993186950684, -0.006292819976806641, -0.005866646766662598, -0.005440473556518555, -0.005014300346374512, -0.004588127136230469, -0.004161953926086426, -0.003735780715942383, -0.00330960750579834, -0.002883434295654297, -0.002457261085510254, -0.002031087875366211, -0.001604914665222168, -0.001178741455078125, -0.000752568244934082, -0.00032639503479003906, 9.97781753540039e-05, 0.0005259513854980469, 0.0009521245956420898, 0.0013782978057861328, 0.0018044710159301758, 0.0022306442260742188, 0.0026568174362182617, 0.0030829906463623047, 0.0035091638565063477, 0.003935337066650391, 0.004361510276794434, 0.0047876834869384766, 0.0052138566970825195, 0.0056400299072265625, 0.0060662031173706055, 0.0064923763275146484, 0.006918549537658691, 0.007344722747802734, 0.007770895957946777, 0.00819706916809082, 0.008623242378234863, 0.009049415588378906, 0.00947558879852295, 0.009901762008666992, 0.010327935218811035, 0.010754108428955078, 0.011180281639099121, 0.011606454849243164, 0.012032628059387207, 0.01245880126953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 3.0, 4.0, 8.0, 9.0, 5.0, 12.0, 12.0, 12.0, 20.0, 19.0, 20.0, 36.0, 60.0, 92.0, 365.0, 2008.0, 59916.0, 980823.0, 4176.0, 558.0, 154.0, 59.0, 29.0, 31.0, 19.0, 11.0, 18.0, 18.0, 6.0, 13.0, 6.0, 6.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028533935546875, -0.02767348289489746, -0.026813030242919922, -0.025952577590942383, -0.025092124938964844, -0.024231672286987305, -0.023371219635009766, -0.022510766983032227, -0.021650314331054688, -0.02078986167907715, -0.01992940902709961, -0.01906895637512207, -0.01820850372314453, -0.017348051071166992, -0.016487598419189453, -0.015627145767211914, -0.014766693115234375, -0.013906240463256836, -0.013045787811279297, -0.012185335159301758, -0.011324882507324219, -0.01046442985534668, -0.00960397720336914, -0.008743524551391602, -0.007883071899414062, -0.0070226192474365234, -0.006162166595458984, -0.005301713943481445, -0.004441261291503906, -0.003580808639526367, -0.002720355987548828, -0.001859903335571289, -0.00099945068359375, -0.00013899803161621094, 0.0007214546203613281, 0.0015819072723388672, 0.0024423599243164062, 0.0033028125762939453, 0.004163265228271484, 0.0050237178802490234, 0.0058841705322265625, 0.0067446231842041016, 0.007605075836181641, 0.00846552848815918, 0.009325981140136719, 0.010186433792114258, 0.011046886444091797, 0.011907339096069336, 0.012767791748046875, 0.013628244400024414, 0.014488697052001953, 0.015349149703979492, 0.01620960235595703, 0.01707005500793457, 0.01793050765991211, 0.01879096031188965, 0.019651412963867188, 0.020511865615844727, 0.021372318267822266, 0.022232770919799805, 0.023093223571777344, 0.023953676223754883, 0.024814128875732422, 0.02567458152770996, 0.0265350341796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 3.0, 14.0, 12.0, 18.0, 23.0, 24.0, 37.0, 35.0, 51.0, 65.0, 124.0, 98.0, 120.0, 86.0, 58.0, 41.0, 37.0, 24.0, 29.0, 15.0, 21.0, 11.0, 6.0, 5.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2695789337158203e-05, -1.2317672371864319e-05, -1.1939555406570435e-05, -1.156143844127655e-05, -1.1183321475982666e-05, -1.0805204510688782e-05, -1.0427087545394897e-05, -1.0048970580101013e-05, -9.670853614807129e-06, -9.292736649513245e-06, -8.91461968421936e-06, -8.536502718925476e-06, -8.158385753631592e-06, -7.780268788337708e-06, -7.402151823043823e-06, -7.024034857749939e-06, -6.645917892456055e-06, -6.26780092716217e-06, -5.889683961868286e-06, -5.511566996574402e-06, -5.133450031280518e-06, -4.755333065986633e-06, -4.377216100692749e-06, -3.999099135398865e-06, -3.6209821701049805e-06, -3.242865204811096e-06, -2.864748239517212e-06, -2.4866312742233276e-06, -2.1085143089294434e-06, -1.730397343635559e-06, -1.3522803783416748e-06, -9.741634130477905e-07, -5.960464477539062e-07, -2.1792948246002197e-07, 1.601874828338623e-07, 5.383044481277466e-07, 9.164214134216309e-07, 1.2945383787155151e-06, 1.6726553440093994e-06, 2.0507723093032837e-06, 2.428889274597168e-06, 2.8070062398910522e-06, 3.1851232051849365e-06, 3.563240170478821e-06, 3.941357135772705e-06, 4.319474101066589e-06, 4.697591066360474e-06, 5.075708031654358e-06, 5.453824996948242e-06, 5.8319419622421265e-06, 6.210058927536011e-06, 6.588175892829895e-06, 6.966292858123779e-06, 7.3444098234176636e-06, 7.722526788711548e-06, 8.100643754005432e-06, 8.478760719299316e-06, 8.8568776845932e-06, 9.234994649887085e-06, 9.61311161518097e-06, 9.991228580474854e-06, 1.0369345545768738e-05, 1.0747462511062622e-05, 1.1125579476356506e-05, 1.150369644165039e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 13.0, 35.0, 31.0, 68.0, 167.0, 351.0, 1054.0, 4942.0, 117170.0, 914923.0, 7581.0, 1363.0, 454.0, 189.0, 72.0, 43.0, 27.0, 20.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.049591064453125, -0.04809284210205078, -0.04659461975097656, -0.045096397399902344, -0.043598175048828125, -0.042099952697753906, -0.04060173034667969, -0.03910350799560547, -0.03760528564453125, -0.03610706329345703, -0.03460884094238281, -0.033110618591308594, -0.031612396240234375, -0.030114173889160156, -0.028615951538085938, -0.02711772918701172, -0.0256195068359375, -0.02412128448486328, -0.022623062133789062, -0.021124839782714844, -0.019626617431640625, -0.018128395080566406, -0.016630172729492188, -0.015131950378417969, -0.01363372802734375, -0.012135505676269531, -0.010637283325195312, -0.009139060974121094, -0.007640838623046875, -0.006142616271972656, -0.0046443939208984375, -0.0031461715698242188, -0.00164794921875, -0.00014972686767578125, 0.0013484954833984375, 0.0028467178344726562, 0.004344940185546875, 0.005843162536621094, 0.0073413848876953125, 0.008839607238769531, 0.01033782958984375, 0.011836051940917969, 0.013334274291992188, 0.014832496643066406, 0.016330718994140625, 0.017828941345214844, 0.019327163696289062, 0.02082538604736328, 0.0223236083984375, 0.02382183074951172, 0.025320053100585938, 0.026818275451660156, 0.028316497802734375, 0.029814720153808594, 0.03131294250488281, 0.03281116485595703, 0.03430938720703125, 0.03580760955810547, 0.03730583190917969, 0.038804054260253906, 0.040302276611328125, 0.041800498962402344, 0.04329872131347656, 0.04479694366455078, 0.046295166015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 2.0, 13.0, 12.0, 14.0, 14.0, 12.0, 20.0, 24.0, 76.0, 162.0, 347.0, 117.0, 59.0, 23.0, 19.0, 17.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00878143310546875, -0.008482813835144043, -0.008184194564819336, -0.007885575294494629, -0.007586956024169922, -0.007288336753845215, -0.006989717483520508, -0.006691098213195801, -0.006392478942871094, -0.006093859672546387, -0.00579524040222168, -0.005496621131896973, -0.005198001861572266, -0.004899382591247559, -0.0046007633209228516, -0.0043021440505981445, -0.0040035247802734375, -0.0037049055099487305, -0.0034062862396240234, -0.0031076669692993164, -0.0028090476989746094, -0.0025104284286499023, -0.0022118091583251953, -0.0019131898880004883, -0.0016145706176757812, -0.0013159513473510742, -0.0010173320770263672, -0.0007187128067016602, -0.0004200935363769531, -0.0001214742660522461, 0.00017714500427246094, 0.00047576427459716797, 0.000774383544921875, 0.001073002815246582, 0.001371622085571289, 0.001670241355895996, 0.001968860626220703, 0.00226747989654541, 0.002566099166870117, 0.0028647184371948242, 0.0031633377075195312, 0.0034619569778442383, 0.0037605762481689453, 0.004059195518493652, 0.004357814788818359, 0.004656434059143066, 0.0049550533294677734, 0.0052536725997924805, 0.0055522918701171875, 0.0058509111404418945, 0.0061495304107666016, 0.006448149681091309, 0.006746768951416016, 0.007045388221740723, 0.00734400749206543, 0.007642626762390137, 0.007941246032714844, 0.00823986530303955, 0.008538484573364258, 0.008837103843688965, 0.009135723114013672, 0.009434342384338379, 0.009732961654663086, 0.010031580924987793, 0.0103302001953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 10.0, 10.0, 14.0, 16.0, 66.0, 650.0, 147.0, 30.0, 8.0, 12.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6662124395370483, -0.6485141515731812, -0.630815863609314, -0.6131175756454468, -0.5954192876815796, -0.5777209401130676, -0.5600226521492004, -0.5423243641853333, -0.5246260762214661, -0.5069277882575989, -0.4892295002937317, -0.4715311825275421, -0.4538328945636749, -0.43613460659980774, -0.41843628883361816, -0.400738000869751, -0.3830397129058838, -0.3653414249420166, -0.3476431369781494, -0.32994481921195984, -0.31224653124809265, -0.29454824328422546, -0.2768499255180359, -0.2591516375541687, -0.2414533495903015, -0.22375506162643433, -0.20605675876140594, -0.18835845589637756, -0.17066016793251038, -0.1529618799686432, -0.1352635771036148, -0.11756528168916702, -0.09986692667007446, -0.08216863125562668, -0.0644703358411789, -0.04677204042673111, -0.029073745012283325, -0.01137544959783554, 0.006322845816612244, 0.024021141231060028, 0.04171943664550781, 0.0594177320599556, 0.07711602747440338, 0.09481432288885117, 0.11251261830329895, 0.13021090626716614, 0.14790920913219452, 0.1656075119972229, 0.1833057999610901, 0.20100408792495728, 0.21870239078998566, 0.23640069365501404, 0.2540989816188812, 0.2717972695827484, 0.289495587348938, 0.3071938753128052, 0.32489216327667236, 0.34259045124053955, 0.36028873920440674, 0.3779870569705963, 0.3956853449344635, 0.4133836328983307, 0.43108195066452026, 0.44878023862838745, 0.46647852659225464]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 8.0, 15.0, 11.0, 18.0, 27.0, 53.0, 67.0, 139.0, 162.0, 158.0, 110.0, 58.0, 47.0, 23.0, 11.0, 11.0, 9.0, 9.0, 5.0, 7.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2487790584564209, -0.2416069060564041, -0.23443473875522614, -0.22726258635520935, -0.22009043395519257, -0.21291828155517578, -0.2057461142539978, -0.19857396185398102, -0.19140180945396423, -0.18422965705394745, -0.17705748975276947, -0.16988533735275269, -0.1627131849527359, -0.15554103255271912, -0.14836886525154114, -0.14119671285152435, -0.13402454555034637, -0.1268523931503296, -0.11968023329973221, -0.11250807344913483, -0.10533592104911804, -0.09816376119852066, -0.09099160134792328, -0.0838194489479065, -0.07664728909730911, -0.06947512924671173, -0.062302976846694946, -0.055130816996097565, -0.04795866087079048, -0.0407865047454834, -0.03361434489488602, -0.026442188769578934, -0.01927003264427185, -0.012097875587642193, -0.004925718531012535, 0.0022464394569396973, 0.00941859558224678, 0.016590751707553864, 0.023762911558151245, 0.030935067683458328, 0.03810722380876541, 0.045279379934072495, 0.05245153605937958, 0.05962369590997696, 0.06679585576057434, 0.07396800816059113, 0.08114016801118851, 0.08831232786178589, 0.09548448026180267, 0.10265664011240005, 0.10982879251241684, 0.11700095236301422, 0.124173104763031, 0.13134527206420898, 0.13851742446422577, 0.14568957686424255, 0.15286174416542053, 0.16003389656543732, 0.1672060638666153, 0.17437821626663208, 0.18155036866664886, 0.18872252106666565, 0.19589468836784363, 0.2030668407678604, 0.2102389931678772]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 5.0, 7.0, 13.0, 17.0, 14.0, 17.0, 25.0, 28.0, 38.0, 74.0, 533.0, 29103.0, 4154368.0, 9062.0, 637.0, 98.0, 60.0, 34.0, 15.0, 26.0, 12.0, 7.0, 15.0, 10.0, 5.0, 8.0, 5.0, 3.0, 5.0, 4.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.853515625, -3.712432861328125, -3.57135009765625, -3.430267333984375, -3.2891845703125, -3.148101806640625, -3.00701904296875, -2.865936279296875, -2.724853515625, -2.583770751953125, -2.44268798828125, -2.301605224609375, -2.1605224609375, -2.019439697265625, -1.87835693359375, -1.737274169921875, -1.59619140625, -1.455108642578125, -1.31402587890625, -1.172943115234375, -1.0318603515625, -0.890777587890625, -0.74969482421875, -0.608612060546875, -0.467529296875, -0.326446533203125, -0.18536376953125, -0.044281005859375, 0.0968017578125, 0.237884521484375, 0.37896728515625, 0.520050048828125, 0.6611328125, 0.802215576171875, 0.94329833984375, 1.084381103515625, 1.2254638671875, 1.366546630859375, 1.50762939453125, 1.648712158203125, 1.789794921875, 1.930877685546875, 2.07196044921875, 2.213043212890625, 2.3541259765625, 2.495208740234375, 2.63629150390625, 2.777374267578125, 2.91845703125, 3.059539794921875, 3.20062255859375, 3.341705322265625, 3.4827880859375, 3.623870849609375, 3.76495361328125, 3.906036376953125, 4.047119140625, 4.188201904296875, 4.32928466796875, 4.470367431640625, 4.6114501953125, 4.752532958984375, 4.89361572265625, 5.034698486328125, 5.17578125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 7.0, 7.0, 5.0, 7.0, 5.0, 6.0, 6.0, 14.0, 26.0, 312.0, 469.0, 11.0, 9.0, 16.0, 13.0, 8.0, 11.0, 6.0, 9.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022716522216796875, -0.0021914243698120117, -0.002111196517944336, -0.00203096866607666, -0.0019507408142089844, -0.0018705129623413086, -0.0017902851104736328, -0.001710057258605957, -0.0016298294067382812, -0.0015496015548706055, -0.0014693737030029297, -0.001389145851135254, -0.0013089179992675781, -0.0012286901473999023, -0.0011484622955322266, -0.0010682344436645508, -0.000988006591796875, -0.0009077787399291992, -0.0008275508880615234, -0.0007473230361938477, -0.0006670951843261719, -0.0005868673324584961, -0.0005066394805908203, -0.00042641162872314453, -0.00034618377685546875, -0.00026595592498779297, -0.0001857280731201172, -0.0001055002212524414, -2.5272369384765625e-05, 5.4955482482910156e-05, 0.00013518333435058594, 0.00021541118621826172, 0.0002956390380859375, 0.0003758668899536133, 0.00045609474182128906, 0.0005363225936889648, 0.0006165504455566406, 0.0006967782974243164, 0.0007770061492919922, 0.000857234001159668, 0.0009374618530273438, 0.0010176897048950195, 0.0010979175567626953, 0.001178145408630371, 0.0012583732604980469, 0.0013386011123657227, 0.0014188289642333984, 0.0014990568161010742, 0.00157928466796875, 0.0016595125198364258, 0.0017397403717041016, 0.0018199682235717773, 0.0019001960754394531, 0.001980423927307129, 0.0020606517791748047, 0.0021408796310424805, 0.0022211074829101562, 0.002301335334777832, 0.002381563186645508, 0.0024617910385131836, 0.0025420188903808594, 0.002622246742248535, 0.002702474594116211, 0.0027827024459838867, 0.0028629302978515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 6.0, 18.0, 18.0, 25.0, 31.0, 44.0, 65.0, 78.0, 111.0, 137.0, 237.0, 1298.0, 4180975.0, 10302.0, 330.0, 161.0, 121.0, 99.0, 60.0, 50.0, 31.0, 26.0, 18.0, 10.0, 10.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1220703125, -1.078399658203125, -1.03472900390625, -0.991058349609375, -0.9473876953125, -0.903717041015625, -0.86004638671875, -0.816375732421875, -0.772705078125, -0.729034423828125, -0.68536376953125, -0.641693115234375, -0.5980224609375, -0.554351806640625, -0.51068115234375, -0.467010498046875, -0.42333984375, -0.379669189453125, -0.33599853515625, -0.292327880859375, -0.2486572265625, -0.204986572265625, -0.16131591796875, -0.117645263671875, -0.073974609375, -0.030303955078125, 0.01336669921875, 0.057037353515625, 0.1007080078125, 0.144378662109375, 0.18804931640625, 0.231719970703125, 0.275390625, 0.319061279296875, 0.36273193359375, 0.406402587890625, 0.4500732421875, 0.493743896484375, 0.53741455078125, 0.581085205078125, 0.624755859375, 0.668426513671875, 0.71209716796875, 0.755767822265625, 0.7994384765625, 0.843109130859375, 0.88677978515625, 0.930450439453125, 0.97412109375, 1.017791748046875, 1.06146240234375, 1.105133056640625, 1.1488037109375, 1.192474365234375, 1.23614501953125, 1.279815673828125, 1.323486328125, 1.367156982421875, 1.41082763671875, 1.454498291015625, 1.4981689453125, 1.541839599609375, 1.58551025390625, 1.629180908203125, 1.6728515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 17.0, 17.0, 24.0, 24.0, 47.0, 68.0, 67.0, 108.0, 143.0, 205.0, 334.0, 1558.0, 511.0, 290.0, 167.0, 124.0, 115.0, 68.0, 57.0, 28.0, 27.0, 20.0, 13.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00867462158203125, -0.00833892822265625, -0.00800323486328125, -0.00766754150390625, -0.00733184814453125, -0.00699615478515625, -0.00666046142578125, -0.00632476806640625, -0.00598907470703125, -0.00565338134765625, -0.00531768798828125, -0.00498199462890625, -0.00464630126953125, -0.00431060791015625, -0.00397491455078125, -0.00363922119140625, -0.00330352783203125, -0.00296783447265625, -0.00263214111328125, -0.00229644775390625, -0.00196075439453125, -0.00162506103515625, -0.00128936767578125, -0.00095367431640625, -0.00061798095703125, -0.00028228759765625, 5.340576171875e-05, 0.00038909912109375, 0.00072479248046875, 0.00106048583984375, 0.00139617919921875, 0.00173187255859375, 0.00206756591796875, 0.00240325927734375, 0.00273895263671875, 0.00307464599609375, 0.00341033935546875, 0.00374603271484375, 0.00408172607421875, 0.00441741943359375, 0.00475311279296875, 0.00508880615234375, 0.00542449951171875, 0.00576019287109375, 0.00609588623046875, 0.00643157958984375, 0.00676727294921875, 0.00710296630859375, 0.00743865966796875, 0.00777435302734375, 0.00811004638671875, 0.00844573974609375, 0.00878143310546875, 0.00911712646484375, 0.00945281982421875, 0.00978851318359375, 0.01012420654296875, 0.01045989990234375, 0.01079559326171875, 0.01113128662109375, 0.01146697998046875, 0.01180267333984375, 0.01213836669921875, 0.01247406005859375, 0.01280975341796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 11.0, 19.0, 29.0, 118.0, 366.0, 217.0, 96.0, 47.0, 27.0, 12.0, 17.0, 11.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10769225656986237, -0.10314282029867172, -0.09859337657690048, -0.09404394030570984, -0.0894944965839386, -0.08494506031274796, -0.08039562404155731, -0.07584618031978607, -0.07129674404859543, -0.06674730777740479, -0.062197864055633545, -0.0576484277844429, -0.05309898778796196, -0.04854954779148102, -0.044000111520290375, -0.03945067152380943, -0.03490123152732849, -0.03035179153084755, -0.025802353397011757, -0.021252915263175964, -0.016703475266695023, -0.01215403527021408, -0.007604597136378288, -0.0030551590025424957, 0.001494280993938446, 0.006043720059096813, 0.01059315912425518, 0.015142598189413548, 0.019692037254571915, 0.024241477251052856, 0.02879091538488865, 0.03334035351872444, 0.03788979351520538, 0.042439233511686325, 0.04698867350816727, 0.05153810977935791, 0.05608754977583885, 0.060636989772319794, 0.06518642604351044, 0.06973586976528168, 0.07428530603647232, 0.07883474230766296, 0.0833841860294342, 0.08793362230062485, 0.09248305857181549, 0.09703250229358673, 0.10158193856477737, 0.10613137483596802, 0.11068081855773926, 0.1152302548289299, 0.11977969855070114, 0.12432913482189178, 0.12887857854366302, 0.13342800736427307, 0.1379774510860443, 0.14252689480781555, 0.1470763385295868, 0.15162578225135803, 0.15617521107196808, 0.16072465479373932, 0.16527409851551056, 0.1698235273361206, 0.17437297105789185, 0.17892241477966309, 0.18347184360027313]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 10.0, 6.0, 20.0, 20.0, 25.0, 29.0, 38.0, 44.0, 45.0, 57.0, 57.0, 55.0, 75.0, 55.0, 67.0, 68.0, 55.0, 61.0, 57.0, 31.0, 27.0, 26.0, 14.0, 16.0, 11.0, 11.0, 6.0, 3.0, 4.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08614182472229004, -0.08390861004590988, -0.08167539536952972, -0.07944218814373016, -0.07720897346735, -0.07497575879096985, -0.07274255156517029, -0.07050933688879013, -0.06827612221240997, -0.06604290753602982, -0.06380969285964966, -0.0615764856338501, -0.05934327095746994, -0.05711005628108978, -0.054876845329999924, -0.052643634378910065, -0.05041041970252991, -0.04817720502614975, -0.04594399407505989, -0.04371078312397003, -0.041477568447589874, -0.03924435377120972, -0.03701114282011986, -0.03477793186903, -0.03254471719264984, -0.030311504378914833, -0.028078291565179825, -0.025845078751444817, -0.02361186593770981, -0.0213786531239748, -0.019145440310239792, -0.016912227496504784, -0.014679014682769775, -0.012445801869034767, -0.010212589055299759, -0.00797937624156475, -0.005746163427829742, -0.003512950614094734, -0.001279737800359726, 0.0009534750133752823, 0.0031866878271102905, 0.005419900640845299, 0.007653113454580307, 0.009886326268315315, 0.012119539082050323, 0.014352751895785332, 0.01658596470952034, 0.018819177523255348, 0.021052390336990356, 0.023285603150725365, 0.025518815964460373, 0.02775202877819538, 0.02998524159193039, 0.03221845626831055, 0.034451667219400406, 0.036684878170490265, 0.03891809284687042, 0.04115130752325058, 0.04338451847434044, 0.0456177294254303, 0.047850944101810455, 0.05008415877819061, 0.05231736972928047, 0.05455058068037033, 0.05678379535675049]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 8.0, 17.0, 10.0, 13.0, 22.0, 21.0, 29.0, 39.0, 51.0, 63.0, 74.0, 108.0, 132.0, 166.0, 274.0, 324.0, 418.0, 518.0, 733.0, 1007.0, 1414.0, 1950.0, 2690.0, 3918.0, 5704.0, 8819.0, 14970.0, 28727.0, 736862.0, 177237.0, 23751.0, 12771.0, 7753.0, 5230.0, 3563.0, 2470.0, 1788.0, 1271.0, 950.0, 670.0, 488.0, 377.0, 258.0, 219.0, 171.0, 130.0, 93.0, 70.0, 54.0, 38.0, 33.0, 29.0, 26.0, 12.0, 14.0, 6.0, 6.0, 4.0, 0.0, 1.0], "bins": [-0.0462646484375, -0.04485750198364258, -0.043450355529785156, -0.042043209075927734, -0.04063606262207031, -0.03922891616821289, -0.03782176971435547, -0.03641462326049805, -0.035007476806640625, -0.0336003303527832, -0.03219318389892578, -0.03078603744506836, -0.029378890991210938, -0.027971744537353516, -0.026564598083496094, -0.025157451629638672, -0.02375030517578125, -0.022343158721923828, -0.020936012268066406, -0.019528865814208984, -0.018121719360351562, -0.01671457290649414, -0.015307426452636719, -0.013900279998779297, -0.012493133544921875, -0.011085987091064453, -0.009678840637207031, -0.00827169418334961, -0.0068645477294921875, -0.005457401275634766, -0.004050254821777344, -0.002643108367919922, -0.0012359619140625, 0.00017118453979492188, 0.0015783309936523438, 0.0029854774475097656, 0.0043926239013671875, 0.005799770355224609, 0.007206916809082031, 0.008614063262939453, 0.010021209716796875, 0.011428356170654297, 0.012835502624511719, 0.01424264907836914, 0.015649795532226562, 0.017056941986083984, 0.018464088439941406, 0.019871234893798828, 0.02127838134765625, 0.022685527801513672, 0.024092674255371094, 0.025499820709228516, 0.026906967163085938, 0.02831411361694336, 0.02972126007080078, 0.031128406524658203, 0.032535552978515625, 0.03394269943237305, 0.03534984588623047, 0.03675699234008789, 0.03816413879394531, 0.039571285247802734, 0.040978431701660156, 0.04238557815551758, 0.043792724609375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 4.0, 4.0, 7.0, 6.0, 4.0, 7.0, 12.0, 19.0, 136.0, 540.0, 113.0, 14.0, 7.0, 11.0, 18.0, 11.0, 10.0, 7.0, 5.0, 2.0, 8.0, 1.0, 7.0, 3.0, 0.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002002716064453125, -0.0019279420375823975, -0.00185316801071167, -0.0017783939838409424, -0.0017036199569702148, -0.0016288459300994873, -0.0015540719032287598, -0.0014792978763580322, -0.0014045238494873047, -0.0013297498226165771, -0.0012549757957458496, -0.001180201768875122, -0.0011054277420043945, -0.001030653715133667, -0.0009558796882629395, -0.0008811056613922119, -0.0008063316345214844, -0.0007315576076507568, -0.0006567835807800293, -0.0005820095539093018, -0.0005072355270385742, -0.0004324615001678467, -0.00035768747329711914, -0.0002829134464263916, -0.00020813941955566406, -0.00013336539268493652, -5.8591365814208984e-05, 1.6182661056518555e-05, 9.09566879272461e-05, 0.00016573071479797363, 0.00024050474166870117, 0.0003152787685394287, 0.00039005279541015625, 0.0004648268222808838, 0.0005396008491516113, 0.0006143748760223389, 0.0006891489028930664, 0.0007639229297637939, 0.0008386969566345215, 0.000913470983505249, 0.0009882450103759766, 0.001063019037246704, 0.0011377930641174316, 0.0012125670909881592, 0.0012873411178588867, 0.0013621151447296143, 0.0014368891716003418, 0.0015116631984710693, 0.0015864372253417969, 0.0016612112522125244, 0.001735985279083252, 0.0018107593059539795, 0.001885533332824707, 0.0019603073596954346, 0.002035081386566162, 0.0021098554134368896, 0.002184629440307617, 0.0022594034671783447, 0.0023341774940490723, 0.0024089515209198, 0.0024837255477905273, 0.002558499574661255, 0.0026332736015319824, 0.00270804762840271, 0.0027828216552734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 11.0, 11.0, 15.0, 17.0, 19.0, 17.0, 19.0, 17.0, 15.0, 25.0, 28.0, 43.0, 40.0, 66.0, 148.0, 767.0, 7612.0, 945359.0, 90402.0, 3061.0, 384.0, 83.0, 61.0, 43.0, 37.0, 35.0, 29.0, 17.0, 26.0, 25.0, 22.0, 20.0, 11.0, 15.0, 5.0, 1.0, 10.0, 3.0, 5.0, 3.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.1514568328857422, -0.14654159545898438, -0.14162635803222656, -0.13671112060546875, -0.13179588317871094, -0.12688064575195312, -0.12196540832519531, -0.1170501708984375, -0.11213493347167969, -0.10721969604492188, -0.10230445861816406, -0.09738922119140625, -0.09247398376464844, -0.08755874633789062, -0.08264350891113281, -0.077728271484375, -0.07281303405761719, -0.06789779663085938, -0.06298255920410156, -0.05806732177734375, -0.05315208435058594, -0.048236846923828125, -0.04332160949707031, -0.0384063720703125, -0.03349113464355469, -0.028575897216796875, -0.023660659790039062, -0.01874542236328125, -0.013830184936523438, -0.008914947509765625, -0.0039997100830078125, 0.00091552734375, 0.0058307647705078125, 0.010746002197265625, 0.015661239624023438, 0.02057647705078125, 0.025491714477539062, 0.030406951904296875, 0.03532218933105469, 0.0402374267578125, 0.04515266418457031, 0.050067901611328125, 0.05498313903808594, 0.05989837646484375, 0.06481361389160156, 0.06972885131835938, 0.07464408874511719, 0.079559326171875, 0.08447456359863281, 0.08938980102539062, 0.09430503845214844, 0.09922027587890625, 0.10413551330566406, 0.10905075073242188, 0.11396598815917969, 0.1188812255859375, 0.12379646301269531, 0.12871170043945312, 0.13362693786621094, 0.13854217529296875, 0.14345741271972656, 0.14837265014648438, 0.1532878875732422, 0.158203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 8.0, 8.0, 14.0, 19.0, 17.0, 21.0, 20.0, 10.0, 19.0, 28.0, 20.0, 25.0, 42.0, 43.0, 34.0, 49.0, 29.0, 39.0, 40.0, 40.0, 42.0, 31.0, 33.0, 43.0, 30.0, 36.0, 37.0, 23.0, 27.0, 20.0, 20.0, 30.0, 21.0, 14.0, 7.0, 9.0, 6.0, 8.0, 5.0, 3.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.007770538330078125, -0.007531702518463135, -0.0072928667068481445, -0.007054030895233154, -0.006815195083618164, -0.006576359272003174, -0.006337523460388184, -0.006098687648773193, -0.005859851837158203, -0.005621016025543213, -0.005382180213928223, -0.005143344402313232, -0.004904508590698242, -0.004665672779083252, -0.004426836967468262, -0.0041880011558532715, -0.003949165344238281, -0.003710329532623291, -0.0034714937210083008, -0.0032326579093933105, -0.0029938220977783203, -0.00275498628616333, -0.00251615047454834, -0.0022773146629333496, -0.0020384788513183594, -0.0017996430397033691, -0.001560807228088379, -0.0013219714164733887, -0.0010831356048583984, -0.0008442997932434082, -0.000605463981628418, -0.00036662817001342773, -0.0001277923583984375, 0.00011104345321655273, 0.00034987926483154297, 0.0005887150764465332, 0.0008275508880615234, 0.0010663866996765137, 0.001305222511291504, 0.0015440583229064941, 0.0017828941345214844, 0.0020217299461364746, 0.002260565757751465, 0.002499401569366455, 0.0027382373809814453, 0.0029770731925964355, 0.0032159090042114258, 0.003454744815826416, 0.0036935806274414062, 0.0039324164390563965, 0.004171252250671387, 0.004410088062286377, 0.004648923873901367, 0.004887759685516357, 0.005126595497131348, 0.005365431308746338, 0.005604267120361328, 0.005843102931976318, 0.006081938743591309, 0.006320774555206299, 0.006559610366821289, 0.006798446178436279, 0.0070372819900512695, 0.00727611780166626, 0.00751495361328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 11.0, 14.0, 25.0, 35.0, 69.0, 412.0, 15619.0, 1031404.0, 749.0, 95.0, 48.0, 24.0, 18.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.138916015625, -0.13590717315673828, -0.13289833068847656, -0.12988948822021484, -0.12688064575195312, -0.1238718032836914, -0.12086296081542969, -0.11785411834716797, -0.11484527587890625, -0.11183643341064453, -0.10882759094238281, -0.1058187484741211, -0.10280990600585938, -0.09980106353759766, -0.09679222106933594, -0.09378337860107422, -0.0907745361328125, -0.08776569366455078, -0.08475685119628906, -0.08174800872802734, -0.07873916625976562, -0.0757303237915039, -0.07272148132324219, -0.06971263885498047, -0.06670379638671875, -0.06369495391845703, -0.06068611145019531, -0.057677268981933594, -0.054668426513671875, -0.051659584045410156, -0.04865074157714844, -0.04564189910888672, -0.042633056640625, -0.03962421417236328, -0.03661537170410156, -0.033606529235839844, -0.030597686767578125, -0.027588844299316406, -0.024580001831054688, -0.02157115936279297, -0.01856231689453125, -0.015553474426269531, -0.012544631958007812, -0.009535789489746094, -0.006526947021484375, -0.0035181045532226562, -0.0005092620849609375, 0.0024995803833007812, 0.0055084228515625, 0.008517265319824219, 0.011526107788085938, 0.014534950256347656, 0.017543792724609375, 0.020552635192871094, 0.023561477661132812, 0.02657032012939453, 0.02957916259765625, 0.03258800506591797, 0.03559684753417969, 0.038605690002441406, 0.041614532470703125, 0.044623374938964844, 0.04763221740722656, 0.05064105987548828, 0.05364990234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 6.0, 8.0, 12.0, 33.0, 128.0, 298.0, 339.0, 88.0, 25.0, 17.0, 6.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024175643920898438, -0.0002346392720937729, -0.0002275221049785614, -0.00022040493786334991, -0.00021328777074813843, -0.00020617060363292694, -0.00019905343651771545, -0.00019193626940250397, -0.00018481910228729248, -0.000177701935172081, -0.0001705847680568695, -0.00016346760094165802, -0.00015635043382644653, -0.00014923326671123505, -0.00014211609959602356, -0.00013499893248081207, -0.00012788176536560059, -0.0001207645982503891, -0.00011364743113517761, -0.00010653026401996613, -9.941309690475464e-05, -9.229592978954315e-05, -8.517876267433167e-05, -7.806159555912018e-05, -7.094442844390869e-05, -6.38272613286972e-05, -5.671009421348572e-05, -4.959292709827423e-05, -4.2475759983062744e-05, -3.535859286785126e-05, -2.824142575263977e-05, -2.1124258637428284e-05, -1.4007091522216797e-05, -6.88992440700531e-06, 2.2724270820617676e-07, 7.3444098234176636e-06, 1.446157693862915e-05, 2.1578744053840637e-05, 2.8695911169052124e-05, 3.581307828426361e-05, 4.29302453994751e-05, 5.0047412514686584e-05, 5.716457962989807e-05, 6.428174674510956e-05, 7.139891386032104e-05, 7.851608097553253e-05, 8.563324809074402e-05, 9.27504152059555e-05, 9.986758232116699e-05, 0.00010698474943637848, 0.00011410191655158997, 0.00012121908366680145, 0.00012833625078201294, 0.00013545341789722443, 0.0001425705850124359, 0.0001496877521276474, 0.0001568049192428589, 0.00016392208635807037, 0.00017103925347328186, 0.00017815642058849335, 0.00018527358770370483, 0.00019239075481891632, 0.0001995079219341278, 0.0002066250890493393, 0.00021374225616455078]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 4.0, 7.0, 22.0, 39.0, 125.0, 885.0, 975717.0, 70888.0, 649.0, 131.0, 29.0, 22.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11376953125, -0.11041545867919922, -0.10706138610839844, -0.10370731353759766, -0.10035324096679688, -0.0969991683959961, -0.09364509582519531, -0.09029102325439453, -0.08693695068359375, -0.08358287811279297, -0.08022880554199219, -0.0768747329711914, -0.07352066040039062, -0.07016658782958984, -0.06681251525878906, -0.06345844268798828, -0.0601043701171875, -0.05675029754638672, -0.05339622497558594, -0.050042152404785156, -0.046688079833984375, -0.043334007263183594, -0.03997993469238281, -0.03662586212158203, -0.03327178955078125, -0.02991771697998047, -0.026563644409179688, -0.023209571838378906, -0.019855499267578125, -0.016501426696777344, -0.013147354125976562, -0.009793281555175781, -0.006439208984375, -0.0030851364135742188, 0.0002689361572265625, 0.0036230087280273438, 0.006977081298828125, 0.010331153869628906, 0.013685226440429688, 0.01703929901123047, 0.02039337158203125, 0.02374744415283203, 0.027101516723632812, 0.030455589294433594, 0.033809661865234375, 0.037163734436035156, 0.04051780700683594, 0.04387187957763672, 0.0472259521484375, 0.05058002471923828, 0.05393409729003906, 0.057288169860839844, 0.060642242431640625, 0.0639963150024414, 0.06735038757324219, 0.07070446014404297, 0.07405853271484375, 0.07741260528564453, 0.08076667785644531, 0.0841207504272461, 0.08747482299804688, 0.09082889556884766, 0.09418296813964844, 0.09753704071044922, 0.10089111328125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 1.0, 4.0, 9.0, 9.0, 9.0, 15.0, 22.0, 27.0, 30.0, 54.0, 90.0, 392.0, 87.0, 59.0, 34.0, 28.0, 20.0, 21.0, 16.0, 13.0, 9.0, 12.0, 3.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00403594970703125, -0.003863394260406494, -0.0036908388137817383, -0.0035182833671569824, -0.0033457279205322266, -0.0031731724739074707, -0.003000617027282715, -0.002828061580657959, -0.002655506134033203, -0.0024829506874084473, -0.0023103952407836914, -0.0021378397941589355, -0.0019652843475341797, -0.0017927289009094238, -0.001620173454284668, -0.0014476180076599121, -0.0012750625610351562, -0.0011025071144104004, -0.0009299516677856445, -0.0007573962211608887, -0.0005848407745361328, -0.00041228532791137695, -0.0002397298812866211, -6.717443466186523e-05, 0.00010538101196289062, 0.0002779364585876465, 0.00045049190521240234, 0.0006230473518371582, 0.0007956027984619141, 0.0009681582450866699, 0.0011407136917114258, 0.0013132691383361816, 0.0014858245849609375, 0.0016583800315856934, 0.0018309354782104492, 0.002003490924835205, 0.002176046371459961, 0.002348601818084717, 0.0025211572647094727, 0.0026937127113342285, 0.0028662681579589844, 0.0030388236045837402, 0.003211379051208496, 0.003383934497833252, 0.003556489944458008, 0.0037290453910827637, 0.0039016008377075195, 0.004074156284332275, 0.004246711730957031, 0.004419267177581787, 0.004591822624206543, 0.004764378070831299, 0.004936933517456055, 0.0051094889640808105, 0.005282044410705566, 0.005454599857330322, 0.005627155303955078, 0.005799710750579834, 0.00597226619720459, 0.006144821643829346, 0.0063173770904541016, 0.006489932537078857, 0.006662487983703613, 0.006835043430328369, 0.007007598876953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 7.0, 8.0, 12.0, 50.0, 497.0, 361.0, 45.0, 20.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5648580193519592, -0.5522946119308472, -0.5397311449050903, -0.5271677374839783, -0.5146043300628662, -0.5020409226417542, -0.4894774854183197, -0.47691404819488525, -0.4643506407737732, -0.45178723335266113, -0.4392237961292267, -0.42666035890579224, -0.4140969514846802, -0.4015335440635681, -0.38897010684013367, -0.3764066696166992, -0.36384326219558716, -0.3512798547744751, -0.33871641755104065, -0.3261529803276062, -0.31358957290649414, -0.3010261654853821, -0.28846272826194763, -0.2758992910385132, -0.2633358836174011, -0.25077247619628906, -0.23820903897285461, -0.22564561665058136, -0.2130821943283081, -0.20051877200603485, -0.1879553496837616, -0.17539192736148834, -0.16282853484153748, -0.15026511251926422, -0.13770169019699097, -0.1251382678747177, -0.11257484555244446, -0.1000114232301712, -0.08744800090789795, -0.0748845785856247, -0.06232115626335144, -0.049757733941078186, -0.03719431161880493, -0.024630889296531677, -0.012067466974258423, 0.0004959553480148315, 0.013059377670288086, 0.02562279999256134, 0.038186222314834595, 0.05074964463710785, 0.0633130669593811, 0.07587648928165436, 0.08843991160392761, 0.10100333392620087, 0.11356675624847412, 0.12613017857074738, 0.13869360089302063, 0.15125702321529388, 0.16382044553756714, 0.1763838678598404, 0.18894729018211365, 0.2015107125043869, 0.21407413482666016, 0.2266375571489334, 0.23920097947120667]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 8.0, 4.0, 7.0, 9.0, 12.0, 15.0, 25.0, 25.0, 33.0, 35.0, 41.0, 73.0, 62.0, 69.0, 80.0, 96.0, 78.0, 61.0, 70.0, 45.0, 41.0, 24.0, 17.0, 17.0, 14.0, 7.0, 6.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07876193523406982, -0.07644078135490417, -0.07411962747573853, -0.07179847359657288, -0.06947731971740723, -0.06715617328882217, -0.06483501940965652, -0.06251386553049088, -0.060192711651325226, -0.057871557772159576, -0.05555040389299393, -0.053229253739118576, -0.05090809985995293, -0.04858694598078728, -0.046265795826911926, -0.04394464194774628, -0.04162348806858063, -0.03930233418941498, -0.03698118031024933, -0.03466003015637398, -0.03233887627720833, -0.03001772239804268, -0.02769657038152218, -0.02537541836500168, -0.02305426448583603, -0.02073311060667038, -0.01841195859014988, -0.01609080657362938, -0.01376965269446373, -0.011448499746620655, -0.00912734679877758, -0.00680619478225708, -0.004485040903091431, -0.002163887955248356, 0.00015726499259471893, 0.0024784179404377937, 0.0047995708882808685, 0.007120723836123943, 0.009441876783967018, 0.011763028800487518, 0.014084182679653168, 0.016405336558818817, 0.018726488575339317, 0.021047640591859818, 0.023368794471025467, 0.025689948350191116, 0.028011100366711617, 0.030332252383232117, 0.032653406262397766, 0.034974560141563416, 0.037295714020729065, 0.039616864174604416, 0.041938018053770065, 0.044259171932935715, 0.046580322086811066, 0.048901475965976715, 0.051222629845142365, 0.053543783724308014, 0.05586493760347366, 0.058186087757349014, 0.060507241636514664, 0.06282839179039001, 0.06514954566955566, 0.06747069954872131, 0.06979185342788696]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 2.0, 4.0, 8.0, 10.0, 8.0, 6.0, 8.0, 14.0, 12.0, 8.0, 12.0, 6.0, 24.0, 16.0, 30.0, 44.0, 4157506.0, 36292.0, 22.0, 32.0, 24.0, 30.0, 20.0, 16.0, 8.0, 6.0, 14.0, 6.0, 12.0, 4.0, 4.0, 12.0, 2.0, 6.0, 6.0, 4.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.765625, -2.65911865234375, -2.5526123046875, -2.44610595703125, -2.339599609375, -2.23309326171875, -2.1265869140625, -2.02008056640625, -1.91357421875, -1.80706787109375, -1.7005615234375, -1.59405517578125, -1.487548828125, -1.38104248046875, -1.2745361328125, -1.16802978515625, -1.0615234375, -0.95501708984375, -0.8485107421875, -0.74200439453125, -0.635498046875, -0.52899169921875, -0.4224853515625, -0.31597900390625, -0.20947265625, -0.10296630859375, 0.0035400390625, 0.11004638671875, 0.216552734375, 0.32305908203125, 0.4295654296875, 0.53607177734375, 0.642578125, 0.74908447265625, 0.8555908203125, 0.96209716796875, 1.068603515625, 1.17510986328125, 1.2816162109375, 1.38812255859375, 1.49462890625, 1.60113525390625, 1.7076416015625, 1.81414794921875, 1.920654296875, 2.02716064453125, 2.1336669921875, 2.24017333984375, 2.3466796875, 2.45318603515625, 2.5596923828125, 2.66619873046875, 2.772705078125, 2.87921142578125, 2.9857177734375, 3.09222412109375, 3.19873046875, 3.30523681640625, 3.4117431640625, 3.51824951171875, 3.624755859375, 3.73126220703125, 3.8377685546875, 3.94427490234375, 4.05078125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 5.0, 9.0, 4.0, 2.0, 7.0, 4.0, 6.0, 7.0, 6.0, 14.0, 18.0, 64.0, 398.0, 307.0, 24.0, 20.0, 3.0, 13.0, 6.0, 16.0, 12.0, 4.0, 8.0, 3.0, 4.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0019330978393554688, -0.0018620938062667847, -0.0017910897731781006, -0.0017200857400894165, -0.0016490817070007324, -0.0015780776739120483, -0.0015070736408233643, -0.0014360696077346802, -0.001365065574645996, -0.001294061541557312, -0.001223057508468628, -0.0011520534753799438, -0.0010810494422912598, -0.0010100454092025757, -0.0009390413761138916, -0.0008680373430252075, -0.0007970333099365234, -0.0007260292768478394, -0.0006550252437591553, -0.0005840212106704712, -0.0005130171775817871, -0.00044201314449310303, -0.00037100911140441895, -0.00030000507831573486, -0.00022900104522705078, -0.0001579970121383667, -8.699297904968262e-05, -1.5988945960998535e-05, 5.501508712768555e-05, 0.00012601912021636963, 0.0001970231533050537, 0.0002680271863937378, 0.0003390312194824219, 0.00041003525257110596, 0.00048103928565979004, 0.0005520433187484741, 0.0006230473518371582, 0.0006940513849258423, 0.0007650554180145264, 0.0008360594511032104, 0.0009070634841918945, 0.0009780675172805786, 0.0010490715503692627, 0.0011200755834579468, 0.0011910796165466309, 0.001262083649635315, 0.001333087682723999, 0.001404091715812683, 0.0014750957489013672, 0.0015460997819900513, 0.0016171038150787354, 0.0016881078481674194, 0.0017591118812561035, 0.0018301159143447876, 0.0019011199474334717, 0.0019721239805221558, 0.00204312801361084, 0.002114132046699524, 0.002185136079788208, 0.002256140112876892, 0.002327144145965576, 0.0023981481790542603, 0.0024691522121429443, 0.0025401562452316284, 0.0026111602783203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 6.0, 8.0, 7.0, 20.0, 16.0, 30.0, 35.0, 59.0, 82.0, 147.0, 258.0, 1933.0, 4190849.0, 377.0, 164.0, 88.0, 69.0, 48.0, 20.0, 27.0, 9.0, 7.0, 8.0, 5.0, 9.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01171875, -0.97705078125, -0.9423828125, -0.90771484375, -0.873046875, -0.83837890625, -0.8037109375, -0.76904296875, -0.734375, -0.69970703125, -0.6650390625, -0.63037109375, -0.595703125, -0.56103515625, -0.5263671875, -0.49169921875, -0.45703125, -0.42236328125, -0.3876953125, -0.35302734375, -0.318359375, -0.28369140625, -0.2490234375, -0.21435546875, -0.1796875, -0.14501953125, -0.1103515625, -0.07568359375, -0.041015625, -0.00634765625, 0.0283203125, 0.06298828125, 0.09765625, 0.13232421875, 0.1669921875, 0.20166015625, 0.236328125, 0.27099609375, 0.3056640625, 0.34033203125, 0.375, 0.40966796875, 0.4443359375, 0.47900390625, 0.513671875, 0.54833984375, 0.5830078125, 0.61767578125, 0.65234375, 0.68701171875, 0.7216796875, 0.75634765625, 0.791015625, 0.82568359375, 0.8603515625, 0.89501953125, 0.9296875, 0.96435546875, 0.9990234375, 1.03369140625, 1.068359375, 1.10302734375, 1.1376953125, 1.17236328125, 1.20703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 12.0, 26.0, 24.0, 40.0, 55.0, 62.0, 120.0, 262.0, 569.0, 1736.0, 544.0, 242.0, 113.0, 90.0, 56.0, 30.0, 23.0, 14.0, 9.0, 10.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00640106201171875, -0.0061841607093811035, -0.005967259407043457, -0.0057503581047058105, -0.005533456802368164, -0.005316555500030518, -0.005099654197692871, -0.004882752895355225, -0.004665851593017578, -0.004448950290679932, -0.004232048988342285, -0.004015147686004639, -0.003798246383666992, -0.0035813450813293457, -0.0033644437789916992, -0.0031475424766540527, -0.0029306411743164062, -0.0027137398719787598, -0.0024968385696411133, -0.002279937267303467, -0.0020630359649658203, -0.0018461346626281738, -0.0016292333602905273, -0.0014123320579528809, -0.0011954307556152344, -0.0009785294532775879, -0.0007616281509399414, -0.0005447268486022949, -0.00032782554626464844, -0.00011092424392700195, 0.00010597705841064453, 0.000322878360748291, 0.0005397796630859375, 0.000756680965423584, 0.0009735822677612305, 0.001190483570098877, 0.0014073848724365234, 0.00162428617477417, 0.0018411874771118164, 0.002058088779449463, 0.0022749900817871094, 0.002491891384124756, 0.0027087926864624023, 0.002925693988800049, 0.0031425952911376953, 0.003359496593475342, 0.0035763978958129883, 0.0037932991981506348, 0.004010200500488281, 0.004227101802825928, 0.004444003105163574, 0.004660904407501221, 0.004877805709838867, 0.005094707012176514, 0.00531160831451416, 0.005528509616851807, 0.005745410919189453, 0.0059623122215271, 0.006179213523864746, 0.006396114826202393, 0.006613016128540039, 0.0068299174308776855, 0.007046818733215332, 0.0072637200355529785, 0.007480621337890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 267.0, 745.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9134668111801147, -0.8936519026756287, -0.8738369941711426, -0.8540220856666565, -0.8342071771621704, -0.8143923282623291, -0.794577419757843, -0.7747625112533569, -0.7549476027488708, -0.7351326942443848, -0.7153177857398987, -0.6955028772354126, -0.6756880283355713, -0.6558731198310852, -0.6360582113265991, -0.616243302822113, -0.596428394317627, -0.5766134858131409, -0.5567985773086548, -0.5369836688041687, -0.5171687602996826, -0.4973538815975189, -0.4775390028953552, -0.45772409439086914, -0.43790918588638306, -0.418094277381897, -0.3982793688774109, -0.3784644901752472, -0.3586495816707611, -0.338834673166275, -0.31901979446411133, -0.29920488595962524, -0.27938997745513916, -0.2595750689506531, -0.23976017534732819, -0.2199452817440033, -0.2001303732395172, -0.18031546473503113, -0.16050057113170624, -0.14068567752838135, -0.12087076902389526, -0.10105586796998978, -0.08124096691608429, -0.0614260658621788, -0.041611164808273315, -0.02179626375436783, -0.0019813627004623413, 0.01783353090286255, 0.03764843940734863, 0.05746334046125412, 0.0772782415151596, 0.0970931425690651, 0.11690804362297058, 0.13672295212745667, 0.15653784573078156, 0.17635273933410645, 0.19616764783859253, 0.2159825563430786, 0.2357974499464035, 0.2556123435497284, 0.2754272520542145, 0.29524216055870056, 0.31505703926086426, 0.33487194776535034, 0.3546868562698364]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 13.0, 20.0, 41.0, 45.0, 80.0, 122.0, 160.0, 170.0, 138.0, 102.0, 62.0, 29.0, 12.0, 10.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03470331430435181, -0.03209485113620758, -0.029486384242773056, -0.02687791921198368, -0.024269454181194305, -0.02166098915040493, -0.019052524119615555, -0.01644405908882618, -0.013835594058036804, -0.011227129027247429, -0.008618663996458054, -0.006010198965668678, -0.003401733934879303, -0.0007932689040899277, 0.0018151961266994476, 0.004423661157488823, 0.007032126188278198, 0.009640591219067574, 0.012249056249856949, 0.014857521280646324, 0.0174659863114357, 0.020074451342225075, 0.02268291637301445, 0.025291381403803825, 0.0278998464345932, 0.030508311465382576, 0.03311677649617195, 0.035725243389606476, 0.0383337065577507, 0.04094216972589493, 0.04355063661932945, 0.04615910351276398, 0.0487675666809082, 0.05137602984905243, 0.053984496742486954, 0.05659296363592148, 0.059201426804065704, 0.06180988997220993, 0.06441836059093475, 0.06702682375907898, 0.0696352869272232, 0.07224375009536743, 0.07485221326351166, 0.07746068388223648, 0.0800691470503807, 0.08267761021852493, 0.08528608083724976, 0.08789454400539398, 0.09050300717353821, 0.09311147034168243, 0.09571993350982666, 0.09832840412855148, 0.10093686729669571, 0.10354533046483994, 0.10615380108356476, 0.10876226425170898, 0.11137072741985321, 0.11397919058799744, 0.11658765375614166, 0.11919612437486649, 0.12180458754301071, 0.12441305071115494, 0.12702152132987976, 0.129629984498024, 0.1322384476661682]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 8.0, 8.0, 6.0, 13.0, 7.0, 6.0, 15.0, 27.0, 24.0, 20.0, 30.0, 37.0, 41.0, 43.0, 53.0, 78.0, 175.0, 7346.0, 1034629.0, 5365.0, 188.0, 90.0, 46.0, 42.0, 43.0, 34.0, 32.0, 19.0, 18.0, 25.0, 19.0, 18.0, 13.0, 8.0, 4.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.1643352508544922, -0.15911483764648438, -0.15389442443847656, -0.14867401123046875, -0.14345359802246094, -0.13823318481445312, -0.1330127716064453, -0.1277923583984375, -0.12257194519042969, -0.11735153198242188, -0.11213111877441406, -0.10691070556640625, -0.10169029235839844, -0.09646987915039062, -0.09124946594238281, -0.086029052734375, -0.08080863952636719, -0.07558822631835938, -0.07036781311035156, -0.06514739990234375, -0.05992698669433594, -0.054706573486328125, -0.04948616027832031, -0.0442657470703125, -0.03904533386230469, -0.033824920654296875, -0.028604507446289062, -0.02338409423828125, -0.018163681030273438, -0.012943267822265625, -0.0077228546142578125, -0.00250244140625, 0.0027179718017578125, 0.007938385009765625, 0.013158798217773438, 0.01837921142578125, 0.023599624633789062, 0.028820037841796875, 0.03404045104980469, 0.0392608642578125, 0.04448127746582031, 0.049701690673828125, 0.05492210388183594, 0.06014251708984375, 0.06536293029785156, 0.07058334350585938, 0.07580375671386719, 0.081024169921875, 0.08624458312988281, 0.09146499633789062, 0.09668540954589844, 0.10190582275390625, 0.10712623596191406, 0.11234664916992188, 0.11756706237792969, 0.1227874755859375, 0.1280078887939453, 0.13322830200195312, 0.13844871520996094, 0.14366912841796875, 0.14888954162597656, 0.15410995483398438, 0.1593303680419922, 0.16455078125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 15.0, 44.0, 124.0, 215.0, 251.0, 178.0, 122.0, 43.0, 11.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024204254150390625, -0.002134650945663452, -0.0018488764762878418, -0.0015631020069122314, -0.001277327537536621, -0.0009915530681610107, -0.0007057785987854004, -0.00042000412940979004, -0.0001342296600341797, 0.00015154480934143066, 0.000437319278717041, 0.0007230937480926514, 0.0010088682174682617, 0.001294642686843872, 0.0015804171562194824, 0.0018661916255950928, 0.002151966094970703, 0.0024377405643463135, 0.002723515033721924, 0.003009289503097534, 0.0032950639724731445, 0.003580838441848755, 0.0038666129112243652, 0.004152387380599976, 0.004438161849975586, 0.004723936319351196, 0.005009710788726807, 0.005295485258102417, 0.005581259727478027, 0.005867034196853638, 0.006152808666229248, 0.006438583135604858, 0.006724357604980469, 0.007010132074356079, 0.0072959065437316895, 0.0075816810131073, 0.00786745548248291, 0.00815322995185852, 0.00843900442123413, 0.008724778890609741, 0.009010553359985352, 0.009296327829360962, 0.009582102298736572, 0.009867876768112183, 0.010153651237487793, 0.010439425706863403, 0.010725200176239014, 0.011010974645614624, 0.011296749114990234, 0.011582523584365845, 0.011868298053741455, 0.012154072523117065, 0.012439846992492676, 0.012725621461868286, 0.013011395931243896, 0.013297170400619507, 0.013582944869995117, 0.013868719339370728, 0.014154493808746338, 0.014440268278121948, 0.014726042747497559, 0.015011817216873169, 0.01529759168624878, 0.01558336615562439, 0.015869140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 12.0, 23.0, 38.0, 40.0, 74.0, 119.0, 207.0, 560.0, 1675.0, 10366.0, 208578.0, 786438.0, 35019.0, 3790.0, 871.0, 292.0, 145.0, 88.0, 64.0, 45.0, 22.0, 9.0, 14.0, 11.0, 5.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09967041015625, -0.09684181213378906, -0.09401321411132812, -0.09118461608886719, -0.08835601806640625, -0.08552742004394531, -0.08269882202148438, -0.07987022399902344, -0.0770416259765625, -0.07421302795410156, -0.07138442993164062, -0.06855583190917969, -0.06572723388671875, -0.06289863586425781, -0.060070037841796875, -0.05724143981933594, -0.054412841796875, -0.05158424377441406, -0.048755645751953125, -0.04592704772949219, -0.04309844970703125, -0.04026985168457031, -0.037441253662109375, -0.03461265563964844, -0.0317840576171875, -0.028955459594726562, -0.026126861572265625, -0.023298263549804688, -0.02046966552734375, -0.017641067504882812, -0.014812469482421875, -0.011983871459960938, -0.0091552734375, -0.0063266754150390625, -0.003498077392578125, -0.0006694793701171875, 0.00215911865234375, 0.0049877166748046875, 0.007816314697265625, 0.010644912719726562, 0.0134735107421875, 0.016302108764648438, 0.019130706787109375, 0.021959304809570312, 0.02478790283203125, 0.027616500854492188, 0.030445098876953125, 0.03327369689941406, 0.036102294921875, 0.03893089294433594, 0.041759490966796875, 0.04458808898925781, 0.04741668701171875, 0.05024528503417969, 0.053073883056640625, 0.05590248107910156, 0.0587310791015625, 0.06155967712402344, 0.06438827514648438, 0.06721687316894531, 0.07004547119140625, 0.07287406921386719, 0.07570266723632812, 0.07853126525878906, 0.08135986328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 11.0, 10.0, 5.0, 15.0, 21.0, 25.0, 28.0, 25.0, 32.0, 40.0, 46.0, 39.0, 54.0, 39.0, 57.0, 50.0, 44.0, 63.0, 57.0, 36.0, 54.0, 29.0, 38.0, 28.0, 28.0, 25.0, 17.0, 19.0, 11.0, 6.0, 2.0, 10.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0194244384765625, -0.01884746551513672, -0.018270492553710938, -0.017693519592285156, -0.017116546630859375, -0.016539573669433594, -0.015962600708007812, -0.015385627746582031, -0.01480865478515625, -0.014231681823730469, -0.013654708862304688, -0.013077735900878906, -0.012500762939453125, -0.011923789978027344, -0.011346817016601562, -0.010769844055175781, -0.01019287109375, -0.009615898132324219, -0.009038925170898438, -0.008461952209472656, -0.007884979248046875, -0.007308006286621094, -0.0067310333251953125, -0.006154060363769531, -0.00557708740234375, -0.005000114440917969, -0.0044231414794921875, -0.0038461685180664062, -0.003269195556640625, -0.0026922225952148438, -0.0021152496337890625, -0.0015382766723632812, -0.0009613037109375, -0.00038433074951171875, 0.0001926422119140625, 0.0007696151733398438, 0.001346588134765625, 0.0019235610961914062, 0.0025005340576171875, 0.0030775070190429688, 0.00365447998046875, 0.004231452941894531, 0.0048084259033203125, 0.005385398864746094, 0.005962371826171875, 0.006539344787597656, 0.0071163177490234375, 0.007693290710449219, 0.008270263671875, 0.008847236633300781, 0.009424209594726562, 0.010001182556152344, 0.010578155517578125, 0.011155128479003906, 0.011732101440429688, 0.012309074401855469, 0.01288604736328125, 0.013463020324707031, 0.014039993286132812, 0.014616966247558594, 0.015193939208984375, 0.015770912170410156, 0.016347885131835938, 0.01692485809326172, 0.0175018310546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 4.0, 9.0, 7.0, 15.0, 15.0, 23.0, 25.0, 59.0, 92.0, 216.0, 590.0, 2794.0, 47511.0, 979652.0, 15000.0, 1761.0, 412.0, 151.0, 75.0, 45.0, 23.0, 25.0, 9.0, 9.0, 10.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12347412109375, -0.11911869049072266, -0.11476325988769531, -0.11040782928466797, -0.10605239868164062, -0.10169696807861328, -0.09734153747558594, -0.0929861068725586, -0.08863067626953125, -0.0842752456665039, -0.07991981506347656, -0.07556438446044922, -0.07120895385742188, -0.06685352325439453, -0.06249809265136719, -0.058142662048339844, -0.0537872314453125, -0.049431800842285156, -0.04507637023925781, -0.04072093963623047, -0.036365509033203125, -0.03201007843017578, -0.027654647827148438, -0.023299217224121094, -0.01894378662109375, -0.014588356018066406, -0.010232925415039062, -0.005877494812011719, -0.001522064208984375, 0.0028333663940429688, 0.0071887969970703125, 0.011544227600097656, 0.015899658203125, 0.020255088806152344, 0.024610519409179688, 0.02896595001220703, 0.033321380615234375, 0.03767681121826172, 0.04203224182128906, 0.046387672424316406, 0.05074310302734375, 0.055098533630371094, 0.05945396423339844, 0.06380939483642578, 0.06816482543945312, 0.07252025604248047, 0.07687568664550781, 0.08123111724853516, 0.0855865478515625, 0.08994197845458984, 0.09429740905761719, 0.09865283966064453, 0.10300827026367188, 0.10736370086669922, 0.11171913146972656, 0.1160745620727539, 0.12042999267578125, 0.1247854232788086, 0.12914085388183594, 0.13349628448486328, 0.13785171508789062, 0.14220714569091797, 0.1465625762939453, 0.15091800689697266, 0.1552734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 10.0, 9.0, 29.0, 67.0, 93.0, 175.0, 215.0, 187.0, 100.0, 55.0, 24.0, 14.0, 12.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6881694793701172e-05, -2.6182271540164948e-05, -2.5482848286628723e-05, -2.47834250330925e-05, -2.4084001779556274e-05, -2.338457852602005e-05, -2.2685155272483826e-05, -2.19857320189476e-05, -2.1286308765411377e-05, -2.0586885511875153e-05, -1.9887462258338928e-05, -1.9188039004802704e-05, -1.848861575126648e-05, -1.7789192497730255e-05, -1.708976924419403e-05, -1.6390345990657806e-05, -1.5690922737121582e-05, -1.4991499483585358e-05, -1.4292076230049133e-05, -1.3592652976512909e-05, -1.2893229722976685e-05, -1.219380646944046e-05, -1.1494383215904236e-05, -1.0794959962368011e-05, -1.0095536708831787e-05, -9.396113455295563e-06, -8.696690201759338e-06, -7.997266948223114e-06, -7.29784369468689e-06, -6.598420441150665e-06, -5.898997187614441e-06, -5.1995739340782166e-06, -4.500150680541992e-06, -3.800727427005768e-06, -3.1013041734695435e-06, -2.401880919933319e-06, -1.7024576663970947e-06, -1.0030344128608704e-06, -3.03611159324646e-07, 3.9581209421157837e-07, 1.0952353477478027e-06, 1.794658601284027e-06, 2.4940818548202515e-06, 3.193505108356476e-06, 3.8929283618927e-06, 4.5923516154289246e-06, 5.291774868965149e-06, 5.991198122501373e-06, 6.690621376037598e-06, 7.390044629573822e-06, 8.089467883110046e-06, 8.78889113664627e-06, 9.488314390182495e-06, 1.018773764371872e-05, 1.0887160897254944e-05, 1.1586584150791168e-05, 1.2286007404327393e-05, 1.2985430657863617e-05, 1.3684853911399841e-05, 1.4384277164936066e-05, 1.508370041847229e-05, 1.5783123672008514e-05, 1.648254692554474e-05, 1.7181970179080963e-05, 1.7881393432617188e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 11.0, 7.0, 4.0, 7.0, 26.0, 24.0, 42.0, 111.0, 323.0, 2239.0, 1015636.0, 28905.0, 897.0, 152.0, 77.0, 24.0, 18.0, 17.0, 6.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4189453125, -0.4048957824707031, -0.39084625244140625, -0.3767967224121094, -0.3627471923828125, -0.3486976623535156, -0.33464813232421875, -0.3205986022949219, -0.306549072265625, -0.2924995422363281, -0.27845001220703125, -0.2644004821777344, -0.2503509521484375, -0.23630142211914062, -0.22225189208984375, -0.20820236206054688, -0.19415283203125, -0.18010330200195312, -0.16605377197265625, -0.15200424194335938, -0.1379547119140625, -0.12390518188476562, -0.10985565185546875, -0.09580612182617188, -0.081756591796875, -0.06770706176757812, -0.05365753173828125, -0.039608001708984375, -0.0255584716796875, -0.011508941650390625, 0.00254058837890625, 0.016590118408203125, 0.0306396484375, 0.044689178466796875, 0.05873870849609375, 0.07278823852539062, 0.0868377685546875, 0.10088729858398438, 0.11493682861328125, 0.12898635864257812, 0.143035888671875, 0.15708541870117188, 0.17113494873046875, 0.18518447875976562, 0.1992340087890625, 0.21328353881835938, 0.22733306884765625, 0.24138259887695312, 0.25543212890625, 0.2694816589355469, 0.28353118896484375, 0.2975807189941406, 0.3116302490234375, 0.3256797790527344, 0.33972930908203125, 0.3537788391113281, 0.367828369140625, 0.3818778991699219, 0.39592742919921875, 0.4099769592285156, 0.4240264892578125, 0.4380760192871094, 0.45212554931640625, 0.4661750793457031, 0.480224609375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 9.0, 29.0, 140.0, 508.0, 222.0, 47.0, 11.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.17333984375, -0.16927623748779297, -0.16521263122558594, -0.1611490249633789, -0.15708541870117188, -0.15302181243896484, -0.1489582061767578, -0.14489459991455078, -0.14083099365234375, -0.13676738739013672, -0.1327037811279297, -0.12864017486572266, -0.12457656860351562, -0.1205129623413086, -0.11644935607910156, -0.11238574981689453, -0.1083221435546875, -0.10425853729248047, -0.10019493103027344, -0.0961313247680664, -0.09206771850585938, -0.08800411224365234, -0.08394050598144531, -0.07987689971923828, -0.07581329345703125, -0.07174968719482422, -0.06768608093261719, -0.06362247467041016, -0.059558868408203125, -0.055495262145996094, -0.05143165588378906, -0.04736804962158203, -0.043304443359375, -0.03924083709716797, -0.03517723083496094, -0.031113624572753906, -0.027050018310546875, -0.022986412048339844, -0.018922805786132812, -0.014859199523925781, -0.01079559326171875, -0.006731986999511719, -0.0026683807373046875, 0.0013952255249023438, 0.005458831787109375, 0.009522438049316406, 0.013586044311523438, 0.01764965057373047, 0.0217132568359375, 0.02577686309814453, 0.029840469360351562, 0.033904075622558594, 0.037967681884765625, 0.042031288146972656, 0.04609489440917969, 0.05015850067138672, 0.05422210693359375, 0.05828571319580078, 0.06234931945800781, 0.06641292572021484, 0.07047653198242188, 0.0745401382446289, 0.07860374450683594, 0.08266735076904297, 0.08673095703125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 38.0, 894.0, 81.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646113395690918, -3.567890167236328, -3.4896671772003174, -3.4114439487457275, -3.3332207202911377, -3.254997730255127, -3.176774501800537, -3.0985512733459473, -3.0203280448913574, -2.9421048164367676, -2.863881826400757, -2.785658597946167, -2.707435369491577, -2.6292123794555664, -2.5509891510009766, -2.4727659225463867, -2.394542932510376, -2.316319704055786, -2.2380967140197754, -2.1598734855651855, -2.0816502571105957, -2.003427028656006, -1.9252040386199951, -1.8469808101654053, -1.768757700920105, -1.6905345916748047, -1.6123113632202148, -1.5340882539749146, -1.4558651447296143, -1.3776419162750244, -1.2994188070297241, -1.2211956977844238, -1.1429723501205444, -1.0647492408752441, -0.9865260124206543, -0.908302903175354, -0.8300797343254089, -0.7518565654754639, -0.6736334562301636, -0.5954102873802185, -0.5171871185302734, -0.43896394968032837, -0.3607408106327057, -0.282517671585083, -0.20429450273513794, -0.12607133388519287, -0.04784819483757019, 0.03037494421005249, 0.10859811305999756, 0.18682126700878143, 0.2650444209575653, 0.343267560005188, 0.42149072885513306, 0.4997138977050781, 0.5779370069503784, 0.6561601758003235, 0.7343833446502686, 0.8126065135002136, 0.8908296823501587, 0.969052791595459, 1.0472760200500488, 1.1254991292953491, 1.2037222385406494, 1.2819454669952393, 1.3601685762405396]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 8.0, 19.0, 22.0, 38.0, 55.0, 66.0, 102.0, 90.0, 116.0, 115.0, 88.0, 90.0, 62.0, 48.0, 37.0, 18.0, 11.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14681369066238403, -0.13668106496334076, -0.12654843926429749, -0.11641582101583481, -0.10628319531679153, -0.09615056961774826, -0.08601795136928558, -0.07588532567024231, -0.06575269997119904, -0.05562007427215576, -0.045487452298402786, -0.03535483032464981, -0.025222204625606537, -0.015089578926563263, -0.0049569569528102875, 0.005175665020942688, 0.015308290719985962, 0.025440914556384087, 0.03557353839278221, 0.04570616036653519, 0.05583878606557846, 0.06597141176462173, 0.07610403001308441, 0.08623665571212769, 0.09636928141117096, 0.10650190711021423, 0.11663453280925751, 0.12676715850830078, 0.13689976930618286, 0.14703240990638733, 0.1571650207042694, 0.16729764640331268, 0.17743027210235596, 0.18756289780139923, 0.1976955235004425, 0.20782814919948578, 0.21796077489852905, 0.22809338569641113, 0.2382260113954544, 0.24835863709449768, 0.25849127769470215, 0.26862388849258423, 0.2787565290927887, 0.2888891398906708, 0.29902178049087524, 0.3091543912887573, 0.3192870318889618, 0.32941964268684387, 0.33955225348472595, 0.34968486428260803, 0.3598175048828125, 0.3699501156806946, 0.38008275628089905, 0.39021536707878113, 0.4003480076789856, 0.4104806184768677, 0.42061322927474976, 0.43074584007263184, 0.4408784806728363, 0.4510110914707184, 0.46114373207092285, 0.47127634286880493, 0.4814089834690094, 0.4915415942668915, 0.501674234867096]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 8.0, 10.0, 14.0, 10.0, 27.0, 28.0, 42.0, 69.0, 88.0, 159.0, 197.0, 327.0, 507.0, 1263.0, 78148.0, 4105787.0, 5909.0, 673.0, 361.0, 213.0, 167.0, 73.0, 66.0, 37.0, 21.0, 23.0, 13.0, 10.0, 11.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1815185546875, -0.1750965118408203, -0.16867446899414062, -0.16225242614746094, -0.15583038330078125, -0.14940834045410156, -0.14298629760742188, -0.1365642547607422, -0.1301422119140625, -0.12372016906738281, -0.11729812622070312, -0.11087608337402344, -0.10445404052734375, -0.09803199768066406, -0.09160995483398438, -0.08518791198730469, -0.078765869140625, -0.07234382629394531, -0.06592178344726562, -0.05949974060058594, -0.05307769775390625, -0.04665565490722656, -0.040233612060546875, -0.03381156921386719, -0.0273895263671875, -0.020967483520507812, -0.014545440673828125, -0.008123397827148438, -0.00170135498046875, 0.0047206878662109375, 0.011142730712890625, 0.017564773559570312, 0.02398681640625, 0.030408859252929688, 0.036830902099609375, 0.04325294494628906, 0.04967498779296875, 0.05609703063964844, 0.06251907348632812, 0.06894111633300781, 0.0753631591796875, 0.08178520202636719, 0.08820724487304688, 0.09462928771972656, 0.10105133056640625, 0.10747337341308594, 0.11389541625976562, 0.12031745910644531, 0.126739501953125, 0.1331615447998047, 0.13958358764648438, 0.14600563049316406, 0.15242767333984375, 0.15884971618652344, 0.16527175903320312, 0.1716938018798828, 0.1781158447265625, 0.1845378875732422, 0.19095993041992188, 0.19738197326660156, 0.20380401611328125, 0.21022605895996094, 0.21664810180664062, 0.2230701446533203, 0.2294921875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 20.0, 21.0, 63.0, 120.0, 184.0, 198.0, 176.0, 117.0, 67.0, 23.0, 14.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005157470703125, -0.004801511764526367, -0.004445552825927734, -0.0040895938873291016, -0.0037336349487304688, -0.003377676010131836, -0.003021717071533203, -0.0026657581329345703, -0.0023097991943359375, -0.0019538402557373047, -0.0015978813171386719, -0.001241922378540039, -0.0008859634399414062, -0.0005300045013427734, -0.00017404556274414062, 0.0001819133758544922, 0.000537872314453125, 0.0008938312530517578, 0.0012497901916503906, 0.0016057491302490234, 0.0019617080688476562, 0.002317667007446289, 0.002673625946044922, 0.0030295848846435547, 0.0033855438232421875, 0.0037415027618408203, 0.004097461700439453, 0.004453420639038086, 0.004809379577636719, 0.0051653385162353516, 0.005521297454833984, 0.005877256393432617, 0.00623321533203125, 0.006589174270629883, 0.006945133209228516, 0.0073010921478271484, 0.007657051086425781, 0.008013010025024414, 0.008368968963623047, 0.00872492790222168, 0.009080886840820312, 0.009436845779418945, 0.009792804718017578, 0.010148763656616211, 0.010504722595214844, 0.010860681533813477, 0.01121664047241211, 0.011572599411010742, 0.011928558349609375, 0.012284517288208008, 0.01264047622680664, 0.012996435165405273, 0.013352394104003906, 0.013708353042602539, 0.014064311981201172, 0.014420270919799805, 0.014776229858398438, 0.01513218879699707, 0.015488147735595703, 0.015844106674194336, 0.01620006561279297, 0.0165560245513916, 0.016911983489990234, 0.017267942428588867, 0.0176239013671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 14.0, 22.0, 63.0, 57.0, 91.0, 159.0, 272.0, 564.0, 316515.0, 3875253.0, 584.0, 237.0, 165.0, 119.0, 69.0, 38.0, 28.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9638671875, -0.9306640625, -0.8974609375, -0.8642578125, -0.8310546875, -0.7978515625, -0.7646484375, -0.7314453125, -0.6982421875, -0.6650390625, -0.6318359375, -0.5986328125, -0.5654296875, -0.5322265625, -0.4990234375, -0.4658203125, -0.4326171875, -0.3994140625, -0.3662109375, -0.3330078125, -0.2998046875, -0.2666015625, -0.2333984375, -0.2001953125, -0.1669921875, -0.1337890625, -0.1005859375, -0.0673828125, -0.0341796875, -0.0009765625, 0.0322265625, 0.0654296875, 0.0986328125, 0.1318359375, 0.1650390625, 0.1982421875, 0.2314453125, 0.2646484375, 0.2978515625, 0.3310546875, 0.3642578125, 0.3974609375, 0.4306640625, 0.4638671875, 0.4970703125, 0.5302734375, 0.5634765625, 0.5966796875, 0.6298828125, 0.6630859375, 0.6962890625, 0.7294921875, 0.7626953125, 0.7958984375, 0.8291015625, 0.8623046875, 0.8955078125, 0.9287109375, 0.9619140625, 0.9951171875, 1.0283203125, 1.0615234375, 1.0947265625, 1.1279296875, 1.1611328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 10.0, 46.0, 395.0, 3404.0, 198.0, 22.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.07362079620361328, -0.07082557678222656, -0.06803035736083984, -0.06523513793945312, -0.062439918518066406, -0.05964469909667969, -0.05684947967529297, -0.05405426025390625, -0.05125904083251953, -0.04846382141113281, -0.045668601989746094, -0.042873382568359375, -0.040078163146972656, -0.03728294372558594, -0.03448772430419922, -0.0316925048828125, -0.02889728546142578, -0.026102066040039062, -0.023306846618652344, -0.020511627197265625, -0.017716407775878906, -0.014921188354492188, -0.012125968933105469, -0.00933074951171875, -0.006535530090332031, -0.0037403106689453125, -0.0009450912475585938, 0.001850128173828125, 0.004645347595214844, 0.0074405670166015625, 0.010235786437988281, 0.013031005859375, 0.01582622528076172, 0.018621444702148438, 0.021416664123535156, 0.024211883544921875, 0.027007102966308594, 0.029802322387695312, 0.03259754180908203, 0.03539276123046875, 0.03818798065185547, 0.04098320007324219, 0.043778419494628906, 0.046573638916015625, 0.049368858337402344, 0.05216407775878906, 0.05495929718017578, 0.0577545166015625, 0.06054973602294922, 0.06334495544433594, 0.06614017486572266, 0.06893539428710938, 0.0717306137084961, 0.07452583312988281, 0.07732105255126953, 0.08011627197265625, 0.08291149139404297, 0.08570671081542969, 0.0885019302368164, 0.09129714965820312, 0.09409236907958984, 0.09688758850097656, 0.09968280792236328, 0.10247802734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 33.0, 240.0, 659.0, 51.0, 13.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.240181565284729, -1.1962400674819946, -1.1522986888885498, -1.1083571910858154, -1.064415693283081, -1.0204741954803467, -0.9765328168869019, -0.9325913190841675, -0.8886498808860779, -0.8447084426879883, -0.8007669448852539, -0.7568255066871643, -0.7128840684890747, -0.6689425706863403, -0.6250011324882507, -0.5810596942901611, -0.5371181964874268, -0.49317672848701477, -0.4492352604866028, -0.4052938222885132, -0.3613523542881012, -0.3174108862876892, -0.2734694480895996, -0.22952798008918762, -0.18558651208877563, -0.14164504408836365, -0.09770359098911285, -0.05376213788986206, -0.009820669889450073, 0.034120798110961914, 0.07806223630905151, 0.1220037043094635, 0.1659451723098755, 0.20988664031028748, 0.25382810831069946, 0.29776954650878906, 0.34171101450920105, 0.38565248250961304, 0.42959392070770264, 0.4735353887081146, 0.5174768567085266, 0.5614182949066162, 0.6053597927093506, 0.6493012309074402, 0.6932426691055298, 0.7371841669082642, 0.7811256051063538, 0.8250670433044434, 0.8690085411071777, 0.9129499793052673, 0.9568914771080017, 1.0008329153060913, 1.0447744131088257, 1.0887157917022705, 1.1326572895050049, 1.1765987873077393, 1.2205402851104736, 1.264481782913208, 1.3084231615066528, 1.3523646593093872, 1.3963061571121216, 1.4402475357055664, 1.4841890335083008, 1.5281305313110352, 1.57207190990448]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 9.0, 12.0, 8.0, 13.0, 24.0, 17.0, 35.0, 35.0, 47.0, 55.0, 54.0, 63.0, 78.0, 74.0, 63.0, 54.0, 66.0, 62.0, 57.0, 36.0, 40.0, 21.0, 15.0, 11.0, 13.0, 10.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08872687816619873, -0.0858239084482193, -0.08292093873023987, -0.08001796901226044, -0.077114999294281, -0.07421202212572098, -0.07130905240774155, -0.06840608268976212, -0.06550311297178268, -0.06260014325380325, -0.05969717353582382, -0.05679420009255409, -0.05389123037457466, -0.05098826065659523, -0.0480852872133255, -0.04518231749534607, -0.04227934777736664, -0.03937637805938721, -0.036473408341407776, -0.033570434898138046, -0.030667465180158615, -0.027764495462179184, -0.024861523881554604, -0.021958552300930023, -0.019055582582950592, -0.01615261286497116, -0.01324964128434658, -0.010346670635044575, -0.007443699985742569, -0.004540729336440563, -0.0016377586871385574, 0.001265212893486023, 0.004168182611465454, 0.00707115326076746, 0.009974123910069466, 0.012877094559371471, 0.015780065208673477, 0.01868303492665291, 0.02158600650727749, 0.02448897808790207, 0.0273919478058815, 0.03029491752386093, 0.03319788724184036, 0.03610086068511009, 0.03900383040308952, 0.041906800121068954, 0.044809773564338684, 0.047712743282318115, 0.050615713000297546, 0.05351868271827698, 0.05642165243625641, 0.05932462587952614, 0.06222759559750557, 0.0651305690407753, 0.06803353875875473, 0.07093650847673416, 0.07383947819471359, 0.07674244791269302, 0.07964541763067245, 0.08254838734865189, 0.08545136451721191, 0.08835433423519135, 0.09125730395317078, 0.09416027367115021, 0.09706324338912964]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 1.0, 9.0, 7.0, 14.0, 17.0, 29.0, 35.0, 42.0, 57.0, 122.0, 175.0, 376.0, 905.0, 3041.0, 19459.0, 601309.0, 403030.0, 15520.0, 2622.0, 851.0, 368.0, 182.0, 106.0, 76.0, 55.0, 30.0, 22.0, 13.0, 23.0, 13.0, 8.0, 2.0, 5.0, 4.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.252685546875, -0.2445220947265625, -0.236358642578125, -0.2281951904296875, -0.22003173828125, -0.2118682861328125, -0.203704833984375, -0.1955413818359375, -0.1873779296875, -0.1792144775390625, -0.171051025390625, -0.1628875732421875, -0.15472412109375, -0.1465606689453125, -0.138397216796875, -0.1302337646484375, -0.1220703125, -0.1139068603515625, -0.105743408203125, -0.0975799560546875, -0.08941650390625, -0.0812530517578125, -0.073089599609375, -0.0649261474609375, -0.0567626953125, -0.0485992431640625, -0.040435791015625, -0.0322723388671875, -0.02410888671875, -0.0159454345703125, -0.007781982421875, 0.0003814697265625, 0.008544921875, 0.0167083740234375, 0.024871826171875, 0.0330352783203125, 0.04119873046875, 0.0493621826171875, 0.057525634765625, 0.0656890869140625, 0.0738525390625, 0.0820159912109375, 0.090179443359375, 0.0983428955078125, 0.10650634765625, 0.1146697998046875, 0.122833251953125, 0.1309967041015625, 0.13916015625, 0.1473236083984375, 0.155487060546875, 0.1636505126953125, 0.17181396484375, 0.1799774169921875, 0.188140869140625, 0.1963043212890625, 0.2044677734375, 0.2126312255859375, 0.220794677734375, 0.2289581298828125, 0.23712158203125, 0.2452850341796875, 0.253448486328125, 0.2616119384765625, 0.269775390625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 13.0, 29.0, 43.0, 50.0, 106.0, 109.0, 132.0, 114.0, 112.0, 109.0, 73.0, 44.0, 26.0, 17.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006549835205078125, -0.006225764751434326, -0.005901694297790527, -0.0055776238441467285, -0.00525355339050293, -0.004929482936859131, -0.004605412483215332, -0.004281342029571533, -0.003957271575927734, -0.0036332011222839355, -0.0033091306686401367, -0.002985060214996338, -0.002660989761352539, -0.0023369193077087402, -0.0020128488540649414, -0.0016887784004211426, -0.0013647079467773438, -0.001040637493133545, -0.0007165670394897461, -0.00039249658584594727, -6.842613220214844e-05, 0.0002556443214416504, 0.0005797147750854492, 0.000903785228729248, 0.0012278556823730469, 0.0015519261360168457, 0.0018759965896606445, 0.0022000670433044434, 0.002524137496948242, 0.002848207950592041, 0.00317227840423584, 0.0034963488578796387, 0.0038204193115234375, 0.004144489765167236, 0.004468560218811035, 0.004792630672454834, 0.005116701126098633, 0.005440771579742432, 0.0057648420333862305, 0.006088912487030029, 0.006412982940673828, 0.006737053394317627, 0.007061123847961426, 0.007385194301605225, 0.0077092647552490234, 0.008033335208892822, 0.008357405662536621, 0.00868147611618042, 0.009005546569824219, 0.009329617023468018, 0.009653687477111816, 0.009977757930755615, 0.010301828384399414, 0.010625898838043213, 0.010949969291687012, 0.01127403974533081, 0.01159811019897461, 0.011922180652618408, 0.012246251106262207, 0.012570321559906006, 0.012894392013549805, 0.013218462467193604, 0.013542532920837402, 0.013866603374481201, 0.014190673828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 13.0, 12.0, 21.0, 38.0, 40.0, 54.0, 73.0, 106.0, 152.0, 208.0, 325.0, 567.0, 1078.0, 2339.0, 6664.0, 26072.0, 170230.0, 673301.0, 134385.0, 22307.0, 5750.0, 2157.0, 1019.0, 569.0, 335.0, 208.0, 154.0, 82.0, 69.0, 49.0, 45.0, 33.0, 18.0, 20.0, 11.0, 9.0, 13.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09393310546875, -0.0911245346069336, -0.08831596374511719, -0.08550739288330078, -0.08269882202148438, -0.07989025115966797, -0.07708168029785156, -0.07427310943603516, -0.07146453857421875, -0.06865596771240234, -0.06584739685058594, -0.06303882598876953, -0.060230255126953125, -0.05742168426513672, -0.05461311340332031, -0.051804542541503906, -0.0489959716796875, -0.046187400817871094, -0.04337882995605469, -0.04057025909423828, -0.037761688232421875, -0.03495311737060547, -0.03214454650878906, -0.029335975646972656, -0.02652740478515625, -0.023718833923339844, -0.020910263061523438, -0.01810169219970703, -0.015293121337890625, -0.012484550476074219, -0.009675979614257812, -0.006867408752441406, -0.004058837890625, -0.0012502670288085938, 0.0015583038330078125, 0.004366874694824219, 0.007175445556640625, 0.009984016418457031, 0.012792587280273438, 0.015601158142089844, 0.01840972900390625, 0.021218299865722656, 0.024026870727539062, 0.02683544158935547, 0.029644012451171875, 0.03245258331298828, 0.03526115417480469, 0.038069725036621094, 0.0408782958984375, 0.043686866760253906, 0.04649543762207031, 0.04930400848388672, 0.052112579345703125, 0.05492115020751953, 0.05772972106933594, 0.060538291931152344, 0.06334686279296875, 0.06615543365478516, 0.06896400451660156, 0.07177257537841797, 0.07458114624023438, 0.07738971710205078, 0.08019828796386719, 0.0830068588256836, 0.0858154296875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 10.0, 10.0, 7.0, 8.0, 15.0, 13.0, 15.0, 12.0, 26.0, 20.0, 25.0, 36.0, 38.0, 33.0, 40.0, 49.0, 48.0, 53.0, 48.0, 50.0, 42.0, 50.0, 45.0, 37.0, 45.0, 48.0, 43.0, 26.0, 13.0, 20.0, 16.0, 9.0, 9.0, 4.0, 6.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220489501953125, -0.02124190330505371, -0.020434856414794922, -0.019627809524536133, -0.018820762634277344, -0.018013715744018555, -0.017206668853759766, -0.016399621963500977, -0.015592575073242188, -0.014785528182983398, -0.01397848129272461, -0.01317143440246582, -0.012364387512207031, -0.011557340621948242, -0.010750293731689453, -0.009943246841430664, -0.009136199951171875, -0.008329153060913086, -0.007522106170654297, -0.006715059280395508, -0.005908012390136719, -0.00510096549987793, -0.004293918609619141, -0.0034868717193603516, -0.0026798248291015625, -0.0018727779388427734, -0.0010657310485839844, -0.0002586841583251953, 0.0005483627319335938, 0.0013554096221923828, 0.002162456512451172, 0.002969503402709961, 0.00377655029296875, 0.004583597183227539, 0.005390644073486328, 0.006197690963745117, 0.007004737854003906, 0.007811784744262695, 0.008618831634521484, 0.009425878524780273, 0.010232925415039062, 0.011039972305297852, 0.01184701919555664, 0.01265406608581543, 0.013461112976074219, 0.014268159866333008, 0.015075206756591797, 0.015882253646850586, 0.016689300537109375, 0.017496347427368164, 0.018303394317626953, 0.019110441207885742, 0.01991748809814453, 0.02072453498840332, 0.02153158187866211, 0.0223386287689209, 0.023145675659179688, 0.023952722549438477, 0.024759769439697266, 0.025566816329956055, 0.026373863220214844, 0.027180910110473633, 0.027987957000732422, 0.02879500389099121, 0.02960205078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 15.0, 12.0, 29.0, 45.0, 62.0, 169.0, 321.0, 659.0, 1787.0, 7304.0, 109396.0, 882962.0, 38681.0, 4674.0, 1341.0, 515.0, 236.0, 135.0, 64.0, 38.0, 27.0, 23.0, 11.0, 5.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10546875, -0.10230731964111328, -0.09914588928222656, -0.09598445892333984, -0.09282302856445312, -0.0896615982055664, -0.08650016784667969, -0.08333873748779297, -0.08017730712890625, -0.07701587677001953, -0.07385444641113281, -0.0706930160522461, -0.06753158569335938, -0.06437015533447266, -0.06120872497558594, -0.05804729461669922, -0.0548858642578125, -0.05172443389892578, -0.04856300354003906, -0.045401573181152344, -0.042240142822265625, -0.039078712463378906, -0.03591728210449219, -0.03275585174560547, -0.02959442138671875, -0.02643299102783203, -0.023271560668945312, -0.020110130310058594, -0.016948699951171875, -0.013787269592285156, -0.010625839233398438, -0.007464408874511719, -0.004302978515625, -0.0011415481567382812, 0.0020198822021484375, 0.005181312561035156, 0.008342742919921875, 0.011504173278808594, 0.014665603637695312, 0.01782703399658203, 0.02098846435546875, 0.02414989471435547, 0.027311325073242188, 0.030472755432128906, 0.033634185791015625, 0.036795616149902344, 0.03995704650878906, 0.04311847686767578, 0.0462799072265625, 0.04944133758544922, 0.05260276794433594, 0.055764198303222656, 0.058925628662109375, 0.062087059020996094, 0.06524848937988281, 0.06840991973876953, 0.07157135009765625, 0.07473278045654297, 0.07789421081542969, 0.0810556411743164, 0.08421707153320312, 0.08737850189208984, 0.09053993225097656, 0.09370136260986328, 0.09686279296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 11.0, 13.0, 13.0, 14.0, 39.0, 44.0, 45.0, 61.0, 108.0, 80.0, 105.0, 107.0, 95.0, 68.0, 57.0, 49.0, 30.0, 15.0, 11.0, 15.0, 6.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.59634780883789e-06, -9.281560778617859e-06, -8.966773748397827e-06, -8.651986718177795e-06, -8.337199687957764e-06, -8.022412657737732e-06, -7.7076256275177e-06, -7.3928385972976685e-06, -7.078051567077637e-06, -6.763264536857605e-06, -6.448477506637573e-06, -6.1336904764175415e-06, -5.81890344619751e-06, -5.504116415977478e-06, -5.189329385757446e-06, -4.8745423555374146e-06, -4.559755325317383e-06, -4.244968295097351e-06, -3.930181264877319e-06, -3.6153942346572876e-06, -3.300607204437256e-06, -2.985820174217224e-06, -2.6710331439971924e-06, -2.3562461137771606e-06, -2.041459083557129e-06, -1.7266720533370972e-06, -1.4118850231170654e-06, -1.0970979928970337e-06, -7.82310962677002e-07, -4.675239324569702e-07, -1.5273690223693848e-07, 1.6205012798309326e-07, 4.76837158203125e-07, 7.916241884231567e-07, 1.1064112186431885e-06, 1.4211982488632202e-06, 1.735985279083252e-06, 2.0507723093032837e-06, 2.3655593395233154e-06, 2.680346369743347e-06, 2.995133399963379e-06, 3.3099204301834106e-06, 3.6247074604034424e-06, 3.939494490623474e-06, 4.254281520843506e-06, 4.569068551063538e-06, 4.883855581283569e-06, 5.198642611503601e-06, 5.513429641723633e-06, 5.8282166719436646e-06, 6.143003702163696e-06, 6.457790732383728e-06, 6.77257776260376e-06, 7.0873647928237915e-06, 7.402151823043823e-06, 7.716938853263855e-06, 8.031725883483887e-06, 8.346512913703918e-06, 8.66129994392395e-06, 8.976086974143982e-06, 9.290874004364014e-06, 9.605661034584045e-06, 9.920448064804077e-06, 1.0235235095024109e-05, 1.055002212524414e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 4.0, 8.0, 17.0, 19.0, 30.0, 36.0, 67.0, 99.0, 183.0, 343.0, 692.0, 1765.0, 6782.0, 76504.0, 882172.0, 69994.0, 6629.0, 1722.0, 662.0, 326.0, 182.0, 99.0, 53.0, 41.0, 23.0, 21.0, 13.0, 8.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.0893545150756836, -0.08642387390136719, -0.08349323272705078, -0.08056259155273438, -0.07763195037841797, -0.07470130920410156, -0.07177066802978516, -0.06884002685546875, -0.06590938568115234, -0.06297874450683594, -0.06004810333251953, -0.057117462158203125, -0.05418682098388672, -0.05125617980957031, -0.048325538635253906, -0.0453948974609375, -0.042464256286621094, -0.03953361511230469, -0.03660297393798828, -0.033672332763671875, -0.03074169158935547, -0.027811050415039062, -0.024880409240722656, -0.02194976806640625, -0.019019126892089844, -0.016088485717773438, -0.013157844543457031, -0.010227203369140625, -0.007296562194824219, -0.0043659210205078125, -0.0014352798461914062, 0.001495361328125, 0.004426002502441406, 0.0073566436767578125, 0.010287284851074219, 0.013217926025390625, 0.01614856719970703, 0.019079208374023438, 0.022009849548339844, 0.02494049072265625, 0.027871131896972656, 0.030801773071289062, 0.03373241424560547, 0.036663055419921875, 0.03959369659423828, 0.04252433776855469, 0.045454978942871094, 0.0483856201171875, 0.051316261291503906, 0.05424690246582031, 0.05717754364013672, 0.060108184814453125, 0.06303882598876953, 0.06596946716308594, 0.06890010833740234, 0.07183074951171875, 0.07476139068603516, 0.07769203186035156, 0.08062267303466797, 0.08355331420898438, 0.08648395538330078, 0.08941459655761719, 0.0923452377319336, 0.09527587890625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 9.0, 4.0, 9.0, 21.0, 19.0, 24.0, 28.0, 56.0, 62.0, 72.0, 77.0, 101.0, 117.0, 85.0, 78.0, 64.0, 46.0, 41.0, 23.0, 14.0, 15.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040374755859375, -0.039034366607666016, -0.03769397735595703, -0.03635358810424805, -0.03501319885253906, -0.03367280960083008, -0.032332420349121094, -0.03099203109741211, -0.029651641845703125, -0.02831125259399414, -0.026970863342285156, -0.025630474090576172, -0.024290084838867188, -0.022949695587158203, -0.02160930633544922, -0.020268917083740234, -0.01892852783203125, -0.017588138580322266, -0.01624774932861328, -0.014907360076904297, -0.013566970825195312, -0.012226581573486328, -0.010886192321777344, -0.00954580307006836, -0.008205413818359375, -0.006865024566650391, -0.005524635314941406, -0.004184246063232422, -0.0028438568115234375, -0.0015034675598144531, -0.00016307830810546875, 0.0011773109436035156, 0.0025177001953125, 0.0038580894470214844, 0.005198478698730469, 0.006538867950439453, 0.007879257202148438, 0.009219646453857422, 0.010560035705566406, 0.01190042495727539, 0.013240814208984375, 0.01458120346069336, 0.015921592712402344, 0.017261981964111328, 0.018602371215820312, 0.019942760467529297, 0.02128314971923828, 0.022623538970947266, 0.02396392822265625, 0.025304317474365234, 0.02664470672607422, 0.027985095977783203, 0.029325485229492188, 0.030665874481201172, 0.032006263732910156, 0.03334665298461914, 0.034687042236328125, 0.03602743148803711, 0.037367820739746094, 0.03870820999145508, 0.04004859924316406, 0.04138898849487305, 0.04272937774658203, 0.044069766998291016, 0.04541015625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 22.0, 33.0, 88.0, 285.0, 318.0, 153.0, 58.0, 21.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0978119373321533, -1.0739288330078125, -1.0500457286834717, -1.0261625051498413, -1.0022794008255005, -0.9783962965011597, -0.9545131325721741, -0.9306299686431885, -0.9067468643188477, -0.8828637599945068, -0.8589805960655212, -0.8350974321365356, -0.8112143278121948, -0.787331223487854, -0.7634480595588684, -0.7395648956298828, -0.715681791305542, -0.6917986869812012, -0.6679155230522156, -0.64403235912323, -0.6201492547988892, -0.5962661504745483, -0.5723829865455627, -0.5484998226165771, -0.5246167182922363, -0.5007336139678955, -0.4768504500389099, -0.4529673159122467, -0.4290841817855835, -0.4052010476589203, -0.3813179135322571, -0.35743477940559387, -0.3335516154766083, -0.30966848134994507, -0.28578534722328186, -0.26190221309661865, -0.23801907896995544, -0.21413594484329224, -0.19025281071662903, -0.16636967658996582, -0.1424865424633026, -0.1186034083366394, -0.0947202742099762, -0.07083714008331299, -0.04695400595664978, -0.023070871829986572, 0.0008122622966766357, 0.024695396423339844, 0.04857853055000305, 0.07246166467666626, 0.09634479880332947, 0.12022793292999268, 0.14411106705665588, 0.1679942011833191, 0.1918773353099823, 0.2157604694366455, 0.23964360356330872, 0.2635267376899719, 0.28740987181663513, 0.31129300594329834, 0.33517614006996155, 0.35905927419662476, 0.38294240832328796, 0.40682554244995117, 0.4307086765766144]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 14.0, 15.0, 16.0, 16.0, 17.0, 30.0, 23.0, 31.0, 36.0, 37.0, 42.0, 38.0, 46.0, 56.0, 45.0, 60.0, 54.0, 45.0, 54.0, 47.0, 44.0, 35.0, 35.0, 28.0, 18.0, 26.0, 19.0, 6.0, 11.0, 16.0, 8.0, 6.0, 9.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21772104501724243, -0.21102651953697205, -0.20433199405670166, -0.19763746857643127, -0.1909429430961609, -0.1842484176158905, -0.17755387723445892, -0.17085935175418854, -0.16416482627391815, -0.15747030079364777, -0.15077577531337738, -0.144081249833107, -0.13738670945167542, -0.13069218397140503, -0.12399765849113464, -0.11730313301086426, -0.11060860753059387, -0.10391408205032349, -0.0972195565700531, -0.09052502363920212, -0.08383049815893173, -0.07713597267866135, -0.07044143974781036, -0.06374691426753998, -0.05705238878726959, -0.05035786330699921, -0.04366333410143852, -0.03696880489587784, -0.030274279415607452, -0.023579753935337067, -0.016885224729776382, -0.010190695524215698, -0.0034961700439453125, 0.0031983572989702225, 0.009892884641885757, 0.016587411984801292, 0.023281939327716827, 0.029976464807987213, 0.0366709940135479, 0.04336552321910858, 0.05006004869937897, 0.05675457417964935, 0.06344909965991974, 0.07014363259077072, 0.07683815807104111, 0.08353268355131149, 0.09022721648216248, 0.09692174196243286, 0.10361626744270325, 0.11031079292297363, 0.11700531840324402, 0.123699851334095, 0.1303943693637848, 0.13708889484405518, 0.14378343522548676, 0.15047796070575714, 0.15717248618602753, 0.1638670116662979, 0.1705615371465683, 0.17725606262683868, 0.18395060300827026, 0.19064512848854065, 0.19733965396881104, 0.20403417944908142, 0.2107287049293518]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 6.0, 4.0, 3.0, 8.0, 7.0, 12.0, 18.0, 19.0, 23.0, 29.0, 43.0, 43.0, 95.0, 160.0, 266.0, 634.0, 1833.0, 9234.0, 136587.0, 3947682.0, 87999.0, 7346.0, 1397.0, 426.0, 189.0, 85.0, 41.0, 21.0, 18.0, 13.0, 10.0, 7.0, 7.0, 9.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1661376953125, -0.1598529815673828, -0.15356826782226562, -0.14728355407714844, -0.14099884033203125, -0.13471412658691406, -0.12842941284179688, -0.12214469909667969, -0.1158599853515625, -0.10957527160644531, -0.10329055786132812, -0.09700584411621094, -0.09072113037109375, -0.08443641662597656, -0.07815170288085938, -0.07186698913574219, -0.065582275390625, -0.05929756164550781, -0.053012847900390625, -0.04672813415527344, -0.04044342041015625, -0.03415870666503906, -0.027873992919921875, -0.021589279174804688, -0.0153045654296875, -0.009019851684570312, -0.002735137939453125, 0.0035495758056640625, 0.00983428955078125, 0.016119003295898438, 0.022403717041015625, 0.028688430786132812, 0.03497314453125, 0.04125785827636719, 0.047542572021484375, 0.05382728576660156, 0.06011199951171875, 0.06639671325683594, 0.07268142700195312, 0.07896614074707031, 0.0852508544921875, 0.09153556823730469, 0.09782028198242188, 0.10410499572753906, 0.11038970947265625, 0.11667442321777344, 0.12295913696289062, 0.1292438507080078, 0.135528564453125, 0.1418132781982422, 0.14809799194335938, 0.15438270568847656, 0.16066741943359375, 0.16695213317871094, 0.17323684692382812, 0.1795215606689453, 0.1858062744140625, 0.1920909881591797, 0.19837570190429688, 0.20466041564941406, 0.21094512939453125, 0.21722984313964844, 0.22351455688476562, 0.2297992706298828, 0.236083984375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 18.0, 25.0, 29.0, 56.0, 51.0, 78.0, 81.0, 85.0, 98.0, 79.0, 89.0, 71.0, 53.0, 63.0, 41.0, 22.0, 16.0, 11.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007305145263671875, -0.007009446620941162, -0.006713747978210449, -0.006418049335479736, -0.0061223506927490234, -0.0058266520500183105, -0.005530953407287598, -0.005235254764556885, -0.004939556121826172, -0.004643857479095459, -0.004348158836364746, -0.004052460193634033, -0.0037567615509033203, -0.0034610629081726074, -0.0031653642654418945, -0.0028696656227111816, -0.0025739669799804688, -0.002278268337249756, -0.001982569694519043, -0.00168687105178833, -0.0013911724090576172, -0.0010954737663269043, -0.0007997751235961914, -0.0005040764808654785, -0.00020837783813476562, 8.732080459594727e-05, 0.00038301944732666016, 0.000678718090057373, 0.0009744167327880859, 0.0012701153755187988, 0.0015658140182495117, 0.0018615126609802246, 0.0021572113037109375, 0.0024529099464416504, 0.0027486085891723633, 0.003044307231903076, 0.003340005874633789, 0.003635704517364502, 0.003931403160095215, 0.004227101802825928, 0.004522800445556641, 0.0048184990882873535, 0.005114197731018066, 0.005409896373748779, 0.005705595016479492, 0.006001293659210205, 0.006296992301940918, 0.006592690944671631, 0.006888389587402344, 0.007184088230133057, 0.0074797868728637695, 0.007775485515594482, 0.008071184158325195, 0.008366882801055908, 0.008662581443786621, 0.008958280086517334, 0.009253978729248047, 0.00954967737197876, 0.009845376014709473, 0.010141074657440186, 0.010436773300170898, 0.010732471942901611, 0.011028170585632324, 0.011323869228363037, 0.01161956787109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 8.0, 19.0, 35.0, 46.0, 105.0, 191.0, 467.0, 1841.0, 325037.0, 3863387.0, 2285.0, 486.0, 185.0, 84.0, 43.0, 24.0, 17.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85009765625, -0.8258514404296875, -0.801605224609375, -0.7773590087890625, -0.75311279296875, -0.7288665771484375, -0.704620361328125, -0.6803741455078125, -0.6561279296875, -0.6318817138671875, -0.607635498046875, -0.5833892822265625, -0.55914306640625, -0.5348968505859375, -0.510650634765625, -0.4864044189453125, -0.462158203125, -0.4379119873046875, -0.413665771484375, -0.3894195556640625, -0.36517333984375, -0.3409271240234375, -0.316680908203125, -0.2924346923828125, -0.2681884765625, -0.2439422607421875, -0.219696044921875, -0.1954498291015625, -0.17120361328125, -0.1469573974609375, -0.122711181640625, -0.0984649658203125, -0.07421875, -0.0499725341796875, -0.025726318359375, -0.0014801025390625, 0.02276611328125, 0.0470123291015625, 0.071258544921875, 0.0955047607421875, 0.1197509765625, 0.1439971923828125, 0.168243408203125, 0.1924896240234375, 0.21673583984375, 0.2409820556640625, 0.265228271484375, 0.2894744873046875, 0.313720703125, 0.3379669189453125, 0.362213134765625, 0.3864593505859375, 0.41070556640625, 0.4349517822265625, 0.459197998046875, 0.4834442138671875, 0.5076904296875, 0.5319366455078125, 0.556182861328125, 0.5804290771484375, 0.60467529296875, 0.6289215087890625, 0.653167724609375, 0.6774139404296875, 0.70166015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 9.0, 14.0, 15.0, 35.0, 52.0, 123.0, 332.0, 1913.0, 1116.0, 269.0, 111.0, 45.0, 19.0, 13.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0], "bins": [-0.0762939453125, -0.07479429244995117, -0.07329463958740234, -0.07179498672485352, -0.07029533386230469, -0.06879568099975586, -0.06729602813720703, -0.0657963752746582, -0.06429672241210938, -0.06279706954956055, -0.06129741668701172, -0.05979776382446289, -0.05829811096191406, -0.056798458099365234, -0.055298805236816406, -0.05379915237426758, -0.05229949951171875, -0.05079984664916992, -0.049300193786621094, -0.047800540924072266, -0.04630088806152344, -0.04480123519897461, -0.04330158233642578, -0.04180192947387695, -0.040302276611328125, -0.0388026237487793, -0.03730297088623047, -0.03580331802368164, -0.03430366516113281, -0.032804012298583984, -0.031304359436035156, -0.029804706573486328, -0.0283050537109375, -0.026805400848388672, -0.025305747985839844, -0.023806095123291016, -0.022306442260742188, -0.02080678939819336, -0.01930713653564453, -0.017807483673095703, -0.016307830810546875, -0.014808177947998047, -0.013308525085449219, -0.01180887222290039, -0.010309219360351562, -0.008809566497802734, -0.007309913635253906, -0.005810260772705078, -0.00431060791015625, -0.002810955047607422, -0.0013113021850585938, 0.00018835067749023438, 0.0016880035400390625, 0.0031876564025878906, 0.004687309265136719, 0.006186962127685547, 0.007686614990234375, 0.009186267852783203, 0.010685920715332031, 0.01218557357788086, 0.013685226440429688, 0.015184879302978516, 0.016684532165527344, 0.018184185028076172, 0.019683837890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 10.0, 11.0, 19.0, 65.0, 256.0, 444.0, 138.0, 38.0, 14.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318445086479187, -0.29758262634277344, -0.27672016620635986, -0.2558577060699463, -0.2349952757358551, -0.21413281559944153, -0.19327035546302795, -0.17240791022777557, -0.151545450091362, -0.13068298995494843, -0.10982054471969604, -0.08895808458328247, -0.0680956318974495, -0.047233179211616516, -0.026370719075202942, -0.0055082738399505615, 0.015354186296463013, 0.03621663898229599, 0.057079095393419266, 0.07794155180454254, 0.09880400449037552, 0.1196664571762085, 0.14052891731262207, 0.16139136254787445, 0.18225382268428802, 0.2031162828207016, 0.22397872805595398, 0.24484118819236755, 0.26570364832878113, 0.2865660786628723, 0.3074285387992859, 0.32829099893569946, 0.34915345907211304, 0.3700159192085266, 0.3908783793449402, 0.41174083948135376, 0.43260326981544495, 0.4534657299518585, 0.4743281900882721, 0.4951906204223633, 0.5160530805587769, 0.5369155406951904, 0.557778000831604, 0.5786404609680176, 0.5995029211044312, 0.6203653812408447, 0.6412278413772583, 0.6620902419090271, 0.6829527616500854, 0.703815221786499, 0.7246776819229126, 0.7455401420593262, 0.7664026021957397, 0.7872650623321533, 0.8081275224685669, 0.8289899230003357, 0.8498523831367493, 0.8707148432731628, 0.8915773034095764, 0.91243976354599, 0.9333022236824036, 0.9541646242141724, 0.9750270843505859, 0.9958895444869995, 1.016752004623413]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 4.0, 6.0, 10.0, 10.0, 12.0, 24.0, 22.0, 25.0, 34.0, 40.0, 45.0, 52.0, 56.0, 40.0, 57.0, 46.0, 59.0, 48.0, 75.0, 47.0, 53.0, 49.0, 36.0, 34.0, 25.0, 15.0, 17.0, 11.0, 11.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10676193237304688, -0.10338378697633743, -0.10000564157962799, -0.09662750363349915, -0.0932493582367897, -0.08987121284008026, -0.08649307489395142, -0.08311492949724197, -0.07973678410053253, -0.07635863870382309, -0.07298049330711365, -0.0696023553609848, -0.06622420996427536, -0.06284606456756592, -0.059467922896146774, -0.05608978122472763, -0.05271163582801819, -0.049333490431308746, -0.0459553487598896, -0.04257720708847046, -0.03919906169176102, -0.035820916295051575, -0.03244277462363243, -0.029064631089568138, -0.025686487555503845, -0.022308344021439552, -0.01893020048737526, -0.015552056953310966, -0.012173913419246674, -0.00879576988518238, -0.005417626351118088, -0.002039482817053795, 0.001338660717010498, 0.004716804251074791, 0.008094947785139084, 0.011473091319203377, 0.01485123485326767, 0.018229378387331963, 0.021607521921396255, 0.02498566545546055, 0.02836380898952484, 0.03174195438623428, 0.03512009605765343, 0.03849823772907257, 0.04187638312578201, 0.045254528522491455, 0.0486326701939106, 0.05201081186532974, 0.055388957262039185, 0.05876710265874863, 0.06214524433016777, 0.06552338600158691, 0.06890153139829636, 0.0722796767950058, 0.07565781474113464, 0.07903596013784409, 0.08241410553455353, 0.08579225093126297, 0.08917039632797241, 0.09254853427410126, 0.0959266796708107, 0.09930482506752014, 0.10268296301364899, 0.10606110841035843, 0.10943925380706787]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 15.0, 21.0, 24.0, 38.0, 59.0, 94.0, 126.0, 249.0, 405.0, 831.0, 2189.0, 9094.0, 75962.0, 837142.0, 106801.0, 11068.0, 2568.0, 928.0, 420.0, 168.0, 103.0, 71.0, 39.0, 30.0, 26.0, 16.0, 13.0, 7.0, 10.0, 8.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.2027263641357422, -0.19536972045898438, -0.18801307678222656, -0.18065643310546875, -0.17329978942871094, -0.16594314575195312, -0.1585865020751953, -0.1512298583984375, -0.1438732147216797, -0.13651657104492188, -0.12915992736816406, -0.12180328369140625, -0.11444664001464844, -0.10708999633789062, -0.09973335266113281, -0.092376708984375, -0.08502006530761719, -0.07766342163085938, -0.07030677795410156, -0.06295013427734375, -0.05559349060058594, -0.048236846923828125, -0.04088020324707031, -0.0335235595703125, -0.026166915893554688, -0.018810272216796875, -0.011453628540039062, -0.00409698486328125, 0.0032596588134765625, 0.010616302490234375, 0.017972946166992188, 0.02532958984375, 0.03268623352050781, 0.040042877197265625, 0.04739952087402344, 0.05475616455078125, 0.06211280822753906, 0.06946945190429688, 0.07682609558105469, 0.0841827392578125, 0.09153938293457031, 0.09889602661132812, 0.10625267028808594, 0.11360931396484375, 0.12096595764160156, 0.12832260131835938, 0.1356792449951172, 0.143035888671875, 0.1503925323486328, 0.15774917602539062, 0.16510581970214844, 0.17246246337890625, 0.17981910705566406, 0.18717575073242188, 0.1945323944091797, 0.2018890380859375, 0.2092456817626953, 0.21660232543945312, 0.22395896911621094, 0.23131561279296875, 0.23867225646972656, 0.24602890014648438, 0.2533855438232422, 0.2607421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 14.0, 17.0, 16.0, 27.0, 32.0, 42.0, 51.0, 62.0, 60.0, 67.0, 76.0, 62.0, 74.0, 64.0, 68.0, 62.0, 52.0, 48.0, 20.0, 16.0, 18.0, 18.0, 10.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008087158203125, -0.007769465446472168, -0.007451772689819336, -0.007134079933166504, -0.006816387176513672, -0.00649869441986084, -0.006181001663208008, -0.005863308906555176, -0.005545616149902344, -0.005227923393249512, -0.00491023063659668, -0.004592537879943848, -0.004274845123291016, -0.003957152366638184, -0.0036394596099853516, -0.0033217668533325195, -0.0030040740966796875, -0.0026863813400268555, -0.0023686885833740234, -0.0020509958267211914, -0.0017333030700683594, -0.0014156103134155273, -0.0010979175567626953, -0.0007802248001098633, -0.00046253204345703125, -0.00014483928680419922, 0.0001728534698486328, 0.0004905462265014648, 0.0008082389831542969, 0.001125931739807129, 0.001443624496459961, 0.001761317253112793, 0.002079010009765625, 0.002396702766418457, 0.002714395523071289, 0.003032088279724121, 0.003349781036376953, 0.003667473793029785, 0.003985166549682617, 0.004302859306335449, 0.004620552062988281, 0.004938244819641113, 0.005255937576293945, 0.005573630332946777, 0.005891323089599609, 0.006209015846252441, 0.0065267086029052734, 0.0068444013595581055, 0.0071620941162109375, 0.0074797868728637695, 0.0077974796295166016, 0.008115172386169434, 0.008432865142822266, 0.008750557899475098, 0.00906825065612793, 0.009385943412780762, 0.009703636169433594, 0.010021328926086426, 0.010339021682739258, 0.01065671443939209, 0.010974407196044922, 0.011292099952697754, 0.011609792709350586, 0.011927485466003418, 0.01224517822265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 11.0, 19.0, 16.0, 27.0, 24.0, 34.0, 68.0, 98.0, 177.0, 274.0, 511.0, 1240.0, 3585.0, 14064.0, 94423.0, 704819.0, 196940.0, 23884.0, 5119.0, 1641.0, 666.0, 347.0, 187.0, 121.0, 85.0, 51.0, 36.0, 18.0, 13.0, 11.0, 10.0, 11.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10150146484375, -0.09754467010498047, -0.09358787536621094, -0.0896310806274414, -0.08567428588867188, -0.08171749114990234, -0.07776069641113281, -0.07380390167236328, -0.06984710693359375, -0.06589031219482422, -0.06193351745605469, -0.057976722717285156, -0.054019927978515625, -0.050063133239746094, -0.04610633850097656, -0.04214954376220703, -0.0381927490234375, -0.03423595428466797, -0.030279159545898438, -0.026322364807128906, -0.022365570068359375, -0.018408775329589844, -0.014451980590820312, -0.010495185852050781, -0.00653839111328125, -0.0025815963745117188, 0.0013751983642578125, 0.005331993103027344, 0.009288787841796875, 0.013245582580566406, 0.017202377319335938, 0.02115917205810547, 0.025115966796875, 0.02907276153564453, 0.03302955627441406, 0.036986351013183594, 0.040943145751953125, 0.044899940490722656, 0.04885673522949219, 0.05281352996826172, 0.05677032470703125, 0.06072711944580078, 0.06468391418457031, 0.06864070892333984, 0.07259750366210938, 0.0765542984008789, 0.08051109313964844, 0.08446788787841797, 0.0884246826171875, 0.09238147735595703, 0.09633827209472656, 0.1002950668334961, 0.10425186157226562, 0.10820865631103516, 0.11216545104980469, 0.11612224578857422, 0.12007904052734375, 0.12403583526611328, 0.1279926300048828, 0.13194942474365234, 0.13590621948242188, 0.1398630142211914, 0.14381980895996094, 0.14777660369873047, 0.1517333984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 12.0, 12.0, 13.0, 13.0, 20.0, 13.0, 20.0, 31.0, 34.0, 44.0, 41.0, 42.0, 37.0, 39.0, 48.0, 45.0, 46.0, 41.0, 50.0, 48.0, 45.0, 29.0, 32.0, 36.0, 30.0, 33.0, 23.0, 19.0, 18.0, 14.0, 10.0, 10.0, 12.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.035919189453125, -0.03477668762207031, -0.033634185791015625, -0.03249168395996094, -0.03134918212890625, -0.030206680297851562, -0.029064178466796875, -0.027921676635742188, -0.0267791748046875, -0.025636672973632812, -0.024494171142578125, -0.023351669311523438, -0.02220916748046875, -0.021066665649414062, -0.019924163818359375, -0.018781661987304688, -0.01763916015625, -0.016496658325195312, -0.015354156494140625, -0.014211654663085938, -0.01306915283203125, -0.011926651000976562, -0.010784149169921875, -0.009641647338867188, -0.0084991455078125, -0.0073566436767578125, -0.006214141845703125, -0.0050716400146484375, -0.00392913818359375, -0.0027866363525390625, -0.001644134521484375, -0.0005016326904296875, 0.000640869140625, 0.0017833709716796875, 0.002925872802734375, 0.0040683746337890625, 0.00521087646484375, 0.0063533782958984375, 0.007495880126953125, 0.008638381958007812, 0.0097808837890625, 0.010923385620117188, 0.012065887451171875, 0.013208389282226562, 0.01435089111328125, 0.015493392944335938, 0.016635894775390625, 0.017778396606445312, 0.0189208984375, 0.020063400268554688, 0.021205902099609375, 0.022348403930664062, 0.02349090576171875, 0.024633407592773438, 0.025775909423828125, 0.026918411254882812, 0.0280609130859375, 0.029203414916992188, 0.030345916748046875, 0.03148841857910156, 0.03263092041015625, 0.03377342224121094, 0.034915924072265625, 0.03605842590332031, 0.037200927734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 12.0, 10.0, 18.0, 30.0, 39.0, 77.0, 139.0, 327.0, 928.0, 3740.0, 49336.0, 923044.0, 64880.0, 4311.0, 956.0, 328.0, 157.0, 77.0, 50.0, 27.0, 16.0, 10.0, 12.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09722900390625, -0.0941457748413086, -0.09106254577636719, -0.08797931671142578, -0.08489608764648438, -0.08181285858154297, -0.07872962951660156, -0.07564640045166016, -0.07256317138671875, -0.06947994232177734, -0.06639671325683594, -0.06331348419189453, -0.060230255126953125, -0.05714702606201172, -0.05406379699707031, -0.050980567932128906, -0.0478973388671875, -0.044814109802246094, -0.04173088073730469, -0.03864765167236328, -0.035564422607421875, -0.03248119354248047, -0.029397964477539062, -0.026314735412597656, -0.02323150634765625, -0.020148277282714844, -0.017065048217773438, -0.013981819152832031, -0.010898590087890625, -0.007815361022949219, -0.0047321319580078125, -0.0016489028930664062, 0.001434326171875, 0.004517555236816406, 0.0076007843017578125, 0.010684013366699219, 0.013767242431640625, 0.01685047149658203, 0.019933700561523438, 0.023016929626464844, 0.02610015869140625, 0.029183387756347656, 0.03226661682128906, 0.03534984588623047, 0.038433074951171875, 0.04151630401611328, 0.04459953308105469, 0.047682762145996094, 0.0507659912109375, 0.053849220275878906, 0.05693244934082031, 0.06001567840576172, 0.06309890747070312, 0.06618213653564453, 0.06926536560058594, 0.07234859466552734, 0.07543182373046875, 0.07851505279541016, 0.08159828186035156, 0.08468151092529297, 0.08776473999023438, 0.09084796905517578, 0.09393119812011719, 0.0970144271850586, 0.10009765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 9.0, 10.0, 16.0, 33.0, 39.0, 54.0, 56.0, 75.0, 91.0, 81.0, 95.0, 76.0, 82.0, 65.0, 63.0, 32.0, 39.0, 19.0, 20.0, 17.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.055002212524414e-05, -1.0224059224128723e-05, -9.898096323013306e-06, -9.572133421897888e-06, -9.24617052078247e-06, -8.920207619667053e-06, -8.594244718551636e-06, -8.268281817436218e-06, -7.9423189163208e-06, -7.616356015205383e-06, -7.290393114089966e-06, -6.964430212974548e-06, -6.638467311859131e-06, -6.312504410743713e-06, -5.986541509628296e-06, -5.660578608512878e-06, -5.334615707397461e-06, -5.0086528062820435e-06, -4.682689905166626e-06, -4.3567270040512085e-06, -4.030764102935791e-06, -3.7048012018203735e-06, -3.378838300704956e-06, -3.0528753995895386e-06, -2.726912498474121e-06, -2.4009495973587036e-06, -2.074986696243286e-06, -1.7490237951278687e-06, -1.4230608940124512e-06, -1.0970979928970337e-06, -7.711350917816162e-07, -4.4517219066619873e-07, -1.1920928955078125e-07, 2.0675361156463623e-07, 5.327165126800537e-07, 8.586794137954712e-07, 1.1846423149108887e-06, 1.5106052160263062e-06, 1.8365681171417236e-06, 2.162531018257141e-06, 2.4884939193725586e-06, 2.814456820487976e-06, 3.1404197216033936e-06, 3.466382622718811e-06, 3.7923455238342285e-06, 4.118308424949646e-06, 4.4442713260650635e-06, 4.770234227180481e-06, 5.0961971282958984e-06, 5.422160029411316e-06, 5.748122930526733e-06, 6.074085831642151e-06, 6.400048732757568e-06, 6.726011633872986e-06, 7.051974534988403e-06, 7.377937436103821e-06, 7.703900337219238e-06, 8.029863238334656e-06, 8.355826139450073e-06, 8.68178904056549e-06, 9.007751941680908e-06, 9.333714842796326e-06, 9.659677743911743e-06, 9.98564064502716e-06, 1.0311603546142578e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 13.0, 34.0, 31.0, 50.0, 86.0, 148.0, 203.0, 470.0, 1142.0, 3466.0, 17503.0, 222995.0, 724424.0, 65866.0, 8488.0, 2105.0, 715.0, 354.0, 161.0, 88.0, 57.0, 33.0, 25.0, 21.0, 14.0, 11.0, 10.0, 2.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.06829833984375, -0.0664668083190918, -0.0646352767944336, -0.06280374526977539, -0.06097221374511719, -0.059140682220458984, -0.05730915069580078, -0.05547761917114258, -0.053646087646484375, -0.05181455612182617, -0.04998302459716797, -0.048151493072509766, -0.04631996154785156, -0.04448843002319336, -0.042656898498535156, -0.04082536697387695, -0.03899383544921875, -0.03716230392456055, -0.035330772399902344, -0.03349924087524414, -0.03166770935058594, -0.029836177825927734, -0.02800464630126953, -0.026173114776611328, -0.024341583251953125, -0.022510051727294922, -0.02067852020263672, -0.018846988677978516, -0.017015457153320312, -0.01518392562866211, -0.013352394104003906, -0.011520862579345703, -0.0096893310546875, -0.007857799530029297, -0.006026268005371094, -0.004194736480712891, -0.0023632049560546875, -0.0005316734313964844, 0.0012998580932617188, 0.003131389617919922, 0.004962921142578125, 0.006794452667236328, 0.008625984191894531, 0.010457515716552734, 0.012289047241210938, 0.01412057876586914, 0.015952110290527344, 0.017783641815185547, 0.01961517333984375, 0.021446704864501953, 0.023278236389160156, 0.02510976791381836, 0.026941299438476562, 0.028772830963134766, 0.03060436248779297, 0.03243589401245117, 0.034267425537109375, 0.03609895706176758, 0.03793048858642578, 0.039762020111083984, 0.04159355163574219, 0.04342508316040039, 0.045256614685058594, 0.0470881462097168, 0.048919677734375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 13.0, 19.0, 25.0, 37.0, 43.0, 67.0, 63.0, 96.0, 93.0, 97.0, 92.0, 95.0, 62.0, 51.0, 35.0, 28.0, 26.0, 9.0, 8.0, 8.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041412353515625, -0.040204524993896484, -0.03899669647216797, -0.03778886795043945, -0.03658103942871094, -0.03537321090698242, -0.034165382385253906, -0.03295755386352539, -0.031749725341796875, -0.03054189682006836, -0.029334068298339844, -0.028126239776611328, -0.026918411254882812, -0.025710582733154297, -0.02450275421142578, -0.023294925689697266, -0.02208709716796875, -0.020879268646240234, -0.01967144012451172, -0.018463611602783203, -0.017255783081054688, -0.016047954559326172, -0.014840126037597656, -0.01363229751586914, -0.012424468994140625, -0.01121664047241211, -0.010008811950683594, -0.008800983428955078, -0.0075931549072265625, -0.006385326385498047, -0.005177497863769531, -0.003969669342041016, -0.0027618408203125, -0.0015540122985839844, -0.00034618377685546875, 0.0008616447448730469, 0.0020694732666015625, 0.003277301788330078, 0.004485130310058594, 0.005692958831787109, 0.006900787353515625, 0.00810861587524414, 0.009316444396972656, 0.010524272918701172, 0.011732101440429688, 0.012939929962158203, 0.014147758483886719, 0.015355587005615234, 0.01656341552734375, 0.017771244049072266, 0.01897907257080078, 0.020186901092529297, 0.021394729614257812, 0.022602558135986328, 0.023810386657714844, 0.02501821517944336, 0.026226043701171875, 0.02743387222290039, 0.028641700744628906, 0.029849529266357422, 0.031057357788085938, 0.03226518630981445, 0.03347301483154297, 0.034680843353271484, 0.035888671875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 20.0, 45.0, 204.0, 412.0, 233.0, 50.0, 23.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7504279017448425, -0.7155011296272278, -0.6805742979049683, -0.6456475257873535, -0.610720694065094, -0.5757939219474792, -0.5408670902252197, -0.505940318107605, -0.47101351618766785, -0.4360867142677307, -0.4011599123477936, -0.36623311042785645, -0.3313063383102417, -0.2963795065879822, -0.26145273447036743, -0.2265259325504303, -0.19159913063049316, -0.15667232871055603, -0.1217455342411995, -0.08681873977184296, -0.05189193785190582, -0.01696513593196869, 0.01796165108680725, 0.052888453006744385, 0.08781525492668152, 0.12274205684661865, 0.1576688587665558, 0.19259564578533173, 0.22752244770526886, 0.2624492645263672, 0.29737603664398193, 0.33230283856391907, 0.3672295808792114, 0.40215638279914856, 0.4370831847190857, 0.47200995683670044, 0.50693678855896, 0.5418635606765747, 0.5767903327941895, 0.611717164516449, 0.6466439962387085, 0.6815707683563232, 0.7164976000785828, 0.7514243721961975, 0.786351203918457, 0.8212779760360718, 0.8562047481536865, 0.891131579875946, 0.9260583519935608, 0.9609851241111755, 0.9959119558334351, 1.0308387279510498, 1.0657655000686646, 1.1006923913955688, 1.1356191635131836, 1.1705459356307983, 1.205472707748413, 1.2403994798660278, 1.2753262519836426, 1.3102531433105469, 1.3451799154281616, 1.3801066875457764, 1.4150334596633911, 1.4499602317810059, 1.4848871231079102]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 5.0, 10.0, 13.0, 16.0, 21.0, 26.0, 29.0, 31.0, 43.0, 41.0, 52.0, 50.0, 48.0, 85.0, 68.0, 66.0, 47.0, 69.0, 46.0, 34.0, 56.0, 34.0, 23.0, 21.0, 15.0, 9.0, 12.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33691900968551636, -0.32644206285476685, -0.31596511602401733, -0.3054881691932678, -0.2950111925601959, -0.2845342457294464, -0.2740572988986969, -0.2635803520679474, -0.2531033754348755, -0.24262642860412598, -0.23214946687221527, -0.22167252004146576, -0.21119555830955505, -0.20071861147880554, -0.19024166464805603, -0.17976471781730652, -0.169287770986557, -0.1588108241558075, -0.1483338624238968, -0.13785691559314728, -0.12737995386123657, -0.11690300703048706, -0.10642606019973755, -0.09594910591840744, -0.08547215163707733, -0.07499519735574722, -0.06451824307441711, -0.0540412962436676, -0.043564341962337494, -0.033087387681007385, -0.022610440850257874, -0.012133486568927765, -0.0016565322875976562, 0.008820420131087303, 0.019297372549772263, 0.029774323105812073, 0.04025127738714218, 0.05072823166847229, 0.0612051784992218, 0.07168213278055191, 0.08215908706188202, 0.09263604134321213, 0.10311299562454224, 0.11358994245529175, 0.12406689673662186, 0.13454385101795197, 0.14502079784870148, 0.15549775958061218, 0.1659747064113617, 0.1764516532421112, 0.1869286149740219, 0.19740556180477142, 0.20788252353668213, 0.21835947036743164, 0.22883641719818115, 0.23931336402893066, 0.24979032576084137, 0.2602672874927521, 0.2707442343235016, 0.2812211811542511, 0.2916981279850006, 0.3021751046180725, 0.312652051448822, 0.32312899827957153, 0.33360594511032104]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 7.0, 10.0, 15.0, 12.0, 31.0, 55.0, 77.0, 125.0, 286.0, 666.0, 1806.0, 7882.0, 141155.0, 3983261.0, 51912.0, 4961.0, 1251.0, 403.0, 187.0, 70.0, 47.0, 19.0, 13.0, 8.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.1889629364013672, -0.18151473999023438, -0.17406654357910156, -0.16661834716796875, -0.15917015075683594, -0.15172195434570312, -0.1442737579345703, -0.1368255615234375, -0.1293773651123047, -0.12192916870117188, -0.11448097229003906, -0.10703277587890625, -0.09958457946777344, -0.09213638305664062, -0.08468818664550781, -0.077239990234375, -0.06979179382324219, -0.062343597412109375, -0.05489540100097656, -0.04744720458984375, -0.03999900817871094, -0.032550811767578125, -0.025102615356445312, -0.0176544189453125, -0.010206222534179688, -0.002758026123046875, 0.0046901702880859375, 0.01213836669921875, 0.019586563110351562, 0.027034759521484375, 0.03448295593261719, 0.04193115234375, 0.04937934875488281, 0.056827545166015625, 0.06427574157714844, 0.07172393798828125, 0.07917213439941406, 0.08662033081054688, 0.09406852722167969, 0.1015167236328125, 0.10896492004394531, 0.11641311645507812, 0.12386131286621094, 0.13130950927734375, 0.13875770568847656, 0.14620590209960938, 0.1536540985107422, 0.161102294921875, 0.1685504913330078, 0.17599868774414062, 0.18344688415527344, 0.19089508056640625, 0.19834327697753906, 0.20579147338867188, 0.2132396697998047, 0.2206878662109375, 0.2281360626220703, 0.23558425903320312, 0.24303245544433594, 0.25048065185546875, 0.25792884826660156, 0.2653770446777344, 0.2728252410888672, 0.2802734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 12.0, 20.0, 17.0, 30.0, 38.0, 50.0, 65.0, 78.0, 77.0, 94.0, 101.0, 73.0, 82.0, 58.0, 57.0, 43.0, 33.0, 19.0, 11.0, 11.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01206207275390625, -0.011661171913146973, -0.011260271072387695, -0.010859370231628418, -0.01045846939086914, -0.010057568550109863, -0.009656667709350586, -0.009255766868591309, -0.008854866027832031, -0.008453965187072754, -0.008053064346313477, -0.007652163505554199, -0.007251262664794922, -0.0068503618240356445, -0.006449460983276367, -0.00604856014251709, -0.0056476593017578125, -0.005246758460998535, -0.004845857620239258, -0.0044449567794799805, -0.004044055938720703, -0.0036431550979614258, -0.0032422542572021484, -0.002841353416442871, -0.0024404525756835938, -0.0020395517349243164, -0.001638650894165039, -0.0012377500534057617, -0.0008368492126464844, -0.00043594837188720703, -3.504753112792969e-05, 0.00036585330963134766, 0.000766754150390625, 0.0011676549911499023, 0.0015685558319091797, 0.001969456672668457, 0.0023703575134277344, 0.0027712583541870117, 0.003172159194946289, 0.0035730600357055664, 0.003973960876464844, 0.004374861717224121, 0.0047757625579833984, 0.005176663398742676, 0.005577564239501953, 0.0059784650802612305, 0.006379365921020508, 0.006780266761779785, 0.0071811676025390625, 0.00758206844329834, 0.007982969284057617, 0.008383870124816895, 0.008784770965576172, 0.00918567180633545, 0.009586572647094727, 0.009987473487854004, 0.010388374328613281, 0.010789275169372559, 0.011190176010131836, 0.011591076850891113, 0.01199197769165039, 0.012392878532409668, 0.012793779373168945, 0.013194680213928223, 0.0135955810546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 6.0, 3.0, 10.0, 12.0, 11.0, 19.0, 24.0, 35.0, 29.0, 56.0, 92.0, 164.0, 402.0, 6559.0, 4184156.0, 1972.0, 301.0, 131.0, 85.0, 53.0, 42.0, 35.0, 25.0, 22.0, 11.0, 8.0, 5.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.849609375, -0.8216323852539062, -0.7936553955078125, -0.7656784057617188, -0.737701416015625, -0.7097244262695312, -0.6817474365234375, -0.6537704467773438, -0.62579345703125, -0.5978164672851562, -0.5698394775390625, -0.5418624877929688, -0.513885498046875, -0.48590850830078125, -0.4579315185546875, -0.42995452880859375, -0.4019775390625, -0.37400054931640625, -0.3460235595703125, -0.31804656982421875, -0.290069580078125, -0.26209259033203125, -0.2341156005859375, -0.20613861083984375, -0.17816162109375, -0.15018463134765625, -0.1222076416015625, -0.09423065185546875, -0.066253662109375, -0.03827667236328125, -0.0102996826171875, 0.01767730712890625, 0.045654296875, 0.07363128662109375, 0.1016082763671875, 0.12958526611328125, 0.157562255859375, 0.18553924560546875, 0.2135162353515625, 0.24149322509765625, 0.26947021484375, 0.29744720458984375, 0.3254241943359375, 0.35340118408203125, 0.381378173828125, 0.40935516357421875, 0.4373321533203125, 0.46530914306640625, 0.4932861328125, 0.5212631225585938, 0.5492401123046875, 0.5772171020507812, 0.605194091796875, 0.6331710815429688, 0.6611480712890625, 0.6891250610351562, 0.71710205078125, 0.7450790405273438, 0.7730560302734375, 0.8010330200195312, 0.829010009765625, 0.8569869995117188, 0.8849639892578125, 0.9129409790039062, 0.94091796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 11.0, 6.0, 25.0, 89.0, 395.0, 2286.0, 991.0, 178.0, 56.0, 22.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031768798828125, -0.029616832733154297, -0.027464866638183594, -0.02531290054321289, -0.023160934448242188, -0.021008968353271484, -0.01885700225830078, -0.016705036163330078, -0.014553070068359375, -0.012401103973388672, -0.010249137878417969, -0.008097171783447266, -0.0059452056884765625, -0.0037932395935058594, -0.0016412734985351562, 0.0005106925964355469, 0.00266265869140625, 0.004814624786376953, 0.006966590881347656, 0.00911855697631836, 0.011270523071289062, 0.013422489166259766, 0.015574455261230469, 0.017726421356201172, 0.019878387451171875, 0.022030353546142578, 0.02418231964111328, 0.026334285736083984, 0.028486251831054688, 0.03063821792602539, 0.032790184020996094, 0.0349421501159668, 0.0370941162109375, 0.0392460823059082, 0.041398048400878906, 0.04355001449584961, 0.04570198059082031, 0.047853946685791016, 0.05000591278076172, 0.05215787887573242, 0.054309844970703125, 0.05646181106567383, 0.05861377716064453, 0.060765743255615234, 0.06291770935058594, 0.06506967544555664, 0.06722164154052734, 0.06937360763549805, 0.07152557373046875, 0.07367753982543945, 0.07582950592041016, 0.07798147201538086, 0.08013343811035156, 0.08228540420532227, 0.08443737030029297, 0.08658933639526367, 0.08874130249023438, 0.09089326858520508, 0.09304523468017578, 0.09519720077514648, 0.09734916687011719, 0.09950113296508789, 0.1016530990600586, 0.1038050651550293, 0.10595703125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 62.0, 226.0, 415.0, 203.0, 55.0, 18.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3865686058998108, -0.370013028383255, -0.3534574806690216, -0.3369019031524658, -0.3203463554382324, -0.30379077792167664, -0.28723520040512085, -0.27067965269088745, -0.25412407517433167, -0.23756851255893707, -0.22101294994354248, -0.2044573724269867, -0.1879018098115921, -0.1713462471961975, -0.15479066967964172, -0.13823510706424713, -0.12167954444885254, -0.10512398183345795, -0.08856841176748276, -0.07201284170150757, -0.055457279086112976, -0.038901716470718384, -0.022346146404743195, -0.005790576338768005, 0.010764986276626587, 0.027320552617311478, 0.04387611895799637, 0.06043168529868126, 0.07698725163936615, 0.09354281425476074, 0.11009838432073593, 0.12665395438671112, 0.14320945739746094, 0.15976502001285553, 0.17632058262825012, 0.1928761601448059, 0.2094317227602005, 0.2259872853755951, 0.24254286289215088, 0.2590984106063843, 0.27565398812294006, 0.29220956563949585, 0.30876511335372925, 0.32532069087028503, 0.3418762683868408, 0.3584318161010742, 0.37498739361763, 0.3915429711341858, 0.4080985188484192, 0.424654096364975, 0.4412096440792084, 0.45776522159576416, 0.47432076930999756, 0.49087634682655334, 0.5074319243431091, 0.5239874720573425, 0.5405430793762207, 0.5570986270904541, 0.5736542344093323, 0.5902097821235657, 0.6067653298377991, 0.6233209371566772, 0.6398764848709106, 0.656432032585144, 0.6729875802993774]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 29.0, 39.0, 51.0, 65.0, 90.0, 97.0, 113.0, 95.0, 123.0, 99.0, 59.0, 52.0, 30.0, 24.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235720694065094, -0.22942300140857697, -0.22312530875205994, -0.2168276160955429, -0.21052992343902588, -0.20423223078250885, -0.19793453812599182, -0.1916368454694748, -0.18533915281295776, -0.17904146015644073, -0.1727437674999237, -0.16644607484340668, -0.16014838218688965, -0.15385068953037262, -0.1475529968738556, -0.14125530421733856, -0.13495761156082153, -0.1286599189043045, -0.12236222624778748, -0.11606453359127045, -0.10976684093475342, -0.10346914827823639, -0.09717145562171936, -0.09087376296520233, -0.0845760703086853, -0.07827837765216827, -0.07198068499565125, -0.06568299233913422, -0.05938529968261719, -0.05308760702610016, -0.04678991436958313, -0.0404922217130661, -0.03419452905654907, -0.027896836400032043, -0.021599143743515015, -0.015301451086997986, -0.009003758430480957, -0.0027060657739639282, 0.0035916268825531006, 0.00988931953907013, 0.016187012195587158, 0.022484704852104187, 0.028782397508621216, 0.035080090165138245, 0.04137778282165527, 0.0476754754781723, 0.05397316813468933, 0.06027086079120636, 0.06656855344772339, 0.07286624610424042, 0.07916393876075745, 0.08546163141727448, 0.0917593240737915, 0.09805701673030853, 0.10435470938682556, 0.11065240204334259, 0.11695009469985962, 0.12324778735637665, 0.12954548001289368, 0.1358431726694107, 0.14214086532592773, 0.14843855798244476, 0.1547362506389618, 0.16103394329547882, 0.16733163595199585]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 13.0, 7.0, 14.0, 20.0, 24.0, 27.0, 55.0, 73.0, 89.0, 152.0, 217.0, 344.0, 650.0, 1275.0, 3253.0, 9543.0, 38552.0, 232306.0, 596397.0, 129175.0, 24844.0, 6724.0, 2375.0, 1033.0, 500.0, 308.0, 199.0, 118.0, 83.0, 54.0, 30.0, 20.0, 28.0, 9.0, 11.0, 6.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.107421875, -0.10410118103027344, -0.10078048706054688, -0.09745979309082031, -0.09413909912109375, -0.09081840515136719, -0.08749771118164062, -0.08417701721191406, -0.0808563232421875, -0.07753562927246094, -0.07421493530273438, -0.07089424133300781, -0.06757354736328125, -0.06425285339355469, -0.060932159423828125, -0.05761146545410156, -0.054290771484375, -0.05097007751464844, -0.047649383544921875, -0.04432868957519531, -0.04100799560546875, -0.03768730163574219, -0.034366607666015625, -0.031045913696289062, -0.0277252197265625, -0.024404525756835938, -0.021083831787109375, -0.017763137817382812, -0.01444244384765625, -0.011121749877929688, -0.007801055908203125, -0.0044803619384765625, -0.00115966796875, 0.0021610260009765625, 0.005481719970703125, 0.008802413940429688, 0.01212310791015625, 0.015443801879882812, 0.018764495849609375, 0.022085189819335938, 0.0254058837890625, 0.028726577758789062, 0.032047271728515625, 0.03536796569824219, 0.03868865966796875, 0.04200935363769531, 0.045330047607421875, 0.04865074157714844, 0.051971435546875, 0.05529212951660156, 0.058612823486328125, 0.06193351745605469, 0.06525421142578125, 0.06857490539550781, 0.07189559936523438, 0.07521629333496094, 0.0785369873046875, 0.08185768127441406, 0.08517837524414062, 0.08849906921386719, 0.09181976318359375, 0.09514045715332031, 0.09846115112304688, 0.10178184509277344, 0.1051025390625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 7.0, 16.0, 20.0, 30.0, 45.0, 54.0, 62.0, 74.0, 66.0, 73.0, 87.0, 87.0, 95.0, 62.0, 53.0, 52.0, 35.0, 26.0, 15.0, 10.0, 5.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01163482666015625, -0.01120901107788086, -0.010783195495605469, -0.010357379913330078, -0.009931564331054688, -0.009505748748779297, -0.009079933166503906, -0.008654117584228516, -0.008228302001953125, -0.007802486419677734, -0.007376670837402344, -0.006950855255126953, -0.0065250396728515625, -0.006099224090576172, -0.005673408508300781, -0.005247592926025391, -0.00482177734375, -0.004395961761474609, -0.003970146179199219, -0.003544330596923828, -0.0031185150146484375, -0.002692699432373047, -0.0022668838500976562, -0.0018410682678222656, -0.001415252685546875, -0.0009894371032714844, -0.0005636215209960938, -0.00013780593872070312, 0.0002880096435546875, 0.0007138252258300781, 0.0011396408081054688, 0.0015654563903808594, 0.00199127197265625, 0.0024170875549316406, 0.0028429031372070312, 0.003268718719482422, 0.0036945343017578125, 0.004120349884033203, 0.004546165466308594, 0.004971981048583984, 0.005397796630859375, 0.005823612213134766, 0.006249427795410156, 0.006675243377685547, 0.0071010589599609375, 0.007526874542236328, 0.007952690124511719, 0.00837850570678711, 0.0088043212890625, 0.00923013687133789, 0.009655952453613281, 0.010081768035888672, 0.010507583618164062, 0.010933399200439453, 0.011359214782714844, 0.011785030364990234, 0.012210845947265625, 0.012636661529541016, 0.013062477111816406, 0.013488292694091797, 0.013914108276367188, 0.014339923858642578, 0.014765739440917969, 0.01519155502319336, 0.01561737060546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 3.0, 4.0, 12.0, 12.0, 9.0, 17.0, 39.0, 62.0, 87.0, 134.0, 230.0, 413.0, 859.0, 2177.0, 6366.0, 27838.0, 241117.0, 660484.0, 87605.0, 14372.0, 3876.0, 1405.0, 641.0, 308.0, 160.0, 124.0, 64.0, 40.0, 30.0, 15.0, 11.0, 13.0, 7.0, 6.0, 0.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11572265625, -0.11213874816894531, -0.10855484008789062, -0.10497093200683594, -0.10138702392578125, -0.09780311584472656, -0.09421920776367188, -0.09063529968261719, -0.0870513916015625, -0.08346748352050781, -0.07988357543945312, -0.07629966735839844, -0.07271575927734375, -0.06913185119628906, -0.06554794311523438, -0.06196403503417969, -0.058380126953125, -0.05479621887207031, -0.051212310791015625, -0.04762840270996094, -0.04404449462890625, -0.04046058654785156, -0.036876678466796875, -0.03329277038574219, -0.0297088623046875, -0.026124954223632812, -0.022541046142578125, -0.018957138061523438, -0.01537322998046875, -0.011789321899414062, -0.008205413818359375, -0.0046215057373046875, -0.00103759765625, 0.0025463104248046875, 0.006130218505859375, 0.009714126586914062, 0.01329803466796875, 0.016881942749023438, 0.020465850830078125, 0.024049758911132812, 0.0276336669921875, 0.031217575073242188, 0.034801483154296875, 0.03838539123535156, 0.04196929931640625, 0.04555320739746094, 0.049137115478515625, 0.05272102355957031, 0.056304931640625, 0.05988883972167969, 0.06347274780273438, 0.06705665588378906, 0.07064056396484375, 0.07422447204589844, 0.07780838012695312, 0.08139228820800781, 0.0849761962890625, 0.08856010437011719, 0.09214401245117188, 0.09572792053222656, 0.09931182861328125, 0.10289573669433594, 0.10647964477539062, 0.11006355285644531, 0.1136474609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 8.0, 4.0, 11.0, 14.0, 7.0, 14.0, 27.0, 30.0, 27.0, 27.0, 34.0, 42.0, 46.0, 31.0, 44.0, 58.0, 46.0, 63.0, 54.0, 49.0, 42.0, 31.0, 32.0, 39.0, 39.0, 31.0, 29.0, 16.0, 15.0, 13.0, 21.0, 5.0, 11.0, 8.0, 7.0, 2.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04290771484375, -0.04164266586303711, -0.04037761688232422, -0.03911256790161133, -0.03784751892089844, -0.03658246994018555, -0.035317420959472656, -0.034052371978759766, -0.032787322998046875, -0.031522274017333984, -0.030257225036621094, -0.028992176055908203, -0.027727127075195312, -0.026462078094482422, -0.02519702911376953, -0.02393198013305664, -0.02266693115234375, -0.02140188217163086, -0.02013683319091797, -0.018871784210205078, -0.017606735229492188, -0.016341686248779297, -0.015076637268066406, -0.013811588287353516, -0.012546539306640625, -0.011281490325927734, -0.010016441345214844, -0.008751392364501953, -0.0074863433837890625, -0.006221294403076172, -0.004956245422363281, -0.0036911964416503906, -0.0024261474609375, -0.0011610984802246094, 0.00010395050048828125, 0.0013689994812011719, 0.0026340484619140625, 0.003899097442626953, 0.005164146423339844, 0.006429195404052734, 0.007694244384765625, 0.008959293365478516, 0.010224342346191406, 0.011489391326904297, 0.012754440307617188, 0.014019489288330078, 0.015284538269042969, 0.01654958724975586, 0.01781463623046875, 0.01907968521118164, 0.02034473419189453, 0.021609783172607422, 0.022874832153320312, 0.024139881134033203, 0.025404930114746094, 0.026669979095458984, 0.027935028076171875, 0.029200077056884766, 0.030465126037597656, 0.03173017501831055, 0.03299522399902344, 0.03426027297973633, 0.03552532196044922, 0.03679037094116211, 0.038055419921875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 9.0, 12.0, 10.0, 20.0, 34.0, 78.0, 119.0, 196.0, 373.0, 834.0, 2282.0, 8918.0, 93255.0, 824375.0, 104339.0, 9550.0, 2406.0, 893.0, 406.0, 203.0, 107.0, 55.0, 28.0, 16.0, 15.0, 7.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04693603515625, -0.045166015625, -0.04339599609375, -0.0416259765625, -0.03985595703125, -0.0380859375, -0.03631591796875, -0.0345458984375, -0.03277587890625, -0.031005859375, -0.02923583984375, -0.0274658203125, -0.02569580078125, -0.02392578125, -0.02215576171875, -0.0203857421875, -0.01861572265625, -0.016845703125, -0.01507568359375, -0.0133056640625, -0.01153564453125, -0.009765625, -0.00799560546875, -0.0062255859375, -0.00445556640625, -0.002685546875, -0.00091552734375, 0.0008544921875, 0.00262451171875, 0.00439453125, 0.00616455078125, 0.0079345703125, 0.00970458984375, 0.011474609375, 0.01324462890625, 0.0150146484375, 0.01678466796875, 0.0185546875, 0.02032470703125, 0.0220947265625, 0.02386474609375, 0.025634765625, 0.02740478515625, 0.0291748046875, 0.03094482421875, 0.03271484375, 0.03448486328125, 0.0362548828125, 0.03802490234375, 0.039794921875, 0.04156494140625, 0.0433349609375, 0.04510498046875, 0.046875, 0.04864501953125, 0.0504150390625, 0.05218505859375, 0.053955078125, 0.05572509765625, 0.0574951171875, 0.05926513671875, 0.06103515625, 0.06280517578125, 0.0645751953125, 0.06634521484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 13.0, 11.0, 8.0, 18.0, 23.0, 28.0, 19.0, 32.0, 36.0, 39.0, 37.0, 54.0, 63.0, 52.0, 54.0, 68.0, 66.0, 50.0, 40.0, 49.0, 37.0, 31.0, 35.0, 22.0, 20.0, 16.0, 10.0, 9.0, 13.0, 8.0, 10.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.602836608886719e-06, -5.420297384262085e-06, -5.237758159637451e-06, -5.055218935012817e-06, -4.872679710388184e-06, -4.69014048576355e-06, -4.507601261138916e-06, -4.325062036514282e-06, -4.1425228118896484e-06, -3.959983587265015e-06, -3.777444362640381e-06, -3.594905138015747e-06, -3.4123659133911133e-06, -3.2298266887664795e-06, -3.0472874641418457e-06, -2.864748239517212e-06, -2.682209014892578e-06, -2.4996697902679443e-06, -2.3171305656433105e-06, -2.1345913410186768e-06, -1.952052116394043e-06, -1.7695128917694092e-06, -1.5869736671447754e-06, -1.4044344425201416e-06, -1.2218952178955078e-06, -1.039355993270874e-06, -8.568167686462402e-07, -6.742775440216064e-07, -4.917383193969727e-07, -3.0919909477233887e-07, -1.2665987014770508e-07, 5.587935447692871e-08, 2.384185791015625e-07, 4.209578037261963e-07, 6.034970283508301e-07, 7.860362529754639e-07, 9.685754776000977e-07, 1.1511147022247314e-06, 1.3336539268493652e-06, 1.516193151473999e-06, 1.6987323760986328e-06, 1.8812716007232666e-06, 2.0638108253479004e-06, 2.246350049972534e-06, 2.428889274597168e-06, 2.6114284992218018e-06, 2.7939677238464355e-06, 2.9765069484710693e-06, 3.159046173095703e-06, 3.341585397720337e-06, 3.5241246223449707e-06, 3.7066638469696045e-06, 3.889203071594238e-06, 4.071742296218872e-06, 4.254281520843506e-06, 4.43682074546814e-06, 4.6193599700927734e-06, 4.801899194717407e-06, 4.984438419342041e-06, 5.166977643966675e-06, 5.349516868591309e-06, 5.532056093215942e-06, 5.714595317840576e-06, 5.89713454246521e-06, 6.079673767089844e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 6.0, 8.0, 15.0, 20.0, 32.0, 45.0, 96.0, 178.0, 293.0, 716.0, 1558.0, 4792.0, 24876.0, 323313.0, 625251.0, 55505.0, 7769.0, 2266.0, 869.0, 416.0, 210.0, 114.0, 72.0, 48.0, 24.0, 16.0, 8.0, 10.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.05706787109375, -0.05561113357543945, -0.054154396057128906, -0.05269765853881836, -0.05124092102050781, -0.049784183502197266, -0.04832744598388672, -0.04687070846557617, -0.045413970947265625, -0.04395723342895508, -0.04250049591064453, -0.041043758392333984, -0.03958702087402344, -0.03813028335571289, -0.036673545837402344, -0.0352168083190918, -0.03376007080078125, -0.0323033332824707, -0.030846595764160156, -0.02938985824584961, -0.027933120727539062, -0.026476383209228516, -0.02501964569091797, -0.023562908172607422, -0.022106170654296875, -0.020649433135986328, -0.01919269561767578, -0.017735958099365234, -0.016279220581054688, -0.01482248306274414, -0.013365745544433594, -0.011909008026123047, -0.0104522705078125, -0.008995532989501953, -0.007538795471191406, -0.006082057952880859, -0.0046253204345703125, -0.0031685829162597656, -0.0017118453979492188, -0.0002551078796386719, 0.001201629638671875, 0.002658367156982422, 0.004115104675292969, 0.005571842193603516, 0.0070285797119140625, 0.00848531723022461, 0.009942054748535156, 0.011398792266845703, 0.01285552978515625, 0.014312267303466797, 0.015769004821777344, 0.01722574234008789, 0.018682479858398438, 0.020139217376708984, 0.02159595489501953, 0.023052692413330078, 0.024509429931640625, 0.025966167449951172, 0.02742290496826172, 0.028879642486572266, 0.030336380004882812, 0.03179311752319336, 0.033249855041503906, 0.03470659255981445, 0.036163330078125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 7.0, 7.0, 5.0, 16.0, 13.0, 27.0, 37.0, 49.0, 58.0, 79.0, 82.0, 95.0, 92.0, 104.0, 91.0, 66.0, 47.0, 32.0, 27.0, 22.0, 19.0, 9.0, 8.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.038482666015625, -0.0374448299407959, -0.0364069938659668, -0.035369157791137695, -0.034331321716308594, -0.03329348564147949, -0.03225564956665039, -0.03121781349182129, -0.030179977416992188, -0.029142141342163086, -0.028104305267333984, -0.027066469192504883, -0.02602863311767578, -0.02499079704284668, -0.023952960968017578, -0.022915124893188477, -0.021877288818359375, -0.020839452743530273, -0.019801616668701172, -0.01876378059387207, -0.01772594451904297, -0.016688108444213867, -0.015650272369384766, -0.014612436294555664, -0.013574600219726562, -0.012536764144897461, -0.01149892807006836, -0.010461091995239258, -0.009423255920410156, -0.008385419845581055, -0.007347583770751953, -0.0063097476959228516, -0.00527191162109375, -0.0042340755462646484, -0.003196239471435547, -0.0021584033966064453, -0.0011205673217773438, -8.273124694824219e-05, 0.0009551048278808594, 0.001992940902709961, 0.0030307769775390625, 0.004068613052368164, 0.005106449127197266, 0.006144285202026367, 0.007182121276855469, 0.00821995735168457, 0.009257793426513672, 0.010295629501342773, 0.011333465576171875, 0.012371301651000977, 0.013409137725830078, 0.01444697380065918, 0.015484809875488281, 0.016522645950317383, 0.017560482025146484, 0.018598318099975586, 0.019636154174804688, 0.02067399024963379, 0.02171182632446289, 0.022749662399291992, 0.023787498474121094, 0.024825334548950195, 0.025863170623779297, 0.0269010066986084, 0.0279388427734375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 10.0, 18.0, 19.0, 41.0, 54.0, 108.0, 128.0, 130.0, 127.0, 107.0, 87.0, 41.0, 39.0, 21.0, 10.0, 13.0, 5.0, 4.0, 3.0, 6.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3151957392692566, -0.30295446515083313, -0.29071322083473206, -0.2784719467163086, -0.2662307024002075, -0.25398942828178406, -0.2417481541633606, -0.22950689494609833, -0.21726563572883606, -0.2050243765115738, -0.19278311729431152, -0.18054184317588806, -0.1683005839586258, -0.15605932474136353, -0.14381805062294006, -0.1315767914056778, -0.11933553218841553, -0.10709427297115326, -0.0948530063033104, -0.08261173963546753, -0.07037048041820526, -0.058129217475652695, -0.04588795453310013, -0.03364668786525726, -0.021405428647994995, -0.009164165705442429, 0.003077097237110138, 0.015318360179662704, 0.02755962312221527, 0.03980088606476784, 0.052042149007320404, 0.06428341567516327, 0.07652470469474792, 0.08876596391201019, 0.10100723057985306, 0.11324849724769592, 0.1254897564649582, 0.13773101568222046, 0.14997228980064392, 0.1622135490179062, 0.17445480823516846, 0.18669606745243073, 0.198937326669693, 0.21117860078811646, 0.22341986000537872, 0.235661119222641, 0.24790239334106445, 0.2601436376571655, 0.272384911775589, 0.28462618589401245, 0.2968674302101135, 0.309108704328537, 0.32134997844696045, 0.3335912227630615, 0.345832496881485, 0.35807377099990845, 0.3703150153160095, 0.382556289434433, 0.39479753375053406, 0.4070388078689575, 0.4192800521850586, 0.43152132630348206, 0.4437626004219055, 0.4560038447380066, 0.46824511885643005]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 8.0, 3.0, 8.0, 4.0, 13.0, 16.0, 21.0, 18.0, 22.0, 25.0, 27.0, 28.0, 28.0, 34.0, 38.0, 42.0, 60.0, 51.0, 56.0, 61.0, 48.0, 43.0, 45.0, 35.0, 42.0, 30.0, 27.0, 36.0, 20.0, 24.0, 17.0, 17.0, 13.0, 8.0, 5.0, 4.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2096102237701416, -0.20185251533985138, -0.19409479200839996, -0.18633708357810974, -0.17857936024665833, -0.1708216518163681, -0.16306394338607788, -0.15530622005462646, -0.14754851162433624, -0.13979080319404602, -0.1320330798625946, -0.12427537143230438, -0.11651765555143356, -0.10875993967056274, -0.10100223124027252, -0.0932445153594017, -0.08548679947853088, -0.07772908359766006, -0.06997136771678925, -0.06221365928649902, -0.054455943405628204, -0.046698227524757385, -0.038940515369176865, -0.031182803213596344, -0.023425087332725525, -0.015667373314499855, -0.007909659296274185, -0.00015194527804851532, 0.0076057687401771545, 0.015363484621047974, 0.023121196776628494, 0.030878908932209015, 0.038636624813079834, 0.04639434069395065, 0.054152052849531174, 0.061909765005111694, 0.06966748088598251, 0.07742519676685333, 0.08518290519714355, 0.09294062107801437, 0.10069833695888519, 0.10845605283975601, 0.11621376872062683, 0.12397147715091705, 0.13172918558120728, 0.1394869089126587, 0.1472446173429489, 0.15500232577323914, 0.16276004910469055, 0.17051775753498077, 0.1782754808664322, 0.1860331892967224, 0.19379091262817383, 0.20154862105846405, 0.20930632948875427, 0.2170640528202057, 0.2248217612504959, 0.23257946968078613, 0.24033719301223755, 0.24809490144252777, 0.255852609872818, 0.2636103332042694, 0.2713680565357208, 0.27912575006484985, 0.28688347339630127]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 10.0, 6.0, 14.0, 14.0, 15.0, 23.0, 39.0, 74.0, 123.0, 210.0, 409.0, 858.0, 2051.0, 5676.0, 23537.0, 285341.0, 3696853.0, 154864.0, 17028.0, 4377.0, 1493.0, 607.0, 270.0, 148.0, 88.0, 53.0, 24.0, 22.0, 14.0, 15.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1258544921875, -0.12184715270996094, -0.11783981323242188, -0.11383247375488281, -0.10982513427734375, -0.10581779479980469, -0.10181045532226562, -0.09780311584472656, -0.0937957763671875, -0.08978843688964844, -0.08578109741210938, -0.08177375793457031, -0.07776641845703125, -0.07375907897949219, -0.06975173950195312, -0.06574440002441406, -0.061737060546875, -0.05772972106933594, -0.053722381591796875, -0.04971504211425781, -0.04570770263671875, -0.04170036315917969, -0.037693023681640625, -0.03368568420410156, -0.0296783447265625, -0.025671005249023438, -0.021663665771484375, -0.017656326293945312, -0.01364898681640625, -0.009641647338867188, -0.005634307861328125, -0.0016269683837890625, 0.00238037109375, 0.0063877105712890625, 0.010395050048828125, 0.014402389526367188, 0.01840972900390625, 0.022417068481445312, 0.026424407958984375, 0.030431747436523438, 0.0344390869140625, 0.03844642639160156, 0.042453765869140625, 0.04646110534667969, 0.05046844482421875, 0.05447578430175781, 0.058483123779296875, 0.06249046325683594, 0.066497802734375, 0.07050514221191406, 0.07451248168945312, 0.07851982116699219, 0.08252716064453125, 0.08653450012207031, 0.09054183959960938, 0.09454917907714844, 0.0985565185546875, 0.10256385803222656, 0.10657119750976562, 0.11057853698730469, 0.11458587646484375, 0.11859321594238281, 0.12260055541992188, 0.12660789489746094, 0.130615234375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 17.0, 20.0, 35.0, 37.0, 47.0, 53.0, 72.0, 84.0, 61.0, 93.0, 82.0, 76.0, 62.0, 59.0, 36.0, 45.0, 27.0, 20.0, 18.0, 11.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01038360595703125, -0.009979963302612305, -0.00957632064819336, -0.009172677993774414, -0.008769035339355469, -0.008365392684936523, -0.007961750030517578, -0.007558107376098633, -0.0071544647216796875, -0.006750822067260742, -0.006347179412841797, -0.0059435367584228516, -0.005539894104003906, -0.005136251449584961, -0.004732608795166016, -0.00432896614074707, -0.003925323486328125, -0.0035216808319091797, -0.0031180381774902344, -0.002714395523071289, -0.0023107528686523438, -0.0019071102142333984, -0.0015034675598144531, -0.0010998249053955078, -0.0006961822509765625, -0.0002925395965576172, 0.00011110305786132812, 0.0005147457122802734, 0.0009183883666992188, 0.001322031021118164, 0.0017256736755371094, 0.0021293163299560547, 0.002532958984375, 0.0029366016387939453, 0.0033402442932128906, 0.003743886947631836, 0.004147529602050781, 0.0045511722564697266, 0.004954814910888672, 0.005358457565307617, 0.0057621002197265625, 0.006165742874145508, 0.006569385528564453, 0.0069730281829833984, 0.007376670837402344, 0.007780313491821289, 0.008183956146240234, 0.00858759880065918, 0.008991241455078125, 0.00939488410949707, 0.009798526763916016, 0.010202169418334961, 0.010605812072753906, 0.011009454727172852, 0.011413097381591797, 0.011816740036010742, 0.012220382690429688, 0.012624025344848633, 0.013027667999267578, 0.013431310653686523, 0.013834953308105469, 0.014238595962524414, 0.01464223861694336, 0.015045881271362305, 0.01544952392578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 14.0, 11.0, 32.0, 65.0, 101.0, 189.0, 409.0, 1418.0, 7418.0, 245640.0, 3914725.0, 20283.0, 2774.0, 671.0, 258.0, 109.0, 75.0, 42.0, 11.0, 16.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31640625, -0.3074188232421875, -0.298431396484375, -0.2894439697265625, -0.28045654296875, -0.2714691162109375, -0.262481689453125, -0.2534942626953125, -0.2445068359375, -0.2355194091796875, -0.226531982421875, -0.2175445556640625, -0.20855712890625, -0.1995697021484375, -0.190582275390625, -0.1815948486328125, -0.172607421875, -0.1636199951171875, -0.154632568359375, -0.1456451416015625, -0.13665771484375, -0.1276702880859375, -0.118682861328125, -0.1096954345703125, -0.1007080078125, -0.0917205810546875, -0.082733154296875, -0.0737457275390625, -0.06475830078125, -0.0557708740234375, -0.046783447265625, -0.0377960205078125, -0.02880859375, -0.0198211669921875, -0.010833740234375, -0.0018463134765625, 0.00714111328125, 0.0161285400390625, 0.025115966796875, 0.0341033935546875, 0.0430908203125, 0.0520782470703125, 0.061065673828125, 0.0700531005859375, 0.07904052734375, 0.0880279541015625, 0.097015380859375, 0.1060028076171875, 0.114990234375, 0.1239776611328125, 0.132965087890625, 0.1419525146484375, 0.15093994140625, 0.1599273681640625, 0.168914794921875, 0.1779022216796875, 0.1868896484375, 0.1958770751953125, 0.204864501953125, 0.2138519287109375, 0.22283935546875, 0.2318267822265625, 0.240814208984375, 0.2498016357421875, 0.2587890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 10.0, 15.0, 19.0, 42.0, 64.0, 156.0, 377.0, 1019.0, 1366.0, 531.0, 228.0, 96.0, 53.0, 39.0, 19.0, 12.0, 3.0, 9.0, 7.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06488847732543945, -0.0631875991821289, -0.06148672103881836, -0.05978584289550781, -0.058084964752197266, -0.05638408660888672, -0.05468320846557617, -0.052982330322265625, -0.05128145217895508, -0.04958057403564453, -0.047879695892333984, -0.04617881774902344, -0.04447793960571289, -0.042777061462402344, -0.0410761833190918, -0.03937530517578125, -0.0376744270324707, -0.035973548889160156, -0.03427267074584961, -0.03257179260253906, -0.030870914459228516, -0.02917003631591797, -0.027469158172607422, -0.025768280029296875, -0.024067401885986328, -0.02236652374267578, -0.020665645599365234, -0.018964767456054688, -0.01726388931274414, -0.015563011169433594, -0.013862133026123047, -0.0121612548828125, -0.010460376739501953, -0.008759498596191406, -0.007058620452880859, -0.0053577423095703125, -0.0036568641662597656, -0.0019559860229492188, -0.0002551078796386719, 0.001445770263671875, 0.003146648406982422, 0.004847526550292969, 0.006548404693603516, 0.008249282836914062, 0.00995016098022461, 0.011651039123535156, 0.013351917266845703, 0.01505279541015625, 0.016753673553466797, 0.018454551696777344, 0.02015542984008789, 0.021856307983398438, 0.023557186126708984, 0.02525806427001953, 0.026958942413330078, 0.028659820556640625, 0.030360698699951172, 0.03206157684326172, 0.033762454986572266, 0.03546333312988281, 0.03716421127319336, 0.038865089416503906, 0.04056596755981445, 0.042266845703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [6.0, 21.0, 237.0, 654.0, 88.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14179199934005737, -0.09927183389663696, -0.05675167590379715, -0.014231517910957336, 0.028288647532463074, 0.07080881297588348, 0.1133289635181427, 0.1558491289615631, 0.19836929440498352, 0.24088945984840393, 0.28340962529182434, 0.32592976093292236, 0.3684499263763428, 0.4109700918197632, 0.4534902572631836, 0.496010422706604, 0.5385305881500244, 0.5810507535934448, 0.6235709190368652, 0.6660910844802856, 0.708611249923706, 0.7511314153671265, 0.7936515808105469, 0.8361717462539673, 0.8786919116973877, 0.9212120771408081, 0.9637322425842285, 1.006252408027649, 1.0487725734710693, 1.0912927389144897, 1.1338129043579102, 1.1763330698013306, 1.2188531160354614, 1.2613732814788818, 1.3038934469223022, 1.3464136123657227, 1.388933777809143, 1.4314539432525635, 1.4739741086959839, 1.5164942741394043, 1.5590144395828247, 1.6015346050262451, 1.6440547704696655, 1.686574935913086, 1.7290951013565063, 1.7716152667999268, 1.8141354322433472, 1.8566555976867676, 1.8991756439208984, 1.9416958093643188, 1.9842159748077393, 2.02673602104187, 2.06925630569458, 2.111776351928711, 2.154296636581421, 2.1968166828155518, 2.2393369674682617, 2.2818570137023926, 2.3243772983551025, 2.3668973445892334, 2.4094176292419434, 2.451937675476074, 2.494457960128784, 2.536978006362915, 2.579498291015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 10.0, 14.0, 19.0, 19.0, 19.0, 34.0, 27.0, 32.0, 40.0, 44.0, 60.0, 71.0, 58.0, 64.0, 54.0, 62.0, 65.0, 54.0, 55.0, 42.0, 29.0, 29.0, 23.0, 14.0, 18.0, 11.0, 7.0, 5.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.16993248462677002, -0.16450616717338562, -0.15907984972000122, -0.15365353226661682, -0.14822722971439362, -0.14280091226100922, -0.13737459480762482, -0.13194827735424042, -0.1265219748020172, -0.12109565734863281, -0.11566934734582901, -0.11024302989244461, -0.10481671988964081, -0.09939040243625641, -0.09396408498287201, -0.08853776752948761, -0.08311145007610321, -0.07768513262271881, -0.07225882261991501, -0.06683250516653061, -0.06140619143843651, -0.05597987771034241, -0.05055356025695801, -0.04512724652886391, -0.039700932800769806, -0.034274619072675705, -0.028848303481936455, -0.023421987891197205, -0.017995674163103104, -0.012569360435009003, -0.007143042981624603, -0.0017167292535305023, 0.0037095844745635986, 0.009135899133980274, 0.01456221379339695, 0.0199885293841362, 0.0254148431122303, 0.030841156840324402, 0.0362674742937088, 0.0416937880218029, 0.047120101749897, 0.052546415477991104, 0.057972729206085205, 0.0633990466594696, 0.068825364112854, 0.0742516741156578, 0.0796779915690422, 0.08510430157184601, 0.09053061902523041, 0.09595693647861481, 0.10138324648141861, 0.10680956393480301, 0.11223587393760681, 0.11766219139099121, 0.12308850884437561, 0.12851482629776, 0.1339411437511444, 0.1393674612045288, 0.1447937786579132, 0.1502200961112976, 0.1556463986635208, 0.1610727161169052, 0.1664990335702896, 0.171925351023674, 0.17735165357589722]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 8.0, 12.0, 18.0, 31.0, 30.0, 45.0, 66.0, 96.0, 180.0, 327.0, 702.0, 1578.0, 4902.0, 22973.0, 191342.0, 658964.0, 142259.0, 18139.0, 4076.0, 1397.0, 605.0, 309.0, 166.0, 84.0, 79.0, 50.0, 26.0, 20.0, 13.0, 11.0, 7.0, 9.0, 10.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1243896484375, -0.1208791732788086, -0.11736869812011719, -0.11385822296142578, -0.11034774780273438, -0.10683727264404297, -0.10332679748535156, -0.09981632232666016, -0.09630584716796875, -0.09279537200927734, -0.08928489685058594, -0.08577442169189453, -0.08226394653320312, -0.07875347137451172, -0.07524299621582031, -0.0717325210571289, -0.0682220458984375, -0.0647115707397461, -0.06120109558105469, -0.05769062042236328, -0.054180145263671875, -0.05066967010498047, -0.04715919494628906, -0.043648719787597656, -0.04013824462890625, -0.036627769470214844, -0.03311729431152344, -0.02960681915283203, -0.026096343994140625, -0.02258586883544922, -0.019075393676757812, -0.015564918518066406, -0.012054443359375, -0.008543968200683594, -0.0050334930419921875, -0.0015230178833007812, 0.001987457275390625, 0.005497932434082031, 0.009008407592773438, 0.012518882751464844, 0.01602935791015625, 0.019539833068847656, 0.023050308227539062, 0.02656078338623047, 0.030071258544921875, 0.03358173370361328, 0.03709220886230469, 0.040602684020996094, 0.0441131591796875, 0.047623634338378906, 0.05113410949707031, 0.05464458465576172, 0.058155059814453125, 0.06166553497314453, 0.06517601013183594, 0.06868648529052734, 0.07219696044921875, 0.07570743560791016, 0.07921791076660156, 0.08272838592529297, 0.08623886108398438, 0.08974933624267578, 0.09325981140136719, 0.0967702865600586, 0.10028076171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 18.0, 19.0, 39.0, 49.0, 60.0, 79.0, 92.0, 92.0, 104.0, 79.0, 76.0, 82.0, 42.0, 51.0, 35.0, 18.0, 17.0, 12.0, 5.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01203155517578125, -0.011542201042175293, -0.011052846908569336, -0.010563492774963379, -0.010074138641357422, -0.009584784507751465, -0.009095430374145508, -0.00860607624053955, -0.008116722106933594, -0.007627367973327637, -0.00713801383972168, -0.006648659706115723, -0.006159305572509766, -0.005669951438903809, -0.0051805973052978516, -0.0046912431716918945, -0.0042018890380859375, -0.0037125349044799805, -0.0032231807708740234, -0.0027338266372680664, -0.0022444725036621094, -0.0017551183700561523, -0.0012657642364501953, -0.0007764101028442383, -0.00028705596923828125, 0.00020229816436767578, 0.0006916522979736328, 0.0011810064315795898, 0.0016703605651855469, 0.002159714698791504, 0.002649068832397461, 0.003138422966003418, 0.003627777099609375, 0.004117131233215332, 0.004606485366821289, 0.005095839500427246, 0.005585193634033203, 0.00607454776763916, 0.006563901901245117, 0.007053256034851074, 0.007542610168457031, 0.008031964302062988, 0.008521318435668945, 0.009010672569274902, 0.00950002670288086, 0.009989380836486816, 0.010478734970092773, 0.01096808910369873, 0.011457443237304688, 0.011946797370910645, 0.012436151504516602, 0.012925505638122559, 0.013414859771728516, 0.013904213905334473, 0.01439356803894043, 0.014882922172546387, 0.015372276306152344, 0.0158616304397583, 0.016350984573364258, 0.016840338706970215, 0.017329692840576172, 0.01781904697418213, 0.018308401107788086, 0.018797755241394043, 0.019287109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 12.0, 18.0, 22.0, 27.0, 50.0, 57.0, 98.0, 141.0, 208.0, 355.0, 575.0, 1056.0, 2091.0, 4527.0, 11582.0, 30376.0, 84406.0, 207658.0, 327288.0, 227012.0, 93941.0, 34286.0, 12786.0, 5120.0, 2201.0, 1046.0, 541.0, 351.0, 236.0, 148.0, 107.0, 69.0, 55.0, 32.0, 21.0, 10.0, 8.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0], "bins": [-0.04461669921875, -0.043459415435791016, -0.04230213165283203, -0.04114484786987305, -0.03998756408691406, -0.03883028030395508, -0.037672996520996094, -0.03651571273803711, -0.035358428955078125, -0.03420114517211914, -0.033043861389160156, -0.03188657760620117, -0.030729293823242188, -0.029572010040283203, -0.02841472625732422, -0.027257442474365234, -0.02610015869140625, -0.024942874908447266, -0.02378559112548828, -0.022628307342529297, -0.021471023559570312, -0.020313739776611328, -0.019156455993652344, -0.01799917221069336, -0.016841888427734375, -0.01568460464477539, -0.014527320861816406, -0.013370037078857422, -0.012212753295898438, -0.011055469512939453, -0.009898185729980469, -0.008740901947021484, -0.0075836181640625, -0.006426334381103516, -0.005269050598144531, -0.004111766815185547, -0.0029544830322265625, -0.0017971992492675781, -0.0006399154663085938, 0.0005173683166503906, 0.001674652099609375, 0.0028319358825683594, 0.003989219665527344, 0.005146503448486328, 0.0063037872314453125, 0.007461071014404297, 0.008618354797363281, 0.009775638580322266, 0.01093292236328125, 0.012090206146240234, 0.013247489929199219, 0.014404773712158203, 0.015562057495117188, 0.016719341278076172, 0.017876625061035156, 0.01903390884399414, 0.020191192626953125, 0.02134847640991211, 0.022505760192871094, 0.023663043975830078, 0.024820327758789062, 0.025977611541748047, 0.02713489532470703, 0.028292179107666016, 0.029449462890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 6.0, 6.0, 19.0, 16.0, 12.0, 31.0, 21.0, 14.0, 24.0, 36.0, 30.0, 40.0, 37.0, 42.0, 46.0, 50.0, 55.0, 41.0, 36.0, 43.0, 46.0, 46.0, 42.0, 44.0, 29.0, 29.0, 16.0, 15.0, 25.0, 21.0, 13.0, 17.0, 8.0, 16.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029083251953125, -0.027897357940673828, -0.026711463928222656, -0.025525569915771484, -0.024339675903320312, -0.02315378189086914, -0.02196788787841797, -0.020781993865966797, -0.019596099853515625, -0.018410205841064453, -0.01722431182861328, -0.01603841781616211, -0.014852523803710938, -0.013666629791259766, -0.012480735778808594, -0.011294841766357422, -0.01010894775390625, -0.008923053741455078, -0.007737159729003906, -0.006551265716552734, -0.0053653717041015625, -0.004179477691650391, -0.0029935836791992188, -0.0018076896667480469, -0.000621795654296875, 0.0005640983581542969, 0.0017499923706054688, 0.0029358863830566406, 0.0041217803955078125, 0.005307674407958984, 0.006493568420410156, 0.007679462432861328, 0.0088653564453125, 0.010051250457763672, 0.011237144470214844, 0.012423038482666016, 0.013608932495117188, 0.01479482650756836, 0.01598072052001953, 0.017166614532470703, 0.018352508544921875, 0.019538402557373047, 0.02072429656982422, 0.02191019058227539, 0.023096084594726562, 0.024281978607177734, 0.025467872619628906, 0.026653766632080078, 0.02783966064453125, 0.029025554656982422, 0.030211448669433594, 0.031397342681884766, 0.03258323669433594, 0.03376913070678711, 0.03495502471923828, 0.03614091873168945, 0.037326812744140625, 0.0385127067565918, 0.03969860076904297, 0.04088449478149414, 0.04207038879394531, 0.043256282806396484, 0.044442176818847656, 0.04562807083129883, 0.04681396484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 15.0, 13.0, 21.0, 41.0, 51.0, 77.0, 130.0, 241.0, 414.0, 875.0, 1780.0, 5211.0, 22245.0, 165385.0, 594027.0, 219093.0, 28638.0, 6136.0, 2134.0, 953.0, 450.0, 257.0, 140.0, 96.0, 44.0, 22.0, 17.0, 16.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.025421142578125, -0.02453136444091797, -0.023641586303710938, -0.022751808166503906, -0.021862030029296875, -0.020972251892089844, -0.020082473754882812, -0.01919269561767578, -0.01830291748046875, -0.01741313934326172, -0.016523361206054688, -0.015633583068847656, -0.014743804931640625, -0.013854026794433594, -0.012964248657226562, -0.012074470520019531, -0.0111846923828125, -0.010294914245605469, -0.009405136108398438, -0.008515357971191406, -0.007625579833984375, -0.006735801696777344, -0.0058460235595703125, -0.004956245422363281, -0.00406646728515625, -0.0031766891479492188, -0.0022869110107421875, -0.0013971328735351562, -0.000507354736328125, 0.00038242340087890625, 0.0012722015380859375, 0.0021619796752929688, 0.0030517578125, 0.003941535949707031, 0.0048313140869140625, 0.005721092224121094, 0.006610870361328125, 0.007500648498535156, 0.008390426635742188, 0.009280204772949219, 0.01016998291015625, 0.011059761047363281, 0.011949539184570312, 0.012839317321777344, 0.013729095458984375, 0.014618873596191406, 0.015508651733398438, 0.01639842987060547, 0.0172882080078125, 0.01817798614501953, 0.019067764282226562, 0.019957542419433594, 0.020847320556640625, 0.021737098693847656, 0.022626876831054688, 0.02351665496826172, 0.02440643310546875, 0.02529621124267578, 0.026185989379882812, 0.027075767517089844, 0.027965545654296875, 0.028855323791503906, 0.029745101928710938, 0.03063488006591797, 0.031524658203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 8.0, 16.0, 22.0, 23.0, 44.0, 56.0, 65.0, 55.0, 80.0, 84.0, 73.0, 75.0, 89.0, 65.0, 76.0, 35.0, 34.0, 35.0, 21.0, 14.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.867813110351562e-06, -7.6070427894592285e-06, -7.3462724685668945e-06, -7.0855021476745605e-06, -6.8247318267822266e-06, -6.563961505889893e-06, -6.303191184997559e-06, -6.042420864105225e-06, -5.781650543212891e-06, -5.520880222320557e-06, -5.260109901428223e-06, -4.999339580535889e-06, -4.738569259643555e-06, -4.477798938751221e-06, -4.217028617858887e-06, -3.956258296966553e-06, -3.6954879760742188e-06, -3.4347176551818848e-06, -3.1739473342895508e-06, -2.913177013397217e-06, -2.652406692504883e-06, -2.391636371612549e-06, -2.130866050720215e-06, -1.8700957298278809e-06, -1.6093254089355469e-06, -1.3485550880432129e-06, -1.087784767150879e-06, -8.270144462585449e-07, -5.662441253662109e-07, -3.0547380447387695e-07, -4.470348358154297e-08, 2.1606683731079102e-07, 4.76837158203125e-07, 7.37607479095459e-07, 9.98377799987793e-07, 1.259148120880127e-06, 1.519918441772461e-06, 1.780688762664795e-06, 2.041459083557129e-06, 2.302229404449463e-06, 2.562999725341797e-06, 2.823770046234131e-06, 3.084540367126465e-06, 3.345310688018799e-06, 3.606081008911133e-06, 3.866851329803467e-06, 4.127621650695801e-06, 4.388391971588135e-06, 4.649162292480469e-06, 4.909932613372803e-06, 5.170702934265137e-06, 5.431473255157471e-06, 5.692243576049805e-06, 5.953013896942139e-06, 6.213784217834473e-06, 6.474554538726807e-06, 6.735324859619141e-06, 6.996095180511475e-06, 7.256865501403809e-06, 7.517635822296143e-06, 7.778406143188477e-06, 8.03917646408081e-06, 8.299946784973145e-06, 8.560717105865479e-06, 8.821487426757812e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 7.0, 13.0, 27.0, 23.0, 42.0, 58.0, 101.0, 160.0, 317.0, 510.0, 1196.0, 2973.0, 8626.0, 33335.0, 157421.0, 475088.0, 284064.0, 62344.0, 14513.0, 4373.0, 1635.0, 778.0, 359.0, 225.0, 111.0, 72.0, 44.0, 38.0, 23.0, 18.0, 10.0, 12.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0241851806640625, -0.023488283157348633, -0.022791385650634766, -0.0220944881439209, -0.02139759063720703, -0.020700693130493164, -0.020003795623779297, -0.01930689811706543, -0.018610000610351562, -0.017913103103637695, -0.017216205596923828, -0.01651930809020996, -0.015822410583496094, -0.015125513076782227, -0.01442861557006836, -0.013731718063354492, -0.013034820556640625, -0.012337923049926758, -0.01164102554321289, -0.010944128036499023, -0.010247230529785156, -0.009550333023071289, -0.008853435516357422, -0.008156538009643555, -0.0074596405029296875, -0.00676274299621582, -0.006065845489501953, -0.005368947982788086, -0.004672050476074219, -0.0039751529693603516, -0.0032782554626464844, -0.002581357955932617, -0.00188446044921875, -0.0011875629425048828, -0.0004906654357910156, 0.00020623207092285156, 0.0009031295776367188, 0.001600027084350586, 0.002296924591064453, 0.0029938220977783203, 0.0036907196044921875, 0.004387617111206055, 0.005084514617919922, 0.005781412124633789, 0.006478309631347656, 0.0071752071380615234, 0.00787210464477539, 0.008569002151489258, 0.009265899658203125, 0.009962797164916992, 0.01065969467163086, 0.011356592178344727, 0.012053489685058594, 0.012750387191772461, 0.013447284698486328, 0.014144182205200195, 0.014841079711914062, 0.01553797721862793, 0.016234874725341797, 0.016931772232055664, 0.01762866973876953, 0.0183255672454834, 0.019022464752197266, 0.019719362258911133, 0.020416259765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 10.0, 18.0, 13.0, 16.0, 20.0, 27.0, 42.0, 47.0, 80.0, 93.0, 93.0, 89.0, 87.0, 75.0, 82.0, 55.0, 34.0, 29.0, 23.0, 20.0, 17.0, 6.0, 6.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02972412109375, -0.02893233299255371, -0.028140544891357422, -0.027348756790161133, -0.026556968688964844, -0.025765180587768555, -0.024973392486572266, -0.024181604385375977, -0.023389816284179688, -0.0225980281829834, -0.02180624008178711, -0.02101445198059082, -0.02022266387939453, -0.019430875778198242, -0.018639087677001953, -0.017847299575805664, -0.017055511474609375, -0.016263723373413086, -0.015471935272216797, -0.014680147171020508, -0.013888359069824219, -0.01309657096862793, -0.01230478286743164, -0.011512994766235352, -0.010721206665039062, -0.009929418563842773, -0.009137630462646484, -0.008345842361450195, -0.007554054260253906, -0.006762266159057617, -0.005970478057861328, -0.005178689956665039, -0.00438690185546875, -0.003595113754272461, -0.002803325653076172, -0.002011537551879883, -0.0012197494506835938, -0.0004279613494873047, 0.0003638267517089844, 0.0011556148529052734, 0.0019474029541015625, 0.0027391910552978516, 0.0035309791564941406, 0.00432276725769043, 0.005114555358886719, 0.005906343460083008, 0.006698131561279297, 0.007489919662475586, 0.008281707763671875, 0.009073495864868164, 0.009865283966064453, 0.010657072067260742, 0.011448860168457031, 0.01224064826965332, 0.01303243637084961, 0.013824224472045898, 0.014616012573242188, 0.015407800674438477, 0.016199588775634766, 0.016991376876831055, 0.017783164978027344, 0.018574953079223633, 0.019366741180419922, 0.02015852928161621, 0.0209503173828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 13.0, 11.0, 33.0, 74.0, 172.0, 271.0, 213.0, 127.0, 56.0, 27.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43683022260665894, -0.4168679118156433, -0.3969055712223053, -0.3769432604312897, -0.35698091983795166, -0.33701860904693604, -0.3170562982559204, -0.2970939874649048, -0.2771316468715668, -0.25716933608055115, -0.23720699548721313, -0.2172446846961975, -0.1972823590040207, -0.17732003331184387, -0.15735772252082825, -0.13739539682865143, -0.11743307113647461, -0.09747074544429779, -0.07750842720270157, -0.05754610523581505, -0.03758378326892853, -0.01762145757675171, 0.002340860664844513, 0.022303178906440735, 0.042265504598617554, 0.062227826565504074, 0.0821901485323906, 0.10215246677398682, 0.12211479246616364, 0.14207711815834045, 0.16203942894935608, 0.1820017546415329, 0.2019641399383545, 0.2219264656305313, 0.24188879132270813, 0.26185110211372375, 0.28181344270706177, 0.3017757534980774, 0.321738064289093, 0.34170037508010864, 0.36166271567344666, 0.3816250264644623, 0.4015873670578003, 0.4215496778488159, 0.44151198863983154, 0.46147432923316956, 0.4814366400241852, 0.5013989806175232, 0.5213612914085388, 0.5413236021995544, 0.5612859129905701, 0.5812482833862305, 0.6012105941772461, 0.6211729049682617, 0.6411352157592773, 0.661097526550293, 0.6810598373413086, 0.7010221481323242, 0.7209844589233398, 0.7409468293190002, 0.7609091401100159, 0.7808714509010315, 0.8008337616920471, 0.8207960724830627, 0.8407584428787231]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 8.0, 9.0, 4.0, 7.0, 16.0, 13.0, 22.0, 26.0, 33.0, 30.0, 32.0, 30.0, 50.0, 44.0, 60.0, 51.0, 54.0, 56.0, 48.0, 55.0, 53.0, 44.0, 37.0, 43.0, 31.0, 27.0, 19.0, 17.0, 18.0, 14.0, 10.0, 13.0, 11.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.27434688806533813, -0.2668404281139374, -0.2593339681625366, -0.25182750821113586, -0.2443210333585739, -0.23681457340717316, -0.2293081134557724, -0.22180165350437164, -0.2142951786518097, -0.20678871870040894, -0.19928225874900818, -0.19177579879760742, -0.18426932394504547, -0.17676286399364471, -0.16925640404224396, -0.1617499440908432, -0.15424348413944244, -0.1467370241880417, -0.13923056423664093, -0.13172408938407898, -0.12421762943267822, -0.11671116948127747, -0.10920470952987671, -0.10169824957847595, -0.0941917821764946, -0.08668532222509384, -0.07917885482311249, -0.07167239487171173, -0.06416593492031097, -0.05665946751832962, -0.049153007566928864, -0.04164654389023781, -0.03414008021354675, -0.026633616536855698, -0.01912715472280979, -0.011620692908763885, -0.00411422923207283, 0.003392234444618225, 0.010898694396018982, 0.018405158072710037, 0.025911621749401093, 0.03341808542609215, 0.0409245491027832, 0.04843100905418396, 0.055937472730875015, 0.06344393640756607, 0.07095039635896683, 0.07845686376094818, 0.08596332371234894, 0.0934697836637497, 0.10097625106573105, 0.1084827110171318, 0.11598917841911316, 0.12349563837051392, 0.13100209832191467, 0.13850855827331543, 0.1460150182247162, 0.15352147817611694, 0.1610279381275177, 0.16853439807891846, 0.1760408729314804, 0.18354733288288116, 0.19105379283428192, 0.19856025278568268, 0.20606672763824463]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 6.0, 9.0, 15.0, 26.0, 43.0, 97.0, 132.0, 318.0, 912.0, 3138.0, 24242.0, 2001028.0, 2135345.0, 24480.0, 3183.0, 779.0, 271.0, 126.0, 55.0, 36.0, 14.0, 10.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08306884765625, -0.07929325103759766, -0.07551765441894531, -0.07174205780029297, -0.06796646118164062, -0.06419086456298828, -0.06041526794433594, -0.056639671325683594, -0.05286407470703125, -0.049088478088378906, -0.04531288146972656, -0.04153728485107422, -0.037761688232421875, -0.03398609161376953, -0.030210494995117188, -0.026434898376464844, -0.0226593017578125, -0.018883705139160156, -0.015108108520507812, -0.011332511901855469, -0.007556915283203125, -0.0037813186645507812, -5.7220458984375e-06, 0.0037698745727539062, 0.00754547119140625, 0.011321067810058594, 0.015096664428710938, 0.01887226104736328, 0.022647857666015625, 0.02642345428466797, 0.030199050903320312, 0.033974647521972656, 0.037750244140625, 0.041525840759277344, 0.04530143737792969, 0.04907703399658203, 0.052852630615234375, 0.05662822723388672, 0.06040382385253906, 0.0641794204711914, 0.06795501708984375, 0.0717306137084961, 0.07550621032714844, 0.07928180694580078, 0.08305740356445312, 0.08683300018310547, 0.09060859680175781, 0.09438419342041016, 0.0981597900390625, 0.10193538665771484, 0.10571098327636719, 0.10948657989501953, 0.11326217651367188, 0.11703777313232422, 0.12081336975097656, 0.1245889663696289, 0.12836456298828125, 0.1321401596069336, 0.13591575622558594, 0.13969135284423828, 0.14346694946289062, 0.14724254608154297, 0.1510181427001953, 0.15479373931884766, 0.1585693359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 18.0, 16.0, 21.0, 47.0, 49.0, 57.0, 70.0, 83.0, 86.0, 85.0, 87.0, 66.0, 74.0, 54.0, 55.0, 36.0, 23.0, 25.0, 9.0, 5.0, 9.0, 6.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01120758056640625, -0.010733723640441895, -0.010259866714477539, -0.009786009788513184, -0.009312152862548828, -0.008838295936584473, -0.008364439010620117, -0.007890582084655762, -0.007416725158691406, -0.006942868232727051, -0.006469011306762695, -0.00599515438079834, -0.005521297454833984, -0.005047440528869629, -0.0045735836029052734, -0.004099726676940918, -0.0036258697509765625, -0.003152012825012207, -0.0026781558990478516, -0.002204298973083496, -0.0017304420471191406, -0.0012565851211547852, -0.0007827281951904297, -0.0003088712692260742, 0.00016498565673828125, 0.0006388425827026367, 0.0011126995086669922, 0.0015865564346313477, 0.002060413360595703, 0.0025342702865600586, 0.003008127212524414, 0.0034819841384887695, 0.003955841064453125, 0.0044296979904174805, 0.004903554916381836, 0.005377411842346191, 0.005851268768310547, 0.006325125694274902, 0.006798982620239258, 0.007272839546203613, 0.007746696472167969, 0.008220553398132324, 0.00869441032409668, 0.009168267250061035, 0.00964212417602539, 0.010115981101989746, 0.010589838027954102, 0.011063694953918457, 0.011537551879882812, 0.012011408805847168, 0.012485265731811523, 0.012959122657775879, 0.013432979583740234, 0.01390683650970459, 0.014380693435668945, 0.0148545503616333, 0.015328407287597656, 0.01580226421356201, 0.016276121139526367, 0.016749978065490723, 0.017223834991455078, 0.017697691917419434, 0.01817154884338379, 0.018645405769348145, 0.0191192626953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 6.0, 13.0, 11.0, 25.0, 32.0, 42.0, 58.0, 107.0, 185.0, 319.0, 846.0, 5802.0, 636057.0, 3535578.0, 12776.0, 1295.0, 473.0, 253.0, 97.0, 95.0, 65.0, 39.0, 24.0, 25.0, 19.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1627197265625, -0.15713119506835938, -0.15154266357421875, -0.14595413208007812, -0.1403656005859375, -0.13477706909179688, -0.12918853759765625, -0.12360000610351562, -0.118011474609375, -0.11242294311523438, -0.10683441162109375, -0.10124588012695312, -0.0956573486328125, -0.09006881713867188, -0.08448028564453125, -0.07889175415039062, -0.07330322265625, -0.06771469116210938, -0.06212615966796875, -0.056537628173828125, -0.0509490966796875, -0.045360565185546875, -0.03977203369140625, -0.034183502197265625, -0.028594970703125, -0.023006439208984375, -0.01741790771484375, -0.011829376220703125, -0.0062408447265625, -0.000652313232421875, 0.00493621826171875, 0.010524749755859375, 0.01611328125, 0.021701812744140625, 0.02729034423828125, 0.032878875732421875, 0.0384674072265625, 0.044055938720703125, 0.04964447021484375, 0.055233001708984375, 0.060821533203125, 0.06641006469726562, 0.07199859619140625, 0.07758712768554688, 0.0831756591796875, 0.08876419067382812, 0.09435272216796875, 0.09994125366210938, 0.10552978515625, 0.11111831665039062, 0.11670684814453125, 0.12229537963867188, 0.1278839111328125, 0.13347244262695312, 0.13906097412109375, 0.14464950561523438, 0.150238037109375, 0.15582656860351562, 0.16141510009765625, 0.16700363159179688, 0.1725921630859375, 0.17818069458007812, 0.18376922607421875, 0.18935775756835938, 0.1949462890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 22.0, 30.0, 58.0, 116.0, 221.0, 452.0, 973.0, 1135.0, 478.0, 240.0, 136.0, 78.0, 36.0, 33.0, 12.0, 12.0, 8.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171051025390625, -0.01620793342590332, -0.01531076431274414, -0.014413595199584961, -0.013516426086425781, -0.012619256973266602, -0.011722087860107422, -0.010824918746948242, -0.009927749633789062, -0.009030580520629883, -0.008133411407470703, -0.0072362422943115234, -0.006339073181152344, -0.005441904067993164, -0.004544734954833984, -0.0036475658416748047, -0.002750396728515625, -0.0018532276153564453, -0.0009560585021972656, -5.888938903808594e-05, 0.0008382797241210938, 0.0017354488372802734, 0.002632617950439453, 0.003529787063598633, 0.0044269561767578125, 0.005324125289916992, 0.006221294403076172, 0.0071184635162353516, 0.008015632629394531, 0.008912801742553711, 0.00980997085571289, 0.01070713996887207, 0.01160430908203125, 0.01250147819519043, 0.01339864730834961, 0.014295816421508789, 0.015192985534667969, 0.01609015464782715, 0.016987323760986328, 0.017884492874145508, 0.018781661987304688, 0.019678831100463867, 0.020576000213623047, 0.021473169326782227, 0.022370338439941406, 0.023267507553100586, 0.024164676666259766, 0.025061845779418945, 0.025959014892578125, 0.026856184005737305, 0.027753353118896484, 0.028650522232055664, 0.029547691345214844, 0.030444860458374023, 0.0313420295715332, 0.03223919868469238, 0.03313636779785156, 0.03403353691101074, 0.03493070602416992, 0.0358278751373291, 0.03672504425048828, 0.03762221336364746, 0.03851938247680664, 0.03941655158996582, 0.040313720703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 8.0, 55.0, 650.0, 268.0, 17.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6331230401992798, -0.6052417755126953, -0.5773605108261108, -0.5494791865348816, -0.5215979218482971, -0.49371665716171265, -0.4658353924751282, -0.4379540979862213, -0.41007280349731445, -0.38219153881073, -0.3543102443218231, -0.32642897963523865, -0.2985476851463318, -0.2706664204597473, -0.24278514087200165, -0.21490386128425598, -0.1870225965976715, -0.15914131700992584, -0.13126003742218018, -0.1033787652850151, -0.07549748569726944, -0.04761621356010437, -0.019734933972358704, 0.008146345615386963, 0.03602762520313263, 0.0639089047908783, 0.09179018437862396, 0.11967145651578903, 0.1475527286529541, 0.17543400824069977, 0.20331528782844543, 0.2311965674161911, 0.25907784700393677, 0.28695911169052124, 0.3148404061794281, 0.3427216708660126, 0.37060296535491943, 0.3984842300415039, 0.4263654947280884, 0.45424678921699524, 0.4821280837059021, 0.5100093483924866, 0.537890613079071, 0.5657719373703003, 0.5936532020568848, 0.6215344667434692, 0.6494157314300537, 0.6772969961166382, 0.7051782608032227, 0.7330595254898071, 0.7609407901763916, 0.7888221144676208, 0.8167033791542053, 0.8445846438407898, 0.8724659085273743, 0.9003472328186035, 0.928228497505188, 0.9561097621917725, 0.9839910268783569, 1.0118722915649414, 1.0397535562515259, 1.0676348209381104, 1.0955162048339844, 1.1233974695205688, 1.1512787342071533]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 15.0, 20.0, 25.0, 29.0, 33.0, 39.0, 53.0, 50.0, 38.0, 52.0, 52.0, 60.0, 65.0, 63.0, 58.0, 44.0, 61.0, 40.0, 34.0, 35.0, 32.0, 13.0, 12.0, 14.0, 10.0, 3.0, 7.0, 9.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10619121789932251, -0.10272591561079025, -0.099260613322258, -0.09579531848430634, -0.09233001619577408, -0.08886471390724182, -0.08539941906929016, -0.0819341167807579, -0.07846881449222565, -0.07500351220369339, -0.07153820991516113, -0.06807291507720947, -0.06460761278867722, -0.06114231050014496, -0.057677011936903, -0.05421171337366104, -0.050746411085128784, -0.04728110879659653, -0.04381581023335457, -0.04035051167011261, -0.03688520938158035, -0.033419907093048096, -0.029954608529806137, -0.02648930810391903, -0.02302400767803192, -0.019558707252144814, -0.016093406826257706, -0.012628106400370598, -0.00916280597448349, -0.005697505548596382, -0.0022322051227092743, 0.0012330953031778336, 0.004698395729064941, 0.00816369615495205, 0.011628996580839157, 0.015094297006726265, 0.018559597432613373, 0.02202489785850048, 0.02549019828438759, 0.028955498710274696, 0.032420799136161804, 0.03588610142469406, 0.03935139998793602, 0.04281669855117798, 0.046282000839710236, 0.04974730312824249, 0.05321260169148445, 0.05667790025472641, 0.06014320254325867, 0.06360850483179092, 0.06707380712032318, 0.07053910195827484, 0.0740044042468071, 0.07746970653533936, 0.08093500137329102, 0.08440030366182327, 0.08786560595035553, 0.09133090823888779, 0.09479621052742004, 0.0982615053653717, 0.10172680765390396, 0.10519210994243622, 0.10865740478038788, 0.11212270706892014, 0.11558800935745239]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 9.0, 16.0, 14.0, 15.0, 24.0, 34.0, 45.0, 87.0, 140.0, 188.0, 381.0, 625.0, 1211.0, 2592.0, 6523.0, 21766.0, 90402.0, 336877.0, 413720.0, 128931.0, 29920.0, 8575.0, 3132.0, 1436.0, 737.0, 415.0, 248.0, 171.0, 109.0, 77.0, 28.0, 27.0, 20.0, 11.0, 14.0, 5.0, 5.0, 3.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062225341796875, -0.0602259635925293, -0.058226585388183594, -0.05622720718383789, -0.05422782897949219, -0.052228450775146484, -0.05022907257080078, -0.04822969436645508, -0.046230316162109375, -0.04423093795776367, -0.04223155975341797, -0.040232181549072266, -0.03823280334472656, -0.03623342514038086, -0.034234046936035156, -0.03223466873168945, -0.03023529052734375, -0.028235912322998047, -0.026236534118652344, -0.02423715591430664, -0.022237777709960938, -0.020238399505615234, -0.01823902130126953, -0.016239643096923828, -0.014240264892578125, -0.012240886688232422, -0.010241508483886719, -0.008242130279541016, -0.0062427520751953125, -0.004243373870849609, -0.0022439956665039062, -0.0002446174621582031, 0.0017547607421875, 0.003754138946533203, 0.005753517150878906, 0.007752895355224609, 0.009752273559570312, 0.011751651763916016, 0.013751029968261719, 0.015750408172607422, 0.017749786376953125, 0.019749164581298828, 0.02174854278564453, 0.023747920989990234, 0.025747299194335938, 0.02774667739868164, 0.029746055603027344, 0.03174543380737305, 0.03374481201171875, 0.03574419021606445, 0.037743568420410156, 0.03974294662475586, 0.04174232482910156, 0.043741703033447266, 0.04574108123779297, 0.04774045944213867, 0.049739837646484375, 0.05173921585083008, 0.05373859405517578, 0.055737972259521484, 0.05773735046386719, 0.05973672866821289, 0.061736106872558594, 0.0637354850769043, 0.06573486328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 9.0, 10.0, 12.0, 15.0, 30.0, 25.0, 42.0, 53.0, 73.0, 75.0, 80.0, 78.0, 85.0, 72.0, 71.0, 66.0, 59.0, 36.0, 37.0, 20.0, 14.0, 14.0, 10.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01166534423828125, -0.011181235313415527, -0.010697126388549805, -0.010213017463684082, -0.00972890853881836, -0.009244799613952637, -0.008760690689086914, -0.008276581764221191, -0.007792472839355469, -0.007308363914489746, -0.0068242549896240234, -0.006340146064758301, -0.005856037139892578, -0.0053719282150268555, -0.004887819290161133, -0.00440371036529541, -0.0039196014404296875, -0.003435492515563965, -0.002951383590698242, -0.0024672746658325195, -0.001983165740966797, -0.0014990568161010742, -0.0010149478912353516, -0.0005308389663696289, -4.673004150390625e-05, 0.0004373788833618164, 0.0009214878082275391, 0.0014055967330932617, 0.0018897056579589844, 0.002373814582824707, 0.0028579235076904297, 0.0033420324325561523, 0.003826141357421875, 0.004310250282287598, 0.00479435920715332, 0.005278468132019043, 0.005762577056884766, 0.006246685981750488, 0.006730794906616211, 0.007214903831481934, 0.007699012756347656, 0.008183121681213379, 0.008667230606079102, 0.009151339530944824, 0.009635448455810547, 0.01011955738067627, 0.010603666305541992, 0.011087775230407715, 0.011571884155273438, 0.01205599308013916, 0.012540102005004883, 0.013024210929870605, 0.013508319854736328, 0.01399242877960205, 0.014476537704467773, 0.014960646629333496, 0.015444755554199219, 0.01592886447906494, 0.016412973403930664, 0.016897082328796387, 0.01738119125366211, 0.017865300178527832, 0.018349409103393555, 0.018833518028259277, 0.019317626953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 6.0, 7.0, 13.0, 12.0, 27.0, 32.0, 52.0, 67.0, 108.0, 165.0, 260.0, 394.0, 719.0, 1460.0, 2910.0, 6815.0, 16942.0, 44163.0, 116585.0, 260927.0, 313311.0, 171787.0, 67772.0, 25358.0, 9956.0, 4203.0, 2038.0, 981.0, 574.0, 328.0, 197.0, 117.0, 81.0, 61.0, 38.0, 26.0, 24.0, 15.0, 10.0, 6.0, 7.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.034271240234375, -0.03320741653442383, -0.032143592834472656, -0.031079769134521484, -0.030015945434570312, -0.02895212173461914, -0.02788829803466797, -0.026824474334716797, -0.025760650634765625, -0.024696826934814453, -0.02363300323486328, -0.02256917953491211, -0.021505355834960938, -0.020441532135009766, -0.019377708435058594, -0.018313884735107422, -0.01725006103515625, -0.016186237335205078, -0.015122413635253906, -0.014058589935302734, -0.012994766235351562, -0.01193094253540039, -0.010867118835449219, -0.009803295135498047, -0.008739471435546875, -0.007675647735595703, -0.006611824035644531, -0.005548000335693359, -0.0044841766357421875, -0.0034203529357910156, -0.0023565292358398438, -0.0012927055358886719, -0.0002288818359375, 0.0008349418640136719, 0.0018987655639648438, 0.0029625892639160156, 0.0040264129638671875, 0.005090236663818359, 0.006154060363769531, 0.007217884063720703, 0.008281707763671875, 0.009345531463623047, 0.010409355163574219, 0.01147317886352539, 0.012537002563476562, 0.013600826263427734, 0.014664649963378906, 0.015728473663330078, 0.01679229736328125, 0.017856121063232422, 0.018919944763183594, 0.019983768463134766, 0.021047592163085938, 0.02211141586303711, 0.02317523956298828, 0.024239063262939453, 0.025302886962890625, 0.026366710662841797, 0.02743053436279297, 0.02849435806274414, 0.029558181762695312, 0.030622005462646484, 0.031685829162597656, 0.03274965286254883, 0.0338134765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 9.0, 7.0, 8.0, 14.0, 9.0, 19.0, 20.0, 24.0, 19.0, 17.0, 26.0, 31.0, 35.0, 35.0, 32.0, 30.0, 28.0, 38.0, 38.0, 52.0, 32.0, 37.0, 33.0, 26.0, 52.0, 34.0, 39.0, 39.0, 40.0, 24.0, 20.0, 26.0, 11.0, 11.0, 12.0, 15.0, 10.0, 5.0, 7.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.035003662109375, -0.033916473388671875, -0.03282928466796875, -0.031742095947265625, -0.0306549072265625, -0.029567718505859375, -0.02848052978515625, -0.027393341064453125, -0.02630615234375, -0.025218963623046875, -0.02413177490234375, -0.023044586181640625, -0.0219573974609375, -0.020870208740234375, -0.01978302001953125, -0.018695831298828125, -0.017608642578125, -0.016521453857421875, -0.01543426513671875, -0.014347076416015625, -0.0132598876953125, -0.012172698974609375, -0.01108551025390625, -0.009998321533203125, -0.0089111328125, -0.007823944091796875, -0.00673675537109375, -0.005649566650390625, -0.0045623779296875, -0.003475189208984375, -0.00238800048828125, -0.001300811767578125, -0.000213623046875, 0.000873565673828125, 0.00196075439453125, 0.003047943115234375, 0.0041351318359375, 0.005222320556640625, 0.00630950927734375, 0.007396697998046875, 0.00848388671875, 0.009571075439453125, 0.01065826416015625, 0.011745452880859375, 0.0128326416015625, 0.013919830322265625, 0.01500701904296875, 0.016094207763671875, 0.017181396484375, 0.018268585205078125, 0.01935577392578125, 0.020442962646484375, 0.0215301513671875, 0.022617340087890625, 0.02370452880859375, 0.024791717529296875, 0.02587890625, 0.026966094970703125, 0.02805328369140625, 0.029140472412109375, 0.0302276611328125, 0.031314849853515625, 0.03240203857421875, 0.033489227294921875, 0.034576416015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 6.0, 9.0, 12.0, 17.0, 33.0, 63.0, 89.0, 167.0, 338.0, 648.0, 1399.0, 3918.0, 18199.0, 153549.0, 613164.0, 223087.0, 25733.0, 4960.0, 1580.0, 760.0, 371.0, 195.0, 106.0, 53.0, 26.0, 21.0, 18.0, 16.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.03253173828125, -0.031688690185546875, -0.03084564208984375, -0.030002593994140625, -0.0291595458984375, -0.028316497802734375, -0.02747344970703125, -0.026630401611328125, -0.025787353515625, -0.024944305419921875, -0.02410125732421875, -0.023258209228515625, -0.0224151611328125, -0.021572113037109375, -0.02072906494140625, -0.019886016845703125, -0.01904296875, -0.018199920654296875, -0.01735687255859375, -0.016513824462890625, -0.0156707763671875, -0.014827728271484375, -0.01398468017578125, -0.013141632080078125, -0.012298583984375, -0.011455535888671875, -0.01061248779296875, -0.009769439697265625, -0.0089263916015625, -0.008083343505859375, -0.00724029541015625, -0.006397247314453125, -0.00555419921875, -0.004711151123046875, -0.00386810302734375, -0.003025054931640625, -0.0021820068359375, -0.001338958740234375, -0.00049591064453125, 0.000347137451171875, 0.001190185546875, 0.002033233642578125, 0.00287628173828125, 0.003719329833984375, 0.0045623779296875, 0.005405426025390625, 0.00624847412109375, 0.007091522216796875, 0.0079345703125, 0.008777618408203125, 0.00962066650390625, 0.010463714599609375, 0.0113067626953125, 0.012149810791015625, 0.01299285888671875, 0.013835906982421875, 0.014678955078125, 0.015522003173828125, 0.01636505126953125, 0.017208099365234375, 0.0180511474609375, 0.018894195556640625, 0.01973724365234375, 0.020580291748046875, 0.02142333984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 6.0, 1.0, 8.0, 9.0, 11.0, 17.0, 12.0, 24.0, 34.0, 40.0, 73.0, 51.0, 86.0, 46.0, 62.0, 75.0, 53.0, 64.0, 59.0, 58.0, 43.0, 30.0, 46.0, 18.0, 30.0, 15.0, 4.0, 11.0, 9.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.854534149169922e-06, -6.650574505329132e-06, -6.446614861488342e-06, -6.2426552176475525e-06, -6.038695573806763e-06, -5.834735929965973e-06, -5.630776286125183e-06, -5.426816642284393e-06, -5.2228569984436035e-06, -5.018897354602814e-06, -4.814937710762024e-06, -4.610978066921234e-06, -4.407018423080444e-06, -4.2030587792396545e-06, -3.999099135398865e-06, -3.795139491558075e-06, -3.591179847717285e-06, -3.3872202038764954e-06, -3.1832605600357056e-06, -2.9793009161949158e-06, -2.775341272354126e-06, -2.571381628513336e-06, -2.3674219846725464e-06, -2.1634623408317566e-06, -1.959502696990967e-06, -1.755543053150177e-06, -1.5515834093093872e-06, -1.3476237654685974e-06, -1.1436641216278076e-06, -9.397044777870178e-07, -7.35744833946228e-07, -5.317851901054382e-07, -3.2782554626464844e-07, -1.2386590242385864e-07, 8.009374141693115e-08, 2.8405338525772095e-07, 4.880130290985107e-07, 6.919726729393005e-07, 8.959323167800903e-07, 1.0998919606208801e-06, 1.30385160446167e-06, 1.5078112483024597e-06, 1.7117708921432495e-06, 1.9157305359840393e-06, 2.119690179824829e-06, 2.323649823665619e-06, 2.5276094675064087e-06, 2.7315691113471985e-06, 2.9355287551879883e-06, 3.139488399028778e-06, 3.343448042869568e-06, 3.5474076867103577e-06, 3.7513673305511475e-06, 3.955326974391937e-06, 4.159286618232727e-06, 4.363246262073517e-06, 4.567205905914307e-06, 4.7711655497550964e-06, 4.975125193595886e-06, 5.179084837436676e-06, 5.383044481277466e-06, 5.587004125118256e-06, 5.790963768959045e-06, 5.994923412799835e-06, 6.198883056640625e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 15.0, 16.0, 18.0, 33.0, 61.0, 100.0, 213.0, 350.0, 916.0, 2465.0, 9319.0, 56316.0, 385324.0, 490598.0, 84738.0, 12949.0, 3093.0, 1074.0, 463.0, 183.0, 112.0, 81.0, 37.0, 24.0, 13.0, 14.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0282440185546875, -0.027390718460083008, -0.026537418365478516, -0.025684118270874023, -0.02483081817626953, -0.02397751808166504, -0.023124217987060547, -0.022270917892456055, -0.021417617797851562, -0.02056431770324707, -0.019711017608642578, -0.018857717514038086, -0.018004417419433594, -0.0171511173248291, -0.01629781723022461, -0.015444517135620117, -0.014591217041015625, -0.013737916946411133, -0.01288461685180664, -0.012031316757202148, -0.011178016662597656, -0.010324716567993164, -0.009471416473388672, -0.00861811637878418, -0.0077648162841796875, -0.006911516189575195, -0.006058216094970703, -0.005204916000366211, -0.004351615905761719, -0.0034983158111572266, -0.0026450157165527344, -0.0017917156219482422, -0.00093841552734375, -8.511543273925781e-05, 0.0007681846618652344, 0.0016214847564697266, 0.0024747848510742188, 0.003328084945678711, 0.004181385040283203, 0.005034685134887695, 0.0058879852294921875, 0.00674128532409668, 0.007594585418701172, 0.008447885513305664, 0.009301185607910156, 0.010154485702514648, 0.01100778579711914, 0.011861085891723633, 0.012714385986328125, 0.013567686080932617, 0.01442098617553711, 0.015274286270141602, 0.016127586364746094, 0.016980886459350586, 0.017834186553955078, 0.01868748664855957, 0.019540786743164062, 0.020394086837768555, 0.021247386932373047, 0.02210068702697754, 0.02295398712158203, 0.023807287216186523, 0.024660587310791016, 0.025513887405395508, 0.0263671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 13.0, 14.0, 27.0, 34.0, 46.0, 75.0, 82.0, 89.0, 101.0, 113.0, 93.0, 90.0, 68.0, 39.0, 29.0, 15.0, 21.0, 12.0, 12.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0238800048828125, -0.023082494735717773, -0.022284984588623047, -0.02148747444152832, -0.020689964294433594, -0.019892454147338867, -0.01909494400024414, -0.018297433853149414, -0.017499923706054688, -0.01670241355895996, -0.015904903411865234, -0.015107393264770508, -0.014309883117675781, -0.013512372970581055, -0.012714862823486328, -0.011917352676391602, -0.011119842529296875, -0.010322332382202148, -0.009524822235107422, -0.008727312088012695, -0.007929801940917969, -0.007132291793823242, -0.006334781646728516, -0.005537271499633789, -0.0047397613525390625, -0.003942251205444336, -0.0031447410583496094, -0.002347230911254883, -0.0015497207641601562, -0.0007522106170654297, 4.5299530029296875e-05, 0.0008428096771240234, 0.00164031982421875, 0.0024378299713134766, 0.003235340118408203, 0.00403285026550293, 0.004830360412597656, 0.005627870559692383, 0.006425380706787109, 0.007222890853881836, 0.008020401000976562, 0.008817911148071289, 0.009615421295166016, 0.010412931442260742, 0.011210441589355469, 0.012007951736450195, 0.012805461883544922, 0.013602972030639648, 0.014400482177734375, 0.015197992324829102, 0.015995502471923828, 0.016793012619018555, 0.01759052276611328, 0.018388032913208008, 0.019185543060302734, 0.01998305320739746, 0.020780563354492188, 0.021578073501586914, 0.02237558364868164, 0.023173093795776367, 0.023970603942871094, 0.02476811408996582, 0.025565624237060547, 0.026363134384155273, 0.02716064453125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 0.0, 6.0, 14.0, 25.0, 64.0, 126.0, 182.0, 241.0, 180.0, 88.0, 37.0, 21.0, 10.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5919350981712341, -0.5757158398628235, -0.5594965219497681, -0.5432772636413574, -0.5270580053329468, -0.5108387470245361, -0.4946194589138031, -0.47840017080307007, -0.4621809124946594, -0.4459616541862488, -0.42974236607551575, -0.4135230779647827, -0.39730381965637207, -0.3810845613479614, -0.3648652732372284, -0.34864598512649536, -0.3324267268180847, -0.3162074685096741, -0.29998818039894104, -0.283768892288208, -0.26754963397979736, -0.2513303756713867, -0.2351110875606537, -0.21889181435108185, -0.20267254114151, -0.18645326793193817, -0.17023399472236633, -0.1540147215127945, -0.13779544830322266, -0.12157617509365082, -0.10535690188407898, -0.08913762867450714, -0.07291841506958008, -0.05669914186000824, -0.0404798686504364, -0.024260595440864563, -0.008041322231292725, 0.008177950978279114, 0.024397224187850952, 0.04061649739742279, 0.05683577060699463, 0.07305504381656647, 0.0892743170261383, 0.10549359023571014, 0.12171286344528198, 0.13793213665485382, 0.15415140986442566, 0.1703706830739975, 0.18658995628356934, 0.20280922949314117, 0.219028502702713, 0.23524777591228485, 0.2514670491218567, 0.26768630743026733, 0.28390559554100037, 0.3001248836517334, 0.31634414196014404, 0.3325634002685547, 0.3487826883792877, 0.36500197649002075, 0.3812212347984314, 0.39744049310684204, 0.4136597812175751, 0.4298790693283081, 0.44609832763671875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 13.0, 9.0, 7.0, 9.0, 9.0, 13.0, 18.0, 25.0, 23.0, 22.0, 22.0, 28.0, 29.0, 32.0, 38.0, 36.0, 32.0, 47.0, 44.0, 49.0, 51.0, 44.0, 41.0, 42.0, 45.0, 29.0, 30.0, 32.0, 38.0, 20.0, 28.0, 20.0, 18.0, 8.0, 9.0, 12.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.2509506344795227, -0.24388530850410461, -0.23681996762752533, -0.22975464165210724, -0.22268930077552795, -0.21562397480010986, -0.20855864882469177, -0.2014933079481125, -0.1944279670715332, -0.1873626410961151, -0.18029730021953583, -0.17323197424411774, -0.16616663336753845, -0.15910130739212036, -0.15203598141670227, -0.14497064054012299, -0.1379053145647049, -0.1308399885892868, -0.12377464771270752, -0.11670932173728943, -0.10964398086071014, -0.10257865488529205, -0.09551332145929337, -0.08844798803329468, -0.08138265460729599, -0.0743173211812973, -0.06725198775529861, -0.060186658054590225, -0.05312132462859154, -0.04605599120259285, -0.03899066150188446, -0.03192532807588577, -0.024859994649887085, -0.017794661223888397, -0.010729329660534859, -0.00366399809718132, 0.0034013353288173676, 0.010466668754816055, 0.017531998455524445, 0.024597331881523132, 0.03166266530752182, 0.03872799873352051, 0.045793332159519196, 0.052858661860227585, 0.05992399528622627, 0.06698933243751526, 0.07405465841293335, 0.08111999183893204, 0.08818532526493073, 0.09525065869092941, 0.1023159921169281, 0.10938131809234619, 0.11644665896892548, 0.12351198494434357, 0.13057732582092285, 0.13764265179634094, 0.14470797777175903, 0.15177330374717712, 0.1588386446237564, 0.1659039705991745, 0.17296931147575378, 0.18003463745117188, 0.18709996342658997, 0.19416530430316925, 0.20123064517974854]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 5.0, 20.0, 70.0, 473.0, 19351.0, 4169009.0, 5027.0, 264.0, 54.0, 7.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097900390625, -0.08621597290039062, -0.07453155517578125, -0.06284713745117188, -0.0511627197265625, -0.039478302001953125, -0.02779388427734375, -0.016109466552734375, -0.004425048828125, 0.007259368896484375, 0.01894378662109375, 0.030628204345703125, 0.0423126220703125, 0.053997039794921875, 0.06568145751953125, 0.07736587524414062, 0.08905029296875, 0.10073471069335938, 0.11241912841796875, 0.12410354614257812, 0.1357879638671875, 0.14747238159179688, 0.15915679931640625, 0.17084121704101562, 0.182525634765625, 0.19421005249023438, 0.20589447021484375, 0.21757888793945312, 0.2292633056640625, 0.24094772338867188, 0.25263214111328125, 0.2643165588378906, 0.2760009765625, 0.2876853942871094, 0.29936981201171875, 0.3110542297363281, 0.3227386474609375, 0.3344230651855469, 0.34610748291015625, 0.3577919006347656, 0.369476318359375, 0.3811607360839844, 0.39284515380859375, 0.4045295715332031, 0.4162139892578125, 0.4278984069824219, 0.43958282470703125, 0.4512672424316406, 0.46295166015625, 0.4746360778808594, 0.48632049560546875, 0.4980049133300781, 0.5096893310546875, 0.5213737487792969, 0.5330581665039062, 0.5447425842285156, 0.556427001953125, 0.5681114196777344, 0.5797958374023438, 0.5914802551269531, 0.6031646728515625, 0.6148490905761719, 0.6265335083007812, 0.6382179260253906, 0.64990234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 6.0, 5.0, 7.0, 11.0, 13.0, 18.0, 31.0, 29.0, 38.0, 44.0, 56.0, 61.0, 66.0, 90.0, 70.0, 76.0, 55.0, 59.0, 53.0, 61.0, 40.0, 40.0, 21.0, 20.0, 13.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01154327392578125, -0.011074185371398926, -0.010605096817016602, -0.010136008262634277, -0.009666919708251953, -0.009197831153869629, -0.008728742599487305, -0.00825965404510498, -0.007790565490722656, -0.007321476936340332, -0.006852388381958008, -0.006383299827575684, -0.005914211273193359, -0.005445122718811035, -0.004976034164428711, -0.004506945610046387, -0.0040378570556640625, -0.0035687685012817383, -0.003099679946899414, -0.00263059139251709, -0.0021615028381347656, -0.0016924142837524414, -0.0012233257293701172, -0.000754237174987793, -0.00028514862060546875, 0.00018393993377685547, 0.0006530284881591797, 0.001122117042541504, 0.0015912055969238281, 0.0020602941513061523, 0.0025293827056884766, 0.0029984712600708008, 0.003467559814453125, 0.003936648368835449, 0.0044057369232177734, 0.004874825477600098, 0.005343914031982422, 0.005813002586364746, 0.00628209114074707, 0.0067511796951293945, 0.007220268249511719, 0.007689356803894043, 0.008158445358276367, 0.008627533912658691, 0.009096622467041016, 0.00956571102142334, 0.010034799575805664, 0.010503888130187988, 0.010972976684570312, 0.011442065238952637, 0.011911153793334961, 0.012380242347717285, 0.01284933090209961, 0.013318419456481934, 0.013787508010864258, 0.014256596565246582, 0.014725685119628906, 0.01519477367401123, 0.015663862228393555, 0.01613295078277588, 0.016602039337158203, 0.017071127891540527, 0.01754021644592285, 0.018009305000305176, 0.0184783935546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 13.0, 9.0, 8.0, 20.0, 41.0, 61.0, 80.0, 139.0, 313.0, 579.0, 1141.0, 2510.0, 6766.0, 24098.0, 128779.0, 1928331.0, 1934923.0, 130165.0, 24387.0, 6892.0, 2607.0, 1125.0, 580.0, 297.0, 142.0, 101.0, 62.0, 39.0, 19.0, 9.0, 10.0, 4.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.055145263671875, -0.053421974182128906, -0.05169868469238281, -0.04997539520263672, -0.048252105712890625, -0.04652881622314453, -0.04480552673339844, -0.043082237243652344, -0.04135894775390625, -0.039635658264160156, -0.03791236877441406, -0.03618907928466797, -0.034465789794921875, -0.03274250030517578, -0.031019210815429688, -0.029295921325683594, -0.0275726318359375, -0.025849342346191406, -0.024126052856445312, -0.02240276336669922, -0.020679473876953125, -0.01895618438720703, -0.017232894897460938, -0.015509605407714844, -0.01378631591796875, -0.012063026428222656, -0.010339736938476562, -0.008616447448730469, -0.006893157958984375, -0.005169868469238281, -0.0034465789794921875, -0.0017232894897460938, 0.0, 0.0017232894897460938, 0.0034465789794921875, 0.005169868469238281, 0.006893157958984375, 0.008616447448730469, 0.010339736938476562, 0.012063026428222656, 0.01378631591796875, 0.015509605407714844, 0.017232894897460938, 0.01895618438720703, 0.020679473876953125, 0.02240276336669922, 0.024126052856445312, 0.025849342346191406, 0.0275726318359375, 0.029295921325683594, 0.031019210815429688, 0.03274250030517578, 0.034465789794921875, 0.03618907928466797, 0.03791236877441406, 0.039635658264160156, 0.04135894775390625, 0.043082237243652344, 0.04480552673339844, 0.04652881622314453, 0.048252105712890625, 0.04997539520263672, 0.05169868469238281, 0.053421974182128906, 0.055145263671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 13.0, 17.0, 18.0, 25.0, 44.0, 52.0, 85.0, 154.0, 256.0, 473.0, 790.0, 838.0, 473.0, 260.0, 187.0, 96.0, 93.0, 49.0, 35.0, 21.0, 25.0, 16.0, 14.0, 8.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0207672119140625, -0.020052671432495117, -0.019338130950927734, -0.01862359046936035, -0.01790904998779297, -0.017194509506225586, -0.016479969024658203, -0.01576542854309082, -0.015050888061523438, -0.014336347579956055, -0.013621807098388672, -0.012907266616821289, -0.012192726135253906, -0.011478185653686523, -0.01076364517211914, -0.010049104690551758, -0.009334564208984375, -0.008620023727416992, -0.00790548324584961, -0.0071909427642822266, -0.006476402282714844, -0.005761861801147461, -0.005047321319580078, -0.004332780838012695, -0.0036182403564453125, -0.0029036998748779297, -0.002189159393310547, -0.001474618911743164, -0.0007600784301757812, -4.553794860839844e-05, 0.0006690025329589844, 0.0013835430145263672, 0.00209808349609375, 0.002812623977661133, 0.0035271644592285156, 0.0042417049407958984, 0.004956245422363281, 0.005670785903930664, 0.006385326385498047, 0.00709986686706543, 0.007814407348632812, 0.008528947830200195, 0.009243488311767578, 0.009958028793334961, 0.010672569274902344, 0.011387109756469727, 0.01210165023803711, 0.012816190719604492, 0.013530731201171875, 0.014245271682739258, 0.01495981216430664, 0.015674352645874023, 0.016388893127441406, 0.01710343360900879, 0.017817974090576172, 0.018532514572143555, 0.019247055053710938, 0.01996159553527832, 0.020676136016845703, 0.021390676498413086, 0.02210521697998047, 0.02281975746154785, 0.023534297943115234, 0.024248838424682617, 0.02496337890625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 9.0, 52.0, 185.0, 306.0, 305.0, 87.0, 38.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48775309324264526, -0.4748343527317047, -0.46191561222076416, -0.4489968419075012, -0.43607810139656067, -0.4231593608856201, -0.41024062037467957, -0.397321879863739, -0.3844031095504761, -0.3714843690395355, -0.35856562852859497, -0.34564685821533203, -0.3327281177043915, -0.3198093771934509, -0.3068906366825104, -0.2939718961715698, -0.2810531556606293, -0.2681344151496887, -0.25521567463874817, -0.24229691922664642, -0.22937816381454468, -0.21645942330360413, -0.20354068279266357, -0.19062194228172302, -0.17770318686962128, -0.16478444635868073, -0.15186569094657898, -0.13894695043563843, -0.12602820992469788, -0.11310945451259613, -0.10019071400165558, -0.08727196604013443, -0.0743531882762909, -0.061434440314769745, -0.048515696078538895, -0.035596951842308044, -0.022678203880786896, -0.009759455919265747, 0.0031592845916748047, 0.016078032553195953, 0.028996780514717102, 0.04191552847623825, 0.0548342727124691, 0.06775301694869995, 0.0806717649102211, 0.09359051287174225, 0.1065092533826828, 0.11942800134420395, 0.1323467493057251, 0.14526548981666565, 0.1581842452287674, 0.17110298573970795, 0.1840217411518097, 0.19694048166275024, 0.2098592221736908, 0.22277796268463135, 0.2356967180967331, 0.24861545860767365, 0.2615342140197754, 0.27445295453071594, 0.2873716950416565, 0.30029046535491943, 0.3132091760635376, 0.32612794637680054, 0.3390466868877411]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 7.0, 11.0, 21.0, 16.0, 27.0, 32.0, 25.0, 18.0, 32.0, 37.0, 40.0, 46.0, 45.0, 43.0, 61.0, 49.0, 52.0, 40.0, 43.0, 55.0, 53.0, 33.0, 26.0, 22.0, 29.0, 30.0, 25.0, 26.0, 17.0, 6.0, 11.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07917118072509766, -0.07610733062028885, -0.07304348051548004, -0.06997963786125183, -0.06691578775644302, -0.06385193765163422, -0.06078809127211571, -0.0577242448925972, -0.05466039478778839, -0.051596544682979584, -0.048532698303461075, -0.045468851923942566, -0.04240500181913376, -0.03934115171432495, -0.03627730533480644, -0.03321345895528793, -0.030149608850479126, -0.027085760608315468, -0.02402191236615181, -0.02095806412398815, -0.017894215881824493, -0.014830367639660835, -0.011766519397497177, -0.008702671155333519, -0.005638822913169861, -0.0025749746710062027, 0.0004888735711574554, 0.0035527218133211136, 0.006616570055484772, 0.00968041829764843, 0.012744266539812088, 0.015808114781975746, 0.018871963024139404, 0.021935811266303062, 0.02499965950846672, 0.02806350775063038, 0.031127355992794037, 0.034191206097602844, 0.03725505247712135, 0.04031889885663986, 0.04338274896144867, 0.04644659906625748, 0.049510445445775986, 0.052574291825294495, 0.0556381419301033, 0.05870199203491211, 0.06176583841443062, 0.06482968479394913, 0.06789353489875793, 0.07095738500356674, 0.07402123510837555, 0.07708507776260376, 0.08014892786741257, 0.08321277797222137, 0.08627662062644958, 0.08934047073125839, 0.0924043208360672, 0.09546817094087601, 0.09853202104568481, 0.10159586369991302, 0.10465971380472183, 0.10772356390953064, 0.11078740656375885, 0.11385125666856766, 0.11691510677337646]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 17.0, 16.0, 21.0, 26.0, 40.0, 76.0, 126.0, 233.0, 420.0, 981.0, 2126.0, 6024.0, 22474.0, 122395.0, 555966.0, 275977.0, 44971.0, 10506.0, 3435.0, 1374.0, 632.0, 322.0, 175.0, 88.0, 46.0, 28.0, 19.0, 12.0, 7.0, 9.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0670166015625, -0.06459903717041016, -0.06218147277832031, -0.05976390838623047, -0.057346343994140625, -0.05492877960205078, -0.05251121520996094, -0.050093650817871094, -0.04767608642578125, -0.045258522033691406, -0.04284095764160156, -0.04042339324951172, -0.038005828857421875, -0.03558826446533203, -0.03317070007324219, -0.030753135681152344, -0.0283355712890625, -0.025918006896972656, -0.023500442504882812, -0.02108287811279297, -0.018665313720703125, -0.01624774932861328, -0.013830184936523438, -0.011412620544433594, -0.00899505615234375, -0.006577491760253906, -0.0041599273681640625, -0.0017423629760742188, 0.000675201416015625, 0.0030927658081054688, 0.0055103302001953125, 0.007927894592285156, 0.010345458984375, 0.012763023376464844, 0.015180587768554688, 0.01759815216064453, 0.020015716552734375, 0.02243328094482422, 0.024850845336914062, 0.027268409729003906, 0.02968597412109375, 0.032103538513183594, 0.03452110290527344, 0.03693866729736328, 0.039356231689453125, 0.04177379608154297, 0.04419136047363281, 0.046608924865722656, 0.0490264892578125, 0.051444053649902344, 0.05386161804199219, 0.05627918243408203, 0.058696746826171875, 0.06111431121826172, 0.06353187561035156, 0.0659494400024414, 0.06836700439453125, 0.0707845687866211, 0.07320213317871094, 0.07561969757080078, 0.07803726196289062, 0.08045482635498047, 0.08287239074707031, 0.08528995513916016, 0.08770751953125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 5.0, 11.0, 11.0, 19.0, 21.0, 29.0, 44.0, 46.0, 64.0, 46.0, 64.0, 78.0, 64.0, 77.0, 65.0, 64.0, 53.0, 53.0, 47.0, 41.0, 26.0, 21.0, 13.0, 13.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01251220703125, -0.012028217315673828, -0.011544227600097656, -0.011060237884521484, -0.010576248168945312, -0.01009225845336914, -0.009608268737792969, -0.009124279022216797, -0.008640289306640625, -0.008156299591064453, -0.007672309875488281, -0.007188320159912109, -0.0067043304443359375, -0.006220340728759766, -0.005736351013183594, -0.005252361297607422, -0.00476837158203125, -0.004284381866455078, -0.0038003921508789062, -0.0033164024353027344, -0.0028324127197265625, -0.0023484230041503906, -0.0018644332885742188, -0.0013804435729980469, -0.000896453857421875, -0.0004124641418457031, 7.152557373046875e-05, 0.0005555152893066406, 0.0010395050048828125, 0.0015234947204589844, 0.0020074844360351562, 0.002491474151611328, 0.0029754638671875, 0.003459453582763672, 0.003943443298339844, 0.004427433013916016, 0.0049114227294921875, 0.005395412445068359, 0.005879402160644531, 0.006363391876220703, 0.006847381591796875, 0.007331371307373047, 0.007815361022949219, 0.00829935073852539, 0.008783340454101562, 0.009267330169677734, 0.009751319885253906, 0.010235309600830078, 0.01071929931640625, 0.011203289031982422, 0.011687278747558594, 0.012171268463134766, 0.012655258178710938, 0.01313924789428711, 0.013623237609863281, 0.014107227325439453, 0.014591217041015625, 0.015075206756591797, 0.015559196472167969, 0.01604318618774414, 0.016527175903320312, 0.017011165618896484, 0.017495155334472656, 0.017979145050048828, 0.018463134765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 16.0, 10.0, 21.0, 17.0, 28.0, 43.0, 46.0, 103.0, 165.0, 244.0, 471.0, 896.0, 2127.0, 5207.0, 16375.0, 61314.0, 261343.0, 471642.0, 170138.0, 39673.0, 11460.0, 3909.0, 1604.0, 702.0, 383.0, 233.0, 120.0, 82.0, 51.0, 35.0, 27.0, 12.0, 18.0, 12.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05316162109375, -0.051657676696777344, -0.05015373229980469, -0.04864978790283203, -0.047145843505859375, -0.04564189910888672, -0.04413795471191406, -0.042634010314941406, -0.04113006591796875, -0.039626121520996094, -0.03812217712402344, -0.03661823272705078, -0.035114288330078125, -0.03361034393310547, -0.03210639953613281, -0.030602455139160156, -0.0290985107421875, -0.027594566345214844, -0.026090621948242188, -0.02458667755126953, -0.023082733154296875, -0.02157878875732422, -0.020074844360351562, -0.018570899963378906, -0.01706695556640625, -0.015563011169433594, -0.014059066772460938, -0.012555122375488281, -0.011051177978515625, -0.009547233581542969, -0.008043289184570312, -0.006539344787597656, -0.005035400390625, -0.0035314559936523438, -0.0020275115966796875, -0.0005235671997070312, 0.000980377197265625, 0.0024843215942382812, 0.0039882659912109375, 0.005492210388183594, 0.00699615478515625, 0.008500099182128906, 0.010004043579101562, 0.011507987976074219, 0.013011932373046875, 0.014515876770019531, 0.016019821166992188, 0.017523765563964844, 0.0190277099609375, 0.020531654357910156, 0.022035598754882812, 0.02353954315185547, 0.025043487548828125, 0.02654743194580078, 0.028051376342773438, 0.029555320739746094, 0.03105926513671875, 0.032563209533691406, 0.03406715393066406, 0.03557109832763672, 0.037075042724609375, 0.03857898712158203, 0.04008293151855469, 0.041586875915527344, 0.0430908203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 4.0, 2.0, 6.0, 11.0, 5.0, 11.0, 9.0, 14.0, 8.0, 27.0, 21.0, 20.0, 39.0, 27.0, 31.0, 39.0, 31.0, 43.0, 44.0, 47.0, 54.0, 49.0, 56.0, 45.0, 33.0, 49.0, 43.0, 40.0, 33.0, 24.0, 24.0, 23.0, 19.0, 13.0, 11.0, 5.0, 5.0, 18.0, 4.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0391845703125, -0.037850379943847656, -0.03651618957519531, -0.03518199920654297, -0.033847808837890625, -0.03251361846923828, -0.031179428100585938, -0.029845237731933594, -0.02851104736328125, -0.027176856994628906, -0.025842666625976562, -0.02450847625732422, -0.023174285888671875, -0.02184009552001953, -0.020505905151367188, -0.019171714782714844, -0.0178375244140625, -0.016503334045410156, -0.015169143676757812, -0.013834953308105469, -0.012500762939453125, -0.011166572570800781, -0.009832382202148438, -0.008498191833496094, -0.00716400146484375, -0.005829811096191406, -0.0044956207275390625, -0.0031614303588867188, -0.001827239990234375, -0.0004930496215820312, 0.0008411407470703125, 0.0021753311157226562, 0.003509521484375, 0.004843711853027344, 0.0061779022216796875, 0.007512092590332031, 0.008846282958984375, 0.010180473327636719, 0.011514663696289062, 0.012848854064941406, 0.01418304443359375, 0.015517234802246094, 0.016851425170898438, 0.01818561553955078, 0.019519805908203125, 0.02085399627685547, 0.022188186645507812, 0.023522377014160156, 0.0248565673828125, 0.026190757751464844, 0.027524948120117188, 0.02885913848876953, 0.030193328857421875, 0.03152751922607422, 0.03286170959472656, 0.034195899963378906, 0.03553009033203125, 0.036864280700683594, 0.03819847106933594, 0.03953266143798828, 0.040866851806640625, 0.04220104217529297, 0.04353523254394531, 0.044869422912597656, 0.04620361328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 11.0, 10.0, 8.0, 25.0, 33.0, 43.0, 69.0, 121.0, 181.0, 310.0, 634.0, 1247.0, 3578.0, 15966.0, 173783.0, 693594.0, 139640.0, 13538.0, 3252.0, 1169.0, 557.0, 306.0, 175.0, 121.0, 65.0, 38.0, 29.0, 16.0, 13.0, 9.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.029083251953125, -0.028213977813720703, -0.027344703674316406, -0.02647542953491211, -0.025606155395507812, -0.024736881256103516, -0.02386760711669922, -0.022998332977294922, -0.022129058837890625, -0.021259784698486328, -0.02039051055908203, -0.019521236419677734, -0.018651962280273438, -0.01778268814086914, -0.016913414001464844, -0.016044139862060547, -0.01517486572265625, -0.014305591583251953, -0.013436317443847656, -0.01256704330444336, -0.011697769165039062, -0.010828495025634766, -0.009959220886230469, -0.009089946746826172, -0.008220672607421875, -0.007351398468017578, -0.006482124328613281, -0.005612850189208984, -0.0047435760498046875, -0.0038743019104003906, -0.0030050277709960938, -0.002135753631591797, -0.0012664794921875, -0.0003972053527832031, 0.00047206878662109375, 0.0013413429260253906, 0.0022106170654296875, 0.0030798912048339844, 0.003949165344238281, 0.004818439483642578, 0.005687713623046875, 0.006556987762451172, 0.007426261901855469, 0.008295536041259766, 0.009164810180664062, 0.01003408432006836, 0.010903358459472656, 0.011772632598876953, 0.01264190673828125, 0.013511180877685547, 0.014380455017089844, 0.01524972915649414, 0.016119003295898438, 0.016988277435302734, 0.01785755157470703, 0.018726825714111328, 0.019596099853515625, 0.020465373992919922, 0.02133464813232422, 0.022203922271728516, 0.023073196411132812, 0.02394247055053711, 0.024811744689941406, 0.025681018829345703, 0.02655029296875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 9.0, 8.0, 10.0, 22.0, 35.0, 33.0, 40.0, 62.0, 58.0, 73.0, 95.0, 85.0, 93.0, 86.0, 59.0, 45.0, 45.0, 43.0, 27.0, 27.0, 11.0, 13.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.58306884765625e-06, -8.334405720233917e-06, -8.085742592811584e-06, -7.837079465389252e-06, -7.588416337966919e-06, -7.339753210544586e-06, -7.091090083122253e-06, -6.842426955699921e-06, -6.593763828277588e-06, -6.345100700855255e-06, -6.096437573432922e-06, -5.84777444601059e-06, -5.599111318588257e-06, -5.350448191165924e-06, -5.101785063743591e-06, -4.8531219363212585e-06, -4.604458808898926e-06, -4.355795681476593e-06, -4.10713255405426e-06, -3.8584694266319275e-06, -3.6098062992095947e-06, -3.361143171787262e-06, -3.112480044364929e-06, -2.8638169169425964e-06, -2.6151537895202637e-06, -2.366490662097931e-06, -2.117827534675598e-06, -1.8691644072532654e-06, -1.6205012798309326e-06, -1.3718381524085999e-06, -1.123175024986267e-06, -8.745118975639343e-07, -6.258487701416016e-07, -3.771856427192688e-07, -1.2852251529693604e-07, 1.2014061212539673e-07, 3.688037395477295e-07, 6.174668669700623e-07, 8.66129994392395e-07, 1.1147931218147278e-06, 1.3634562492370605e-06, 1.6121193766593933e-06, 1.860782504081726e-06, 2.109445631504059e-06, 2.3581087589263916e-06, 2.6067718863487244e-06, 2.855435013771057e-06, 3.10409814119339e-06, 3.3527612686157227e-06, 3.6014243960380554e-06, 3.850087523460388e-06, 4.098750650882721e-06, 4.347413778305054e-06, 4.5960769057273865e-06, 4.844740033149719e-06, 5.093403160572052e-06, 5.342066287994385e-06, 5.5907294154167175e-06, 5.83939254283905e-06, 6.088055670261383e-06, 6.336718797683716e-06, 6.585381925106049e-06, 6.834045052528381e-06, 7.082708179950714e-06, 7.331371307373047e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 17.0, 29.0, 40.0, 52.0, 89.0, 150.0, 285.0, 623.0, 1531.0, 5370.0, 37560.0, 480491.0, 477048.0, 37049.0, 5460.0, 1431.0, 627.0, 276.0, 150.0, 86.0, 59.0, 32.0, 24.0, 21.0, 10.0, 9.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.027008056640625, -0.026043415069580078, -0.025078773498535156, -0.024114131927490234, -0.023149490356445312, -0.02218484878540039, -0.02122020721435547, -0.020255565643310547, -0.019290924072265625, -0.018326282501220703, -0.01736164093017578, -0.01639699935913086, -0.015432357788085938, -0.014467716217041016, -0.013503074645996094, -0.012538433074951172, -0.01157379150390625, -0.010609149932861328, -0.009644508361816406, -0.008679866790771484, -0.0077152252197265625, -0.006750583648681641, -0.005785942077636719, -0.004821300506591797, -0.003856658935546875, -0.002892017364501953, -0.0019273757934570312, -0.0009627342224121094, 1.9073486328125e-06, 0.0009665489196777344, 0.0019311904907226562, 0.002895832061767578, 0.0038604736328125, 0.004825115203857422, 0.005789756774902344, 0.006754398345947266, 0.0077190399169921875, 0.00868368148803711, 0.009648323059082031, 0.010612964630126953, 0.011577606201171875, 0.012542247772216797, 0.013506889343261719, 0.01447153091430664, 0.015436172485351562, 0.016400814056396484, 0.017365455627441406, 0.018330097198486328, 0.01929473876953125, 0.020259380340576172, 0.021224021911621094, 0.022188663482666016, 0.023153305053710938, 0.02411794662475586, 0.02508258819580078, 0.026047229766845703, 0.027011871337890625, 0.027976512908935547, 0.02894115447998047, 0.02990579605102539, 0.030870437622070312, 0.031835079193115234, 0.032799720764160156, 0.03376436233520508, 0.03472900390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 7.0, 22.0, 21.0, 42.0, 50.0, 85.0, 139.0, 127.0, 122.0, 125.0, 81.0, 53.0, 42.0, 19.0, 13.0, 10.0, 9.0, 5.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265960693359375, -0.025609731674194336, -0.024623394012451172, -0.023637056350708008, -0.022650718688964844, -0.02166438102722168, -0.020678043365478516, -0.01969170570373535, -0.018705368041992188, -0.017719030380249023, -0.01673269271850586, -0.015746355056762695, -0.014760017395019531, -0.013773679733276367, -0.012787342071533203, -0.011801004409790039, -0.010814666748046875, -0.009828329086303711, -0.008841991424560547, -0.007855653762817383, -0.006869316101074219, -0.005882978439331055, -0.004896640777587891, -0.0039103031158447266, -0.0029239654541015625, -0.0019376277923583984, -0.0009512901306152344, 3.504753112792969e-05, 0.0010213851928710938, 0.002007722854614258, 0.002994060516357422, 0.003980398178100586, 0.00496673583984375, 0.005953073501586914, 0.006939411163330078, 0.007925748825073242, 0.008912086486816406, 0.00989842414855957, 0.010884761810302734, 0.011871099472045898, 0.012857437133789062, 0.013843774795532227, 0.01483011245727539, 0.015816450119018555, 0.01680278778076172, 0.017789125442504883, 0.018775463104248047, 0.01976180076599121, 0.020748138427734375, 0.02173447608947754, 0.022720813751220703, 0.023707151412963867, 0.02469348907470703, 0.025679826736450195, 0.02666616439819336, 0.027652502059936523, 0.028638839721679688, 0.02962517738342285, 0.030611515045166016, 0.03159785270690918, 0.032584190368652344, 0.03357052803039551, 0.03455686569213867, 0.035543203353881836, 0.036529541015625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 9.0, 21.0, 29.0, 73.0, 141.0, 206.0, 207.0, 129.0, 99.0, 52.0, 17.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32467135787010193, -0.3099595606327057, -0.29524773359298706, -0.2805359363555908, -0.2658241391181946, -0.25111234188079834, -0.2364005297422409, -0.22168871760368347, -0.20697692036628723, -0.192265123128891, -0.17755331099033356, -0.16284149885177612, -0.14812970161437988, -0.13341790437698364, -0.11870609223842621, -0.10399428755044937, -0.08928248286247253, -0.0745706781744957, -0.05985887348651886, -0.04514706879854202, -0.030435264110565186, -0.01572345942258835, -0.0010116547346115112, 0.013700149953365326, 0.028411954641342163, 0.043123759329319, 0.05783556401729584, 0.07254736870527267, 0.08725917339324951, 0.10197097808122635, 0.11668278276920319, 0.13139459490776062, 0.14610642194747925, 0.1608182191848755, 0.17553003132343292, 0.19024184346199036, 0.2049536406993866, 0.21966543793678284, 0.23437725007534027, 0.2490890622138977, 0.26380085945129395, 0.2785126566886902, 0.2932244539260864, 0.30793628096580505, 0.3226480782032013, 0.33735987544059753, 0.35207170248031616, 0.3667834997177124, 0.38149529695510864, 0.3962070941925049, 0.4109188914299011, 0.42563071846961975, 0.440342515707016, 0.45505431294441223, 0.46976613998413086, 0.4844779372215271, 0.49918973445892334, 0.5139015316963196, 0.5286133289337158, 0.5433251261711121, 0.5580369234085083, 0.5727487802505493, 0.5874605774879456, 0.6021723747253418, 0.616884171962738]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 4.0, 8.0, 6.0, 8.0, 12.0, 16.0, 25.0, 18.0, 38.0, 30.0, 22.0, 27.0, 36.0, 38.0, 38.0, 34.0, 40.0, 40.0, 41.0, 44.0, 37.0, 42.0, 43.0, 38.0, 44.0, 30.0, 31.0, 29.0, 27.0, 22.0, 19.0, 16.0, 15.0, 10.0, 15.0, 14.0, 6.0, 6.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.209489107131958, -0.2028724104166031, -0.19625572860240936, -0.18963903188705444, -0.18302233517169952, -0.1764056384563446, -0.16978895664215088, -0.16317225992679596, -0.15655556321144104, -0.14993886649608612, -0.1433221846818924, -0.13670548796653748, -0.13008879125118256, -0.12347210198640823, -0.11685541272163391, -0.11023871600627899, -0.10362203419208527, -0.09700534492731094, -0.09038864821195602, -0.0837719589471817, -0.07715526223182678, -0.07053857296705246, -0.06392188370227814, -0.057305190712213516, -0.050688497722148895, -0.044071804732084274, -0.03745511174201965, -0.03083842247724533, -0.02422172948718071, -0.01760503649711609, -0.010988347232341766, -0.004371654242277145, 0.0022450387477874756, 0.008861730806529522, 0.015478422865271568, 0.02209511399269104, 0.02871180698275566, 0.03532849997282028, 0.041945189237594604, 0.048561882227659225, 0.055178575217723846, 0.06179526820778847, 0.06841196119785309, 0.07502865046262741, 0.08164533972740173, 0.08826203644275665, 0.09487872570753098, 0.1014954149723053, 0.10811211168766022, 0.11472880095243454, 0.12134549766778946, 0.12796218693256378, 0.1345788836479187, 0.14119556546211243, 0.14781226217746735, 0.15442895889282227, 0.161045640707016, 0.1676623374223709, 0.17427901923656464, 0.18089571595191956, 0.18751241266727448, 0.1941291093826294, 0.20074579119682312, 0.20736248791217804, 0.21397918462753296]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 4.0, 17.0, 17.0, 32.0, 50.0, 92.0, 150.0, 299.0, 635.0, 1415.0, 4203.0, 17576.0, 176112.0, 3792536.0, 176396.0, 17608.0, 4271.0, 1530.0, 638.0, 310.0, 156.0, 85.0, 54.0, 36.0, 16.0, 10.0, 7.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0], "bins": [-0.11553955078125, -0.11294317245483398, -0.11034679412841797, -0.10775041580200195, -0.10515403747558594, -0.10255765914916992, -0.0999612808227539, -0.09736490249633789, -0.09476852416992188, -0.09217214584350586, -0.08957576751708984, -0.08697938919067383, -0.08438301086425781, -0.0817866325378418, -0.07919025421142578, -0.07659387588500977, -0.07399749755859375, -0.07140111923217773, -0.06880474090576172, -0.0662083625793457, -0.06361198425292969, -0.06101560592651367, -0.058419227600097656, -0.05582284927368164, -0.053226470947265625, -0.05063009262084961, -0.048033714294433594, -0.04543733596801758, -0.04284095764160156, -0.04024457931518555, -0.03764820098876953, -0.035051822662353516, -0.0324554443359375, -0.029859066009521484, -0.02726268768310547, -0.024666309356689453, -0.022069931030273438, -0.019473552703857422, -0.016877174377441406, -0.01428079605102539, -0.011684417724609375, -0.00908803939819336, -0.006491661071777344, -0.003895282745361328, -0.0012989044189453125, 0.0012974739074707031, 0.0038938522338867188, 0.006490230560302734, 0.00908660888671875, 0.011682987213134766, 0.014279365539550781, 0.016875743865966797, 0.019472122192382812, 0.022068500518798828, 0.024664878845214844, 0.02726125717163086, 0.029857635498046875, 0.03245401382446289, 0.035050392150878906, 0.03764677047729492, 0.04024314880371094, 0.04283952713012695, 0.04543590545654297, 0.048032283782958984, 0.050628662109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 7.0, 11.0, 13.0, 18.0, 16.0, 21.0, 34.0, 47.0, 38.0, 48.0, 65.0, 67.0, 60.0, 67.0, 76.0, 59.0, 62.0, 53.0, 44.0, 42.0, 35.0, 26.0, 27.0, 19.0, 10.0, 8.0, 12.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0121612548828125, -0.011689186096191406, -0.011217117309570312, -0.010745048522949219, -0.010272979736328125, -0.009800910949707031, -0.009328842163085938, -0.008856773376464844, -0.00838470458984375, -0.007912635803222656, -0.0074405670166015625, -0.006968498229980469, -0.006496429443359375, -0.006024360656738281, -0.0055522918701171875, -0.005080223083496094, -0.004608154296875, -0.004136085510253906, -0.0036640167236328125, -0.0031919479370117188, -0.002719879150390625, -0.0022478103637695312, -0.0017757415771484375, -0.0013036727905273438, -0.00083160400390625, -0.00035953521728515625, 0.0001125335693359375, 0.0005846023559570312, 0.001056671142578125, 0.0015287399291992188, 0.0020008087158203125, 0.0024728775024414062, 0.0029449462890625, 0.0034170150756835938, 0.0038890838623046875, 0.004361152648925781, 0.004833221435546875, 0.005305290222167969, 0.0057773590087890625, 0.006249427795410156, 0.00672149658203125, 0.007193565368652344, 0.0076656341552734375, 0.008137702941894531, 0.008609771728515625, 0.009081840515136719, 0.009553909301757812, 0.010025978088378906, 0.010498046875, 0.010970115661621094, 0.011442184448242188, 0.011914253234863281, 0.012386322021484375, 0.012858390808105469, 0.013330459594726562, 0.013802528381347656, 0.01427459716796875, 0.014746665954589844, 0.015218734741210938, 0.01569080352783203, 0.016162872314453125, 0.01663494110107422, 0.017107009887695312, 0.017579078674316406, 0.0180511474609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 16.0, 56.0, 112.0, 167.0, 395.0, 1091.0, 4238.0, 36464.0, 3860059.0, 277594.0, 10665.0, 2153.0, 680.0, 276.0, 138.0, 59.0, 49.0, 25.0, 14.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.16375446319580078, -0.15917396545410156, -0.15459346771240234, -0.15001296997070312, -0.1454324722290039, -0.1408519744873047, -0.13627147674560547, -0.13169097900390625, -0.12711048126220703, -0.12252998352050781, -0.1179494857788086, -0.11336898803710938, -0.10878849029541016, -0.10420799255371094, -0.09962749481201172, -0.0950469970703125, -0.09046649932861328, -0.08588600158691406, -0.08130550384521484, -0.07672500610351562, -0.0721445083618164, -0.06756401062011719, -0.06298351287841797, -0.05840301513671875, -0.05382251739501953, -0.04924201965332031, -0.044661521911621094, -0.040081024169921875, -0.035500526428222656, -0.030920028686523438, -0.02633953094482422, -0.021759033203125, -0.01717853546142578, -0.012598037719726562, -0.008017539978027344, -0.003437042236328125, 0.0011434555053710938, 0.0057239532470703125, 0.010304450988769531, 0.01488494873046875, 0.01946544647216797, 0.024045944213867188, 0.028626441955566406, 0.033206939697265625, 0.037787437438964844, 0.04236793518066406, 0.04694843292236328, 0.0515289306640625, 0.05610942840576172, 0.06068992614746094, 0.06527042388916016, 0.06985092163085938, 0.0744314193725586, 0.07901191711425781, 0.08359241485595703, 0.08817291259765625, 0.09275341033935547, 0.09733390808105469, 0.1019144058227539, 0.10649490356445312, 0.11107540130615234, 0.11565589904785156, 0.12023639678955078, 0.12481689453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 16.0, 16.0, 27.0, 51.0, 88.0, 137.0, 391.0, 1194.0, 1348.0, 425.0, 184.0, 85.0, 37.0, 26.0, 10.0, 7.0, 14.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.037322998046875, -0.03625750541687012, -0.035192012786865234, -0.03412652015686035, -0.03306102752685547, -0.031995534896850586, -0.030930042266845703, -0.02986454963684082, -0.028799057006835938, -0.027733564376831055, -0.026668071746826172, -0.02560257911682129, -0.024537086486816406, -0.023471593856811523, -0.02240610122680664, -0.021340608596801758, -0.020275115966796875, -0.019209623336791992, -0.01814413070678711, -0.017078638076782227, -0.016013145446777344, -0.014947652816772461, -0.013882160186767578, -0.012816667556762695, -0.011751174926757812, -0.01068568229675293, -0.009620189666748047, -0.008554697036743164, -0.007489204406738281, -0.0064237117767333984, -0.005358219146728516, -0.004292726516723633, -0.00322723388671875, -0.002161741256713867, -0.0010962486267089844, -3.075599670410156e-05, 0.0010347366333007812, 0.002100229263305664, 0.003165721893310547, 0.00423121452331543, 0.0052967071533203125, 0.006362199783325195, 0.007427692413330078, 0.008493185043334961, 0.009558677673339844, 0.010624170303344727, 0.01168966293334961, 0.012755155563354492, 0.013820648193359375, 0.014886140823364258, 0.01595163345336914, 0.017017126083374023, 0.018082618713378906, 0.01914811134338379, 0.020213603973388672, 0.021279096603393555, 0.022344589233398438, 0.02341008186340332, 0.024475574493408203, 0.025541067123413086, 0.02660655975341797, 0.02767205238342285, 0.028737545013427734, 0.029803037643432617, 0.0308685302734375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 6.0, 9.0, 41.0, 152.0, 356.0, 286.0, 96.0, 33.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1932797133922577, -0.18109093606472015, -0.16890215873718262, -0.15671338140964508, -0.14452460408210754, -0.13233582675457, -0.12014704942703247, -0.10795827209949493, -0.0957694947719574, -0.08358071744441986, -0.07139194011688232, -0.05920316278934479, -0.04701438546180725, -0.034825608134269714, -0.022636830806732178, -0.010448053479194641, 0.0017407238483428955, 0.013929501175880432, 0.02611827850341797, 0.038307055830955505, 0.05049583315849304, 0.06268461048603058, 0.07487338781356812, 0.08706216514110565, 0.09925094246864319, 0.11143971979618073, 0.12362849712371826, 0.1358172744512558, 0.14800605177879333, 0.16019482910633087, 0.1723836064338684, 0.18457238376140594, 0.1967611312866211, 0.20894990861415863, 0.22113868594169617, 0.2333274632692337, 0.24551624059677124, 0.25770503282546997, 0.2698937952518463, 0.28208255767822266, 0.2942713499069214, 0.3064601421356201, 0.31864890456199646, 0.3308376669883728, 0.34302645921707153, 0.35521525144577026, 0.3674040138721466, 0.37959277629852295, 0.3917815685272217, 0.4039703607559204, 0.41615912318229675, 0.4283478856086731, 0.4405366778373718, 0.45272547006607056, 0.4649142324924469, 0.47710299491882324, 0.489291787147522, 0.5014805793762207, 0.5136693716049194, 0.5258581042289734, 0.5380468964576721, 0.5502356886863708, 0.5624244213104248, 0.5746132135391235, 0.5868020057678223]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 7.0, 4.0, 15.0, 16.0, 22.0, 14.0, 24.0, 32.0, 42.0, 30.0, 60.0, 57.0, 56.0, 51.0, 55.0, 52.0, 51.0, 64.0, 40.0, 46.0, 42.0, 45.0, 38.0, 39.0, 25.0, 17.0, 12.0, 10.0, 10.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.11041092872619629, -0.1073741763830185, -0.1043374314904213, -0.1013006865978241, -0.0982639342546463, -0.0952271819114685, -0.09219043701887131, -0.08915369212627411, -0.08611693978309631, -0.08308018743991852, -0.08004344254732132, -0.07700669765472412, -0.07396994531154633, -0.07093319296836853, -0.06789644807577133, -0.06485970318317413, -0.06182295083999634, -0.05878620222210884, -0.055749453604221344, -0.05271270498633385, -0.04967595636844635, -0.04663920775055885, -0.043602459132671356, -0.04056571051478386, -0.03752896189689636, -0.034492213279008865, -0.03145546466112137, -0.02841871604323387, -0.025381967425346375, -0.022345218807458878, -0.01930847018957138, -0.016271721571683884, -0.013234972953796387, -0.01019822433590889, -0.007161475718021393, -0.004124727100133896, -0.001087978482246399, 0.001948770135641098, 0.004985518753528595, 0.008022267371416092, 0.011059015989303589, 0.014095764607191086, 0.017132513225078583, 0.02016926184296608, 0.023206010460853577, 0.026242759078741074, 0.02927950769662857, 0.03231625631451607, 0.035353004932403564, 0.03838975355029106, 0.04142650216817856, 0.044463250786066055, 0.04749999940395355, 0.05053674802184105, 0.053573496639728546, 0.05661024525761604, 0.05964699387550354, 0.06268374621868134, 0.06572049111127853, 0.06875723600387573, 0.07179398834705353, 0.07483074069023132, 0.07786748558282852, 0.08090423047542572, 0.08394098281860352]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 13.0, 12.0, 18.0, 31.0, 32.0, 79.0, 144.0, 245.0, 497.0, 1101.0, 2667.0, 7992.0, 38550.0, 304644.0, 577814.0, 92413.0, 15052.0, 4159.0, 1611.0, 729.0, 305.0, 170.0, 105.0, 57.0, 32.0, 28.0, 17.0, 13.0, 6.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08953857421875, -0.08675956726074219, -0.08398056030273438, -0.08120155334472656, -0.07842254638671875, -0.07564353942871094, -0.07286453247070312, -0.07008552551269531, -0.0673065185546875, -0.06452751159667969, -0.061748504638671875, -0.05896949768066406, -0.05619049072265625, -0.05341148376464844, -0.050632476806640625, -0.04785346984863281, -0.045074462890625, -0.04229545593261719, -0.039516448974609375, -0.03673744201660156, -0.03395843505859375, -0.031179428100585938, -0.028400421142578125, -0.025621414184570312, -0.0228424072265625, -0.020063400268554688, -0.017284393310546875, -0.014505386352539062, -0.01172637939453125, -0.008947372436523438, -0.006168365478515625, -0.0033893585205078125, -0.0006103515625, 0.0021686553955078125, 0.004947662353515625, 0.0077266693115234375, 0.01050567626953125, 0.013284683227539062, 0.016063690185546875, 0.018842697143554688, 0.0216217041015625, 0.024400711059570312, 0.027179718017578125, 0.029958724975585938, 0.03273773193359375, 0.03551673889160156, 0.038295745849609375, 0.04107475280761719, 0.043853759765625, 0.04663276672363281, 0.049411773681640625, 0.05219078063964844, 0.05496978759765625, 0.05774879455566406, 0.060527801513671875, 0.06330680847167969, 0.0660858154296875, 0.06886482238769531, 0.07164382934570312, 0.07442283630371094, 0.07720184326171875, 0.07998085021972656, 0.08275985717773438, 0.08553886413574219, 0.08831787109375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 9.0, 11.0, 18.0, 19.0, 25.0, 28.0, 32.0, 42.0, 59.0, 71.0, 61.0, 69.0, 69.0, 70.0, 75.0, 69.0, 44.0, 33.0, 38.0, 41.0, 25.0, 30.0, 15.0, 13.0, 9.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01430511474609375, -0.013768792152404785, -0.01323246955871582, -0.012696146965026855, -0.01215982437133789, -0.011623501777648926, -0.011087179183959961, -0.010550856590270996, -0.010014533996582031, -0.009478211402893066, -0.008941888809204102, -0.008405566215515137, -0.007869243621826172, -0.007332921028137207, -0.006796598434448242, -0.006260275840759277, -0.0057239532470703125, -0.005187630653381348, -0.004651308059692383, -0.004114985466003418, -0.003578662872314453, -0.0030423402786254883, -0.0025060176849365234, -0.0019696950912475586, -0.0014333724975585938, -0.0008970499038696289, -0.00036072731018066406, 0.00017559528350830078, 0.0007119178771972656, 0.0012482404708862305, 0.0017845630645751953, 0.00232088565826416, 0.002857208251953125, 0.00339353084564209, 0.003929853439331055, 0.0044661760330200195, 0.005002498626708984, 0.005538821220397949, 0.006075143814086914, 0.006611466407775879, 0.007147789001464844, 0.007684111595153809, 0.008220434188842773, 0.008756756782531738, 0.009293079376220703, 0.009829401969909668, 0.010365724563598633, 0.010902047157287598, 0.011438369750976562, 0.011974692344665527, 0.012511014938354492, 0.013047337532043457, 0.013583660125732422, 0.014119982719421387, 0.014656305313110352, 0.015192627906799316, 0.01572895050048828, 0.016265273094177246, 0.01680159568786621, 0.017337918281555176, 0.01787424087524414, 0.018410563468933105, 0.01894688606262207, 0.019483208656311035, 0.02001953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 9.0, 8.0, 18.0, 26.0, 59.0, 94.0, 169.0, 349.0, 750.0, 1476.0, 3300.0, 8131.0, 27540.0, 119912.0, 430009.0, 342710.0, 82479.0, 19951.0, 6457.0, 2564.0, 1256.0, 619.0, 324.0, 161.0, 72.0, 43.0, 24.0, 16.0, 6.0, 4.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0550537109375, -0.05342864990234375, -0.0518035888671875, -0.05017852783203125, -0.048553466796875, -0.04692840576171875, -0.0453033447265625, -0.04367828369140625, -0.04205322265625, -0.04042816162109375, -0.0388031005859375, -0.03717803955078125, -0.035552978515625, -0.03392791748046875, -0.0323028564453125, -0.03067779541015625, -0.029052734375, -0.02742767333984375, -0.0258026123046875, -0.02417755126953125, -0.022552490234375, -0.02092742919921875, -0.0193023681640625, -0.01767730712890625, -0.01605224609375, -0.01442718505859375, -0.0128021240234375, -0.01117706298828125, -0.009552001953125, -0.00792694091796875, -0.0063018798828125, -0.00467681884765625, -0.0030517578125, -0.00142669677734375, 0.0001983642578125, 0.00182342529296875, 0.003448486328125, 0.00507354736328125, 0.0066986083984375, 0.00832366943359375, 0.00994873046875, 0.01157379150390625, 0.0131988525390625, 0.01482391357421875, 0.016448974609375, 0.01807403564453125, 0.0196990966796875, 0.02132415771484375, 0.02294921875, 0.02457427978515625, 0.0261993408203125, 0.02782440185546875, 0.029449462890625, 0.03107452392578125, 0.0326995849609375, 0.03432464599609375, 0.03594970703125, 0.03757476806640625, 0.0391998291015625, 0.04082489013671875, 0.042449951171875, 0.04407501220703125, 0.0457000732421875, 0.04732513427734375, 0.0489501953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 0.0, 11.0, 12.0, 18.0, 16.0, 17.0, 17.0, 31.0, 19.0, 31.0, 32.0, 31.0, 30.0, 36.0, 47.0, 32.0, 53.0, 60.0, 41.0, 42.0, 48.0, 60.0, 30.0, 46.0, 34.0, 29.0, 22.0, 24.0, 15.0, 26.0, 17.0, 18.0, 10.0, 9.0, 3.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0526123046875, -0.05117654800415039, -0.04974079132080078, -0.04830503463745117, -0.04686927795410156, -0.04543352127075195, -0.043997764587402344, -0.042562007904052734, -0.041126251220703125, -0.039690494537353516, -0.038254737854003906, -0.0368189811706543, -0.03538322448730469, -0.03394746780395508, -0.03251171112060547, -0.03107595443725586, -0.02964019775390625, -0.02820444107055664, -0.02676868438720703, -0.025332927703857422, -0.023897171020507812, -0.022461414337158203, -0.021025657653808594, -0.019589900970458984, -0.018154144287109375, -0.016718387603759766, -0.015282630920410156, -0.013846874237060547, -0.012411117553710938, -0.010975360870361328, -0.009539604187011719, -0.00810384750366211, -0.0066680908203125, -0.005232334136962891, -0.0037965774536132812, -0.002360820770263672, -0.0009250640869140625, 0.0005106925964355469, 0.0019464492797851562, 0.0033822059631347656, 0.004817962646484375, 0.006253719329833984, 0.007689476013183594, 0.009125232696533203, 0.010560989379882812, 0.011996746063232422, 0.013432502746582031, 0.01486825942993164, 0.01630401611328125, 0.01773977279663086, 0.01917552947998047, 0.020611286163330078, 0.022047042846679688, 0.023482799530029297, 0.024918556213378906, 0.026354312896728516, 0.027790069580078125, 0.029225826263427734, 0.030661582946777344, 0.03209733963012695, 0.03353309631347656, 0.03496885299682617, 0.03640460968017578, 0.03784036636352539, 0.039276123046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 11.0, 12.0, 17.0, 34.0, 48.0, 94.0, 157.0, 256.0, 507.0, 882.0, 2004.0, 5031.0, 16700.0, 75315.0, 359686.0, 447183.0, 106904.0, 22343.0, 6550.0, 2416.0, 1081.0, 547.0, 315.0, 215.0, 96.0, 63.0, 33.0, 22.0, 12.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244903564453125, -0.023792743682861328, -0.023095130920410156, -0.022397518157958984, -0.021699905395507812, -0.02100229263305664, -0.02030467987060547, -0.019607067108154297, -0.018909454345703125, -0.018211841583251953, -0.01751422882080078, -0.01681661605834961, -0.016119003295898438, -0.015421390533447266, -0.014723777770996094, -0.014026165008544922, -0.01332855224609375, -0.012630939483642578, -0.011933326721191406, -0.011235713958740234, -0.010538101196289062, -0.00984048843383789, -0.009142875671386719, -0.008445262908935547, -0.007747650146484375, -0.007050037384033203, -0.006352424621582031, -0.005654811859130859, -0.0049571990966796875, -0.004259586334228516, -0.0035619735717773438, -0.002864360809326172, -0.002166748046875, -0.0014691352844238281, -0.0007715225219726562, -7.390975952148438e-05, 0.0006237030029296875, 0.0013213157653808594, 0.0020189285278320312, 0.002716541290283203, 0.003414154052734375, 0.004111766815185547, 0.004809379577636719, 0.005506992340087891, 0.0062046051025390625, 0.006902217864990234, 0.007599830627441406, 0.008297443389892578, 0.00899505615234375, 0.009692668914794922, 0.010390281677246094, 0.011087894439697266, 0.011785507202148438, 0.01248311996459961, 0.013180732727050781, 0.013878345489501953, 0.014575958251953125, 0.015273571014404297, 0.01597118377685547, 0.01666879653930664, 0.017366409301757812, 0.018064022064208984, 0.018761634826660156, 0.019459247589111328, 0.0201568603515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 9.0, 12.0, 13.0, 15.0, 23.0, 33.0, 38.0, 48.0, 56.0, 64.0, 73.0, 80.0, 72.0, 69.0, 74.0, 71.0, 64.0, 48.0, 33.0, 26.0, 22.0, 12.0, 16.0, 13.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.119510650634766e-06, -8.888542652130127e-06, -8.657574653625488e-06, -8.42660665512085e-06, -8.195638656616211e-06, -7.964670658111572e-06, -7.733702659606934e-06, -7.502734661102295e-06, -7.271766662597656e-06, -7.040798664093018e-06, -6.809830665588379e-06, -6.57886266708374e-06, -6.3478946685791016e-06, -6.116926670074463e-06, -5.885958671569824e-06, -5.6549906730651855e-06, -5.424022674560547e-06, -5.193054676055908e-06, -4.9620866775512695e-06, -4.731118679046631e-06, -4.500150680541992e-06, -4.2691826820373535e-06, -4.038214683532715e-06, -3.807246685028076e-06, -3.5762786865234375e-06, -3.345310688018799e-06, -3.11434268951416e-06, -2.8833746910095215e-06, -2.652406692504883e-06, -2.421438694000244e-06, -2.1904706954956055e-06, -1.959502696990967e-06, -1.7285346984863281e-06, -1.4975666999816895e-06, -1.2665987014770508e-06, -1.0356307029724121e-06, -8.046627044677734e-07, -5.736947059631348e-07, -3.427267074584961e-07, -1.1175870895385742e-07, 1.1920928955078125e-07, 3.501772880554199e-07, 5.811452865600586e-07, 8.121132850646973e-07, 1.043081283569336e-06, 1.2740492820739746e-06, 1.5050172805786133e-06, 1.735985279083252e-06, 1.9669532775878906e-06, 2.1979212760925293e-06, 2.428889274597168e-06, 2.6598572731018066e-06, 2.8908252716064453e-06, 3.121793270111084e-06, 3.3527612686157227e-06, 3.5837292671203613e-06, 3.814697265625e-06, 4.045665264129639e-06, 4.276633262634277e-06, 4.507601261138916e-06, 4.738569259643555e-06, 4.969537258148193e-06, 5.200505256652832e-06, 5.431473255157471e-06, 5.662441253662109e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 9.0, 4.0, 7.0, 12.0, 28.0, 38.0, 75.0, 153.0, 273.0, 514.0, 1177.0, 3036.0, 10084.0, 45920.0, 252489.0, 522023.0, 170170.0, 30911.0, 7445.0, 2336.0, 952.0, 421.0, 224.0, 100.0, 57.0, 40.0, 17.0, 20.0, 8.0, 9.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015472412109375, -0.014780998229980469, -0.014089584350585938, -0.013398170471191406, -0.012706756591796875, -0.012015342712402344, -0.011323928833007812, -0.010632514953613281, -0.00994110107421875, -0.009249687194824219, -0.008558273315429688, -0.007866859436035156, -0.007175445556640625, -0.006484031677246094, -0.0057926177978515625, -0.005101203918457031, -0.0044097900390625, -0.0037183761596679688, -0.0030269622802734375, -0.0023355484008789062, -0.001644134521484375, -0.0009527206420898438, -0.0002613067626953125, 0.00043010711669921875, 0.00112152099609375, 0.0018129348754882812, 0.0025043487548828125, 0.0031957626342773438, 0.003887176513671875, 0.004578590393066406, 0.0052700042724609375, 0.005961418151855469, 0.00665283203125, 0.007344245910644531, 0.008035659790039062, 0.008727073669433594, 0.009418487548828125, 0.010109901428222656, 0.010801315307617188, 0.011492729187011719, 0.01218414306640625, 0.012875556945800781, 0.013566970825195312, 0.014258384704589844, 0.014949798583984375, 0.015641212463378906, 0.016332626342773438, 0.01702404022216797, 0.0177154541015625, 0.01840686798095703, 0.019098281860351562, 0.019789695739746094, 0.020481109619140625, 0.021172523498535156, 0.021863937377929688, 0.02255535125732422, 0.02324676513671875, 0.02393817901611328, 0.024629592895507812, 0.025321006774902344, 0.026012420654296875, 0.026703834533691406, 0.027395248413085938, 0.02808666229248047, 0.028778076171875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 2.0, 8.0, 15.0, 14.0, 19.0, 39.0, 39.0, 67.0, 62.0, 76.0, 78.0, 63.0, 85.0, 97.0, 66.0, 64.0, 58.0, 41.0, 36.0, 19.0, 13.0, 11.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01299285888671875, -0.01231372356414795, -0.011634588241577148, -0.010955452919006348, -0.010276317596435547, -0.009597182273864746, -0.008918046951293945, -0.008238911628723145, -0.007559776306152344, -0.006880640983581543, -0.006201505661010742, -0.005522370338439941, -0.004843235015869141, -0.00416409969329834, -0.003484964370727539, -0.0028058290481567383, -0.0021266937255859375, -0.0014475584030151367, -0.0007684230804443359, -8.928775787353516e-05, 0.0005898475646972656, 0.0012689828872680664, 0.0019481182098388672, 0.002627253532409668, 0.0033063888549804688, 0.0039855241775512695, 0.00466465950012207, 0.005343794822692871, 0.006022930145263672, 0.006702065467834473, 0.0073812007904052734, 0.008060336112976074, 0.008739471435546875, 0.009418606758117676, 0.010097742080688477, 0.010776877403259277, 0.011456012725830078, 0.012135148048400879, 0.01281428337097168, 0.01349341869354248, 0.014172554016113281, 0.014851689338684082, 0.015530824661254883, 0.016209959983825684, 0.016889095306396484, 0.017568230628967285, 0.018247365951538086, 0.018926501274108887, 0.019605636596679688, 0.02028477191925049, 0.02096390724182129, 0.02164304256439209, 0.02232217788696289, 0.02300131320953369, 0.023680448532104492, 0.024359583854675293, 0.025038719177246094, 0.025717854499816895, 0.026396989822387695, 0.027076125144958496, 0.027755260467529297, 0.028434395790100098, 0.0291135311126709, 0.0297926664352417, 0.0304718017578125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 14.0, 49.0, 100.0, 215.0, 261.0, 214.0, 100.0, 37.0, 14.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.006171464920044, -0.984614908695221, -0.9630584120750427, -0.9415018558502197, -0.9199453592300415, -0.8983888030052185, -0.8768322467803955, -0.8552757501602173, -0.8337192535400391, -0.8121626973152161, -0.7906062006950378, -0.7690496444702148, -0.7474931478500366, -0.7259365916252136, -0.7043800354003906, -0.6828235387802124, -0.6612669825553894, -0.6397104263305664, -0.6181539297103882, -0.5965973734855652, -0.575040876865387, -0.553484320640564, -0.5319278240203857, -0.5103712677955627, -0.48881474137306213, -0.4672582149505615, -0.4457016885280609, -0.4241451621055603, -0.4025886058807373, -0.3810321092605591, -0.3594755530357361, -0.3379190266132355, -0.31636252999305725, -0.29480600357055664, -0.27324947714805603, -0.2516929507255554, -0.23013640940189362, -0.208579882979393, -0.1870233416557312, -0.1654668152332306, -0.14391028881072998, -0.12235376238822937, -0.10079722851514816, -0.07924069464206696, -0.057684168219566345, -0.036127641797065735, -0.01457110047340393, 0.00698542594909668, 0.02854195237159729, 0.0500984825193882, 0.07165501266717911, 0.09321154654026031, 0.11476807296276093, 0.13632459938526154, 0.15788114070892334, 0.17943766713142395, 0.20099419355392456, 0.22255071997642517, 0.24410724639892578, 0.2656638026237488, 0.287220299243927, 0.30877685546875, 0.3303333818912506, 0.3518899083137512, 0.37344643473625183]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 11.0, 9.0, 11.0, 9.0, 13.0, 23.0, 16.0, 18.0, 25.0, 29.0, 29.0, 38.0, 43.0, 41.0, 44.0, 44.0, 52.0, 50.0, 48.0, 48.0, 47.0, 55.0, 35.0, 42.0, 35.0, 27.0, 26.0, 26.0, 27.0, 20.0, 14.0, 14.0, 3.0, 12.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21193480491638184, -0.2048100084066391, -0.19768521189689636, -0.19056040048599243, -0.1834356039762497, -0.17631080746650696, -0.16918599605560303, -0.1620611995458603, -0.15493640303611755, -0.14781160652637482, -0.14068681001663208, -0.13356199860572815, -0.1264372020959854, -0.11931240558624268, -0.11218760162591934, -0.10506279766559601, -0.09793800115585327, -0.09081320464611053, -0.0836884006857872, -0.07656359672546387, -0.06943880021572113, -0.062313999980688095, -0.05518919974565506, -0.048064399510622025, -0.04093959927558899, -0.033814799040555954, -0.02668999880552292, -0.019565198570489883, -0.012440398335456848, -0.005315598100423813, 0.0018092021346092224, 0.008934002369642258, 0.016058802604675293, 0.023183602839708328, 0.030308403074741364, 0.0374332033097744, 0.044558003544807434, 0.05168280377984047, 0.058807604014873505, 0.06593240797519684, 0.07305720448493958, 0.08018200099468231, 0.08730680495500565, 0.09443160891532898, 0.10155640542507172, 0.10868120193481445, 0.11580600589513779, 0.12293080985546112, 0.13005560636520386, 0.1371804028749466, 0.14430519938468933, 0.15143001079559326, 0.158554807305336, 0.16567960381507874, 0.17280441522598267, 0.1799292117357254, 0.18705400824546814, 0.19417880475521088, 0.2013036012649536, 0.20842841267585754, 0.21555320918560028, 0.22267800569534302, 0.22980281710624695, 0.23692761361598969, 0.24405241012573242]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 6.0, 2.0, 19.0, 20.0, 28.0, 34.0, 42.0, 59.0, 90.0, 119.0, 188.0, 277.0, 486.0, 992.0, 2093.0, 5383.0, 18588.0, 115589.0, 3751542.0, 257749.0, 28279.0, 7274.0, 2729.0, 1144.0, 582.0, 313.0, 204.0, 130.0, 102.0, 58.0, 55.0, 34.0, 19.0, 20.0, 11.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.09796142578125, -0.0955510139465332, -0.0931406021118164, -0.09073019027709961, -0.08831977844238281, -0.08590936660766602, -0.08349895477294922, -0.08108854293823242, -0.07867813110351562, -0.07626771926879883, -0.07385730743408203, -0.07144689559936523, -0.06903648376464844, -0.06662607192993164, -0.06421566009521484, -0.06180524826049805, -0.05939483642578125, -0.05698442459106445, -0.054574012756347656, -0.05216360092163086, -0.04975318908691406, -0.047342777252197266, -0.04493236541748047, -0.04252195358276367, -0.040111541748046875, -0.03770112991333008, -0.03529071807861328, -0.032880306243896484, -0.030469894409179688, -0.02805948257446289, -0.025649070739746094, -0.023238658905029297, -0.0208282470703125, -0.018417835235595703, -0.016007423400878906, -0.01359701156616211, -0.011186599731445312, -0.008776187896728516, -0.006365776062011719, -0.003955364227294922, -0.001544952392578125, 0.0008654594421386719, 0.0032758712768554688, 0.005686283111572266, 0.008096694946289062, 0.01050710678100586, 0.012917518615722656, 0.015327930450439453, 0.01773834228515625, 0.020148754119873047, 0.022559165954589844, 0.02496957778930664, 0.027379989624023438, 0.029790401458740234, 0.03220081329345703, 0.03461122512817383, 0.037021636962890625, 0.03943204879760742, 0.04184246063232422, 0.044252872467041016, 0.04666328430175781, 0.04907369613647461, 0.051484107971191406, 0.0538945198059082, 0.056304931640625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 15.0, 10.0, 12.0, 16.0, 27.0, 23.0, 27.0, 43.0, 56.0, 42.0, 49.0, 68.0, 86.0, 69.0, 64.0, 69.0, 67.0, 50.0, 30.0, 36.0, 29.0, 23.0, 17.0, 23.0, 12.0, 10.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01435089111328125, -0.013805031776428223, -0.013259172439575195, -0.012713313102722168, -0.01216745376586914, -0.011621594429016113, -0.011075735092163086, -0.010529875755310059, -0.009984016418457031, -0.009438157081604004, -0.008892297744750977, -0.00834643840789795, -0.007800579071044922, -0.0072547197341918945, -0.006708860397338867, -0.00616300106048584, -0.0056171417236328125, -0.005071282386779785, -0.004525423049926758, -0.0039795637130737305, -0.003433704376220703, -0.0028878450393676758, -0.0023419857025146484, -0.001796126365661621, -0.0012502670288085938, -0.0007044076919555664, -0.00015854835510253906, 0.0003873109817504883, 0.0009331703186035156, 0.001479029655456543, 0.0020248889923095703, 0.0025707483291625977, 0.003116607666015625, 0.0036624670028686523, 0.00420832633972168, 0.004754185676574707, 0.005300045013427734, 0.005845904350280762, 0.006391763687133789, 0.006937623023986816, 0.007483482360839844, 0.008029341697692871, 0.008575201034545898, 0.009121060371398926, 0.009666919708251953, 0.01021277904510498, 0.010758638381958008, 0.011304497718811035, 0.011850357055664062, 0.01239621639251709, 0.012942075729370117, 0.013487935066223145, 0.014033794403076172, 0.0145796537399292, 0.015125513076782227, 0.015671372413635254, 0.01621723175048828, 0.01676309108734131, 0.017308950424194336, 0.017854809761047363, 0.01840066909790039, 0.018946528434753418, 0.019492387771606445, 0.020038247108459473, 0.0205841064453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 8.0, 25.0, 28.0, 32.0, 59.0, 79.0, 104.0, 142.0, 229.0, 369.0, 578.0, 979.0, 1955.0, 4066.0, 11368.0, 43580.0, 434535.0, 3535151.0, 125012.0, 22724.0, 6712.0, 2844.0, 1392.0, 837.0, 505.0, 274.0, 200.0, 141.0, 104.0, 72.0, 50.0, 43.0, 30.0, 11.0, 14.0, 6.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0618896484375, -0.05962085723876953, -0.05735206604003906, -0.055083274841308594, -0.052814483642578125, -0.050545692443847656, -0.04827690124511719, -0.04600811004638672, -0.04373931884765625, -0.04147052764892578, -0.03920173645019531, -0.036932945251464844, -0.034664154052734375, -0.032395362854003906, -0.030126571655273438, -0.02785778045654297, -0.0255889892578125, -0.02332019805908203, -0.021051406860351562, -0.018782615661621094, -0.016513824462890625, -0.014245033264160156, -0.011976242065429688, -0.009707450866699219, -0.00743865966796875, -0.005169868469238281, -0.0029010772705078125, -0.0006322860717773438, 0.001636505126953125, 0.0039052963256835938, 0.0061740875244140625, 0.008442878723144531, 0.010711669921875, 0.012980461120605469, 0.015249252319335938, 0.017518043518066406, 0.019786834716796875, 0.022055625915527344, 0.024324417114257812, 0.02659320831298828, 0.02886199951171875, 0.03113079071044922, 0.03339958190917969, 0.035668373107910156, 0.037937164306640625, 0.040205955505371094, 0.04247474670410156, 0.04474353790283203, 0.0470123291015625, 0.04928112030029297, 0.05154991149902344, 0.053818702697753906, 0.056087493896484375, 0.058356285095214844, 0.06062507629394531, 0.06289386749267578, 0.06516265869140625, 0.06743144989013672, 0.06970024108886719, 0.07196903228759766, 0.07423782348632812, 0.0765066146850586, 0.07877540588378906, 0.08104419708251953, 0.08331298828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 10.0, 13.0, 32.0, 46.0, 94.0, 186.0, 555.0, 2116.0, 562.0, 228.0, 82.0, 51.0, 25.0, 15.0, 11.0, 14.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03118896484375, -0.03013324737548828, -0.029077529907226562, -0.028021812438964844, -0.026966094970703125, -0.025910377502441406, -0.024854660034179688, -0.02379894256591797, -0.02274322509765625, -0.02168750762939453, -0.020631790161132812, -0.019576072692871094, -0.018520355224609375, -0.017464637756347656, -0.016408920288085938, -0.015353202819824219, -0.0142974853515625, -0.013241767883300781, -0.012186050415039062, -0.011130332946777344, -0.010074615478515625, -0.009018898010253906, -0.007963180541992188, -0.006907463073730469, -0.00585174560546875, -0.004796028137207031, -0.0037403106689453125, -0.0026845932006835938, -0.001628875732421875, -0.0005731582641601562, 0.0004825592041015625, 0.0015382766723632812, 0.002593994140625, 0.0036497116088867188, 0.0047054290771484375, 0.005761146545410156, 0.006816864013671875, 0.007872581481933594, 0.008928298950195312, 0.009984016418457031, 0.01103973388671875, 0.012095451354980469, 0.013151168823242188, 0.014206886291503906, 0.015262603759765625, 0.016318321228027344, 0.017374038696289062, 0.01842975616455078, 0.0194854736328125, 0.02054119110107422, 0.021596908569335938, 0.022652626037597656, 0.023708343505859375, 0.024764060974121094, 0.025819778442382812, 0.02687549591064453, 0.02793121337890625, 0.02898693084716797, 0.030042648315429688, 0.031098365783691406, 0.032154083251953125, 0.033209800720214844, 0.03426551818847656, 0.03532123565673828, 0.036376953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 11.0, 106.0, 363.0, 391.0, 104.0, 16.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23375248908996582, -0.21816407144069672, -0.20257563889026642, -0.18698722124099731, -0.17139878869056702, -0.1558103710412979, -0.1402219533920288, -0.12463352829217911, -0.1090451031923294, -0.0934566780924797, -0.07786825299263, -0.0622798353433609, -0.0466914102435112, -0.0311029851436615, -0.015514567494392395, 7.385760545730591e-05, 0.015662282705307007, 0.03125070780515671, 0.04683912917971611, 0.06242755055427551, 0.07801597565412521, 0.09360440075397491, 0.10919281840324402, 0.12478124350309372, 0.14036966860294342, 0.15595808625221252, 0.17154651880264282, 0.18713493645191193, 0.20272335410118103, 0.21831178665161133, 0.23390020430088043, 0.24948862195014954, 0.26507705450057983, 0.28066548705101013, 0.29625388979911804, 0.31184232234954834, 0.32743075489997864, 0.34301918745040894, 0.35860759019851685, 0.37419602274894714, 0.38978445529937744, 0.40537288784980774, 0.42096129059791565, 0.43654972314834595, 0.45213815569877625, 0.46772658824920654, 0.48331499099731445, 0.49890342354774475, 0.5144917964935303, 0.5300801992416382, 0.5456686615943909, 0.5612570643424988, 0.5768454670906067, 0.5924339294433594, 0.6080223321914673, 0.6236107349395752, 0.6391991972923279, 0.6547876000404358, 0.6703760623931885, 0.6859644651412964, 0.7015528678894043, 0.717141330242157, 0.7327297329902649, 0.7483181357383728, 0.7639065980911255]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 5.0, 11.0, 9.0, 18.0, 22.0, 32.0, 31.0, 28.0, 38.0, 42.0, 35.0, 53.0, 70.0, 68.0, 54.0, 46.0, 59.0, 40.0, 49.0, 37.0, 49.0, 44.0, 23.0, 27.0, 24.0, 16.0, 14.0, 8.0, 9.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07100558280944824, -0.06855235993862152, -0.0660991445183754, -0.06364592909812927, -0.06119270622730255, -0.05873948708176613, -0.056286267936229706, -0.05383304879069328, -0.05137982964515686, -0.04892661049962044, -0.046473391354084015, -0.04402017220854759, -0.04156695306301117, -0.03911373391747475, -0.036660514771938324, -0.0342072956264019, -0.03175407648086548, -0.029300857335329056, -0.026847638189792633, -0.02439441904425621, -0.021941199898719788, -0.019487980753183365, -0.017034761607646942, -0.01458154246211052, -0.012128323316574097, -0.009675104171037674, -0.007221885025501251, -0.0047686658799648285, -0.0023154467344284058, 0.00013777241110801697, 0.0025909915566444397, 0.005044210702180862, 0.007497429847717285, 0.009950648993253708, 0.01240386813879013, 0.014857087284326553, 0.017310306429862976, 0.0197635255753994, 0.02221674472093582, 0.024669963866472244, 0.027123183012008667, 0.02957640215754509, 0.03202962130308151, 0.034482840448617935, 0.03693605959415436, 0.03938927873969078, 0.0418424978852272, 0.044295717030763626, 0.04674893617630005, 0.04920215532183647, 0.051655374467372894, 0.05410859361290932, 0.05656181275844574, 0.05901503190398216, 0.061468251049518585, 0.06392146646976471, 0.06637468934059143, 0.06882791221141815, 0.07128112763166428, 0.0737343430519104, 0.07618756592273712, 0.07864078879356384, 0.08109400421380997, 0.08354721963405609, 0.08600044250488281]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 3.0, 6.0, 5.0, 4.0, 5.0, 14.0, 26.0, 27.0, 47.0, 82.0, 153.0, 243.0, 404.0, 633.0, 1229.0, 2479.0, 5225.0, 12622.0, 33630.0, 95440.0, 241992.0, 340985.0, 195571.0, 72864.0, 25938.0, 10009.0, 4294.0, 2079.0, 1045.0, 611.0, 331.0, 192.0, 120.0, 72.0, 50.0, 30.0, 30.0, 18.0, 15.0, 8.0, 11.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.04888916015625, -0.04746675491333008, -0.046044349670410156, -0.044621944427490234, -0.04319953918457031, -0.04177713394165039, -0.04035472869873047, -0.03893232345581055, -0.037509918212890625, -0.0360875129699707, -0.03466510772705078, -0.03324270248413086, -0.03182029724121094, -0.030397891998291016, -0.028975486755371094, -0.027553081512451172, -0.02613067626953125, -0.024708271026611328, -0.023285865783691406, -0.021863460540771484, -0.020441055297851562, -0.01901865005493164, -0.01759624481201172, -0.016173839569091797, -0.014751434326171875, -0.013329029083251953, -0.011906623840332031, -0.01048421859741211, -0.009061813354492188, -0.007639408111572266, -0.006217002868652344, -0.004794597625732422, -0.0033721923828125, -0.0019497871398925781, -0.0005273818969726562, 0.0008950233459472656, 0.0023174285888671875, 0.0037398338317871094, 0.005162239074707031, 0.006584644317626953, 0.008007049560546875, 0.009429454803466797, 0.010851860046386719, 0.01227426528930664, 0.013696670532226562, 0.015119075775146484, 0.016541481018066406, 0.017963886260986328, 0.01938629150390625, 0.020808696746826172, 0.022231101989746094, 0.023653507232666016, 0.025075912475585938, 0.02649831771850586, 0.02792072296142578, 0.029343128204345703, 0.030765533447265625, 0.03218793869018555, 0.03361034393310547, 0.03503274917602539, 0.03645515441894531, 0.037877559661865234, 0.039299964904785156, 0.04072237014770508, 0.042144775390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 11.0, 12.0, 11.0, 18.0, 31.0, 36.0, 32.0, 39.0, 56.0, 55.0, 53.0, 59.0, 61.0, 77.0, 54.0, 58.0, 41.0, 56.0, 39.0, 38.0, 25.0, 27.0, 18.0, 19.0, 12.0, 18.0, 7.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01517486572265625, -0.014615178108215332, -0.014055490493774414, -0.013495802879333496, -0.012936115264892578, -0.01237642765045166, -0.011816740036010742, -0.011257052421569824, -0.010697364807128906, -0.010137677192687988, -0.00957798957824707, -0.009018301963806152, -0.008458614349365234, -0.007898926734924316, -0.0073392391204833984, -0.0067795515060424805, -0.0062198638916015625, -0.0056601762771606445, -0.0051004886627197266, -0.004540801048278809, -0.003981113433837891, -0.0034214258193969727, -0.0028617382049560547, -0.0023020505905151367, -0.0017423629760742188, -0.0011826753616333008, -0.0006229877471923828, -6.330013275146484e-05, 0.0004963874816894531, 0.001056075096130371, 0.001615762710571289, 0.002175450325012207, 0.002735137939453125, 0.003294825553894043, 0.003854513168334961, 0.004414200782775879, 0.004973888397216797, 0.005533576011657715, 0.006093263626098633, 0.006652951240539551, 0.007212638854980469, 0.007772326469421387, 0.008332014083862305, 0.008891701698303223, 0.00945138931274414, 0.010011076927185059, 0.010570764541625977, 0.011130452156066895, 0.011690139770507812, 0.01224982738494873, 0.012809514999389648, 0.013369202613830566, 0.013928890228271484, 0.014488577842712402, 0.01504826545715332, 0.015607953071594238, 0.016167640686035156, 0.016727328300476074, 0.017287015914916992, 0.01784670352935791, 0.018406391143798828, 0.018966078758239746, 0.019525766372680664, 0.020085453987121582, 0.0206451416015625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 6.0, 10.0, 12.0, 29.0, 28.0, 30.0, 33.0, 61.0, 69.0, 83.0, 149.0, 228.0, 338.0, 691.0, 1324.0, 2885.0, 7318.0, 20685.0, 69097.0, 225225.0, 398249.0, 221432.0, 67462.0, 20207.0, 6892.0, 2901.0, 1309.0, 700.0, 365.0, 218.0, 135.0, 96.0, 68.0, 54.0, 37.0, 21.0, 13.0, 18.0, 12.0, 12.0, 9.0, 9.0, 2.0, 7.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0443115234375, -0.04294776916503906, -0.041584014892578125, -0.04022026062011719, -0.03885650634765625, -0.03749275207519531, -0.036128997802734375, -0.03476524353027344, -0.0334014892578125, -0.03203773498535156, -0.030673980712890625, -0.029310226440429688, -0.02794647216796875, -0.026582717895507812, -0.025218963623046875, -0.023855209350585938, -0.022491455078125, -0.021127700805664062, -0.019763946533203125, -0.018400192260742188, -0.01703643798828125, -0.015672683715820312, -0.014308929443359375, -0.012945175170898438, -0.0115814208984375, -0.010217666625976562, -0.008853912353515625, -0.0074901580810546875, -0.00612640380859375, -0.0047626495361328125, -0.003398895263671875, -0.0020351409912109375, -0.00067138671875, 0.0006923675537109375, 0.002056121826171875, 0.0034198760986328125, 0.00478363037109375, 0.0061473846435546875, 0.007511138916015625, 0.008874893188476562, 0.0102386474609375, 0.011602401733398438, 0.012966156005859375, 0.014329910278320312, 0.01569366455078125, 0.017057418823242188, 0.018421173095703125, 0.019784927368164062, 0.021148681640625, 0.022512435913085938, 0.023876190185546875, 0.025239944458007812, 0.02660369873046875, 0.027967453002929688, 0.029331207275390625, 0.030694961547851562, 0.0320587158203125, 0.03342247009277344, 0.034786224365234375, 0.03614997863769531, 0.03751373291015625, 0.03887748718261719, 0.040241241455078125, 0.04160499572753906, 0.04296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 5.0, 11.0, 9.0, 17.0, 25.0, 24.0, 25.0, 29.0, 28.0, 31.0, 48.0, 38.0, 36.0, 58.0, 48.0, 51.0, 37.0, 45.0, 48.0, 50.0, 41.0, 50.0, 30.0, 30.0, 33.0, 27.0, 23.0, 22.0, 12.0, 14.0, 16.0, 5.0, 8.0, 1.0, 3.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0732421875, -0.07119894027709961, -0.06915569305419922, -0.06711244583129883, -0.06506919860839844, -0.06302595138549805, -0.060982704162597656, -0.058939456939697266, -0.056896209716796875, -0.054852962493896484, -0.052809715270996094, -0.0507664680480957, -0.04872322082519531, -0.04667997360229492, -0.04463672637939453, -0.04259347915649414, -0.04055023193359375, -0.03850698471069336, -0.03646373748779297, -0.03442049026489258, -0.03237724304199219, -0.030333995819091797, -0.028290748596191406, -0.026247501373291016, -0.024204254150390625, -0.022161006927490234, -0.020117759704589844, -0.018074512481689453, -0.016031265258789062, -0.013988018035888672, -0.011944770812988281, -0.00990152359008789, -0.0078582763671875, -0.005815029144287109, -0.0037717819213867188, -0.0017285346984863281, 0.0003147125244140625, 0.002357959747314453, 0.004401206970214844, 0.006444454193115234, 0.008487701416015625, 0.010530948638916016, 0.012574195861816406, 0.014617443084716797, 0.016660690307617188, 0.018703937530517578, 0.02074718475341797, 0.02279043197631836, 0.02483367919921875, 0.02687692642211914, 0.02892017364501953, 0.030963420867919922, 0.03300666809082031, 0.0350499153137207, 0.037093162536621094, 0.039136409759521484, 0.041179656982421875, 0.043222904205322266, 0.045266151428222656, 0.04730939865112305, 0.04935264587402344, 0.05139589309692383, 0.05343914031982422, 0.05548238754272461, 0.057525634765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 1.0, 9.0, 4.0, 14.0, 18.0, 23.0, 31.0, 30.0, 46.0, 55.0, 111.0, 148.0, 293.0, 578.0, 1396.0, 4125.0, 19349.0, 168669.0, 687513.0, 142785.0, 16923.0, 3871.0, 1240.0, 531.0, 274.0, 161.0, 105.0, 65.0, 48.0, 36.0, 25.0, 25.0, 15.0, 8.0, 6.0, 6.0, 2.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03509521484375, -0.03407692909240723, -0.03305864334106445, -0.03204035758972168, -0.031022071838378906, -0.030003786087036133, -0.02898550033569336, -0.027967214584350586, -0.026948928833007812, -0.02593064308166504, -0.024912357330322266, -0.023894071578979492, -0.02287578582763672, -0.021857500076293945, -0.020839214324951172, -0.0198209285736084, -0.018802642822265625, -0.01778435707092285, -0.016766071319580078, -0.015747785568237305, -0.014729499816894531, -0.013711214065551758, -0.012692928314208984, -0.011674642562866211, -0.010656356811523438, -0.009638071060180664, -0.00861978530883789, -0.007601499557495117, -0.006583213806152344, -0.00556492805480957, -0.004546642303466797, -0.0035283565521240234, -0.00251007080078125, -0.0014917850494384766, -0.0004734992980957031, 0.0005447864532470703, 0.0015630722045898438, 0.002581357955932617, 0.0035996437072753906, 0.004617929458618164, 0.0056362152099609375, 0.006654500961303711, 0.007672786712646484, 0.008691072463989258, 0.009709358215332031, 0.010727643966674805, 0.011745929718017578, 0.012764215469360352, 0.013782501220703125, 0.014800786972045898, 0.015819072723388672, 0.016837358474731445, 0.01785564422607422, 0.018873929977416992, 0.019892215728759766, 0.02091050148010254, 0.021928787231445312, 0.022947072982788086, 0.02396535873413086, 0.024983644485473633, 0.026001930236816406, 0.02702021598815918, 0.028038501739501953, 0.029056787490844727, 0.0300750732421875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 7.0, 9.0, 9.0, 14.0, 25.0, 40.0, 55.0, 67.0, 72.0, 76.0, 107.0, 97.0, 92.0, 87.0, 86.0, 39.0, 45.0, 32.0, 16.0, 12.0, 7.0, 5.0, 8.0, 1.0, 1.0, 0.0, 5.0, 1.0], "bins": [-1.3113021850585938e-05, -1.283455640077591e-05, -1.2556090950965881e-05, -1.2277625501155853e-05, -1.1999160051345825e-05, -1.1720694601535797e-05, -1.1442229151725769e-05, -1.1163763701915741e-05, -1.0885298252105713e-05, -1.0606832802295685e-05, -1.0328367352485657e-05, -1.0049901902675629e-05, -9.7714364528656e-06, -9.492971003055573e-06, -9.214505553245544e-06, -8.936040103435516e-06, -8.657574653625488e-06, -8.37910920381546e-06, -8.100643754005432e-06, -7.822178304195404e-06, -7.543712854385376e-06, -7.265247404575348e-06, -6.98678195476532e-06, -6.708316504955292e-06, -6.429851055145264e-06, -6.151385605335236e-06, -5.8729201555252075e-06, -5.5944547057151794e-06, -5.315989255905151e-06, -5.037523806095123e-06, -4.759058356285095e-06, -4.480592906475067e-06, -4.202127456665039e-06, -3.923662006855011e-06, -3.645196557044983e-06, -3.366731107234955e-06, -3.0882656574249268e-06, -2.8098002076148987e-06, -2.5313347578048706e-06, -2.2528693079948425e-06, -1.9744038581848145e-06, -1.6959384083747864e-06, -1.4174729585647583e-06, -1.1390075087547302e-06, -8.605420589447021e-07, -5.820766091346741e-07, -3.03611159324646e-07, -2.514570951461792e-08, 2.5331974029541016e-07, 5.317851901054382e-07, 8.102506399154663e-07, 1.0887160897254944e-06, 1.3671815395355225e-06, 1.6456469893455505e-06, 1.9241124391555786e-06, 2.2025778889656067e-06, 2.4810433387756348e-06, 2.759508788585663e-06, 3.037974238395691e-06, 3.316439688205719e-06, 3.594905138015747e-06, 3.873370587825775e-06, 4.151836037635803e-06, 4.430301487445831e-06, 4.708766937255859e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 13.0, 17.0, 28.0, 28.0, 48.0, 99.0, 163.0, 342.0, 1101.0, 4527.0, 35633.0, 470260.0, 491683.0, 37993.0, 4794.0, 1048.0, 334.0, 163.0, 84.0, 63.0, 43.0, 23.0, 14.0, 3.0, 7.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0498046875, -0.04845905303955078, -0.04711341857910156, -0.045767784118652344, -0.044422149658203125, -0.043076515197753906, -0.04173088073730469, -0.04038524627685547, -0.03903961181640625, -0.03769397735595703, -0.03634834289550781, -0.035002708435058594, -0.033657073974609375, -0.032311439514160156, -0.030965805053710938, -0.02962017059326172, -0.0282745361328125, -0.02692890167236328, -0.025583267211914062, -0.024237632751464844, -0.022891998291015625, -0.021546363830566406, -0.020200729370117188, -0.01885509490966797, -0.01750946044921875, -0.01616382598876953, -0.014818191528320312, -0.013472557067871094, -0.012126922607421875, -0.010781288146972656, -0.009435653686523438, -0.008090019226074219, -0.006744384765625, -0.005398750305175781, -0.0040531158447265625, -0.0027074813842773438, -0.001361846923828125, -1.621246337890625e-05, 0.0013294219970703125, 0.0026750564575195312, 0.00402069091796875, 0.005366325378417969, 0.0067119598388671875, 0.008057594299316406, 0.009403228759765625, 0.010748863220214844, 0.012094497680664062, 0.013440132141113281, 0.0147857666015625, 0.01613140106201172, 0.017477035522460938, 0.018822669982910156, 0.020168304443359375, 0.021513938903808594, 0.022859573364257812, 0.02420520782470703, 0.02555084228515625, 0.02689647674560547, 0.028242111206054688, 0.029587745666503906, 0.030933380126953125, 0.032279014587402344, 0.03362464904785156, 0.03497028350830078, 0.03631591796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 18.0, 19.0, 36.0, 56.0, 113.0, 140.0, 149.0, 168.0, 134.0, 80.0, 47.0, 22.0, 14.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.08245849609375, -0.08083176612854004, -0.07920503616333008, -0.07757830619812012, -0.07595157623291016, -0.0743248462677002, -0.07269811630249023, -0.07107138633728027, -0.06944465637207031, -0.06781792640686035, -0.06619119644165039, -0.06456446647644043, -0.06293773651123047, -0.06131100654602051, -0.05968427658081055, -0.058057546615600586, -0.056430816650390625, -0.054804086685180664, -0.0531773567199707, -0.05155062675476074, -0.04992389678955078, -0.04829716682434082, -0.04667043685913086, -0.0450437068939209, -0.04341697692871094, -0.04179024696350098, -0.040163516998291016, -0.038536787033081055, -0.036910057067871094, -0.03528332710266113, -0.03365659713745117, -0.03202986717224121, -0.03040313720703125, -0.02877640724182129, -0.027149677276611328, -0.025522947311401367, -0.023896217346191406, -0.022269487380981445, -0.020642757415771484, -0.019016027450561523, -0.017389297485351562, -0.0157625675201416, -0.01413583755493164, -0.01250910758972168, -0.010882377624511719, -0.009255647659301758, -0.007628917694091797, -0.006002187728881836, -0.004375457763671875, -0.002748727798461914, -0.0011219978332519531, 0.0005047321319580078, 0.0021314620971679688, 0.0037581920623779297, 0.005384922027587891, 0.0070116519927978516, 0.008638381958007812, 0.010265111923217773, 0.011891841888427734, 0.013518571853637695, 0.015145301818847656, 0.016772031784057617, 0.018398761749267578, 0.02002549171447754, 0.0216522216796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 13.0, 15.0, 38.0, 46.0, 89.0, 142.0, 147.0, 177.0, 126.0, 85.0, 58.0, 35.0, 12.0, 8.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2502748966217041, -0.2343837171792984, -0.2184925377368927, -0.2026013433933258, -0.1867101788520813, -0.1708189845085144, -0.1549278050661087, -0.139036625623703, -0.1231454461812973, -0.1072542667388916, -0.0913630872964859, -0.0754719004034996, -0.0595807209610939, -0.0436895415186882, -0.027798354625701904, -0.011907175183296204, 0.003984004259109497, 0.019875185564160347, 0.0357663668692112, 0.051657550036907196, 0.0675487294793129, 0.0834399089217186, 0.0993310958147049, 0.1152222752571106, 0.1311134546995163, 0.147004634141922, 0.1628958135843277, 0.1787869930267334, 0.1946781873703003, 0.2105693519115448, 0.2264605462551117, 0.2423517256975174, 0.2582429051399231, 0.27413409948349, 0.2900252640247345, 0.3059164583683014, 0.3218076229095459, 0.3376988172531128, 0.3535900115966797, 0.3694811761379242, 0.3853723406791687, 0.4012635350227356, 0.4171546995639801, 0.433045893907547, 0.4489370584487915, 0.4648282527923584, 0.4807194471359253, 0.4966106116771698, 0.5125018358230591, 0.528393030166626, 0.5442842245101929, 0.560175359249115, 0.5760665535926819, 0.5919577479362488, 0.6078489422798157, 0.6237400770187378, 0.6396312713623047, 0.6555224657058716, 0.6714136600494385, 0.6873047947883606, 0.7031959891319275, 0.7190871834754944, 0.7349783778190613, 0.7508695125579834, 0.7667607069015503]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 6.0, 2.0, 8.0, 6.0, 5.0, 13.0, 18.0, 11.0, 10.0, 23.0, 18.0, 18.0, 24.0, 26.0, 26.0, 29.0, 39.0, 36.0, 40.0, 28.0, 38.0, 48.0, 49.0, 40.0, 45.0, 41.0, 42.0, 36.0, 34.0, 20.0, 27.0, 22.0, 19.0, 23.0, 23.0, 16.0, 13.0, 15.0, 13.0, 15.0, 9.0, 4.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2698708176612854, -0.261054664850235, -0.25223854184150696, -0.24342238903045654, -0.23460623621940613, -0.2257900983095169, -0.21697396039962769, -0.20815780758857727, -0.19934166967868805, -0.19052553176879883, -0.1817093789577484, -0.1728932410478592, -0.16407710313796997, -0.15526095032691956, -0.14644481241703033, -0.1376286745071411, -0.1288125216960907, -0.11999637633562088, -0.11118023097515106, -0.10236409306526184, -0.09354794770479202, -0.0847318023443222, -0.07591566443443298, -0.06709951907396317, -0.05828337371349335, -0.04946722835302353, -0.04065108671784401, -0.03183494508266449, -0.02301879972219467, -0.014202654361724854, -0.005386512726545334, 0.003429628908634186, 0.012245774269104004, 0.021061917766928673, 0.02987806126475334, 0.03869420289993286, 0.04751034826040268, 0.0563264936208725, 0.06514263153076172, 0.07395877689123154, 0.08277492225170135, 0.09159106761217117, 0.10040721297264099, 0.10922335088253021, 0.11803949624300003, 0.12685564160346985, 0.13567177951335907, 0.1444879174232483, 0.1533040702342987, 0.16212020814418793, 0.17093636095523834, 0.17975249886512756, 0.18856865167617798, 0.1973847895860672, 0.20620092749595642, 0.21501708030700684, 0.22383321821689606, 0.23264935612678528, 0.2414655089378357, 0.2502816617488861, 0.25909778475761414, 0.26791393756866455, 0.27673009037971497, 0.285546213388443, 0.2943623661994934]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 11.0, 9.0, 9.0, 17.0, 19.0, 38.0, 61.0, 105.0, 206.0, 373.0, 776.0, 1885.0, 5765.0, 27858.0, 667688.0, 3436368.0, 41646.0, 7331.0, 2251.0, 914.0, 440.0, 212.0, 125.0, 64.0, 43.0, 24.0, 12.0, 11.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10137939453125, -0.0985708236694336, -0.09576225280761719, -0.09295368194580078, -0.09014511108398438, -0.08733654022216797, -0.08452796936035156, -0.08171939849853516, -0.07891082763671875, -0.07610225677490234, -0.07329368591308594, -0.07048511505126953, -0.06767654418945312, -0.06486797332763672, -0.06205940246582031, -0.059250831604003906, -0.0564422607421875, -0.053633689880371094, -0.05082511901855469, -0.04801654815673828, -0.045207977294921875, -0.04239940643310547, -0.03959083557128906, -0.036782264709472656, -0.03397369384765625, -0.031165122985839844, -0.028356552124023438, -0.02554798126220703, -0.022739410400390625, -0.01993083953857422, -0.017122268676757812, -0.014313697814941406, -0.011505126953125, -0.008696556091308594, -0.0058879852294921875, -0.0030794143676757812, -0.000270843505859375, 0.0025377273559570312, 0.0053462982177734375, 0.008154869079589844, 0.01096343994140625, 0.013772010803222656, 0.016580581665039062, 0.01938915252685547, 0.022197723388671875, 0.02500629425048828, 0.027814865112304688, 0.030623435974121094, 0.0334320068359375, 0.036240577697753906, 0.03904914855957031, 0.04185771942138672, 0.044666290283203125, 0.04747486114501953, 0.05028343200683594, 0.053092002868652344, 0.05590057373046875, 0.058709144592285156, 0.06151771545410156, 0.06432628631591797, 0.06713485717773438, 0.06994342803955078, 0.07275199890136719, 0.0755605697631836, 0.078369140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 14.0, 18.0, 16.0, 34.0, 38.0, 36.0, 35.0, 46.0, 57.0, 59.0, 48.0, 61.0, 69.0, 60.0, 59.0, 49.0, 54.0, 44.0, 34.0, 32.0, 17.0, 23.0, 15.0, 17.0, 13.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0163421630859375, -0.015761852264404297, -0.015181541442871094, -0.01460123062133789, -0.014020919799804688, -0.013440608978271484, -0.012860298156738281, -0.012279987335205078, -0.011699676513671875, -0.011119365692138672, -0.010539054870605469, -0.009958744049072266, -0.009378433227539062, -0.00879812240600586, -0.008217811584472656, -0.007637500762939453, -0.00705718994140625, -0.006476879119873047, -0.005896568298339844, -0.005316257476806641, -0.0047359466552734375, -0.004155635833740234, -0.0035753250122070312, -0.002995014190673828, -0.002414703369140625, -0.0018343925476074219, -0.0012540817260742188, -0.0006737709045410156, -9.34600830078125e-05, 0.0004868507385253906, 0.0010671615600585938, 0.0016474723815917969, 0.002227783203125, 0.002808094024658203, 0.0033884048461914062, 0.003968715667724609, 0.0045490264892578125, 0.005129337310791016, 0.005709648132324219, 0.006289958953857422, 0.006870269775390625, 0.007450580596923828, 0.008030891418457031, 0.008611202239990234, 0.009191513061523438, 0.00977182388305664, 0.010352134704589844, 0.010932445526123047, 0.01151275634765625, 0.012093067169189453, 0.012673377990722656, 0.01325368881225586, 0.013833999633789062, 0.014414310455322266, 0.014994621276855469, 0.015574932098388672, 0.016155242919921875, 0.016735553741455078, 0.01731586456298828, 0.017896175384521484, 0.018476486206054688, 0.01905679702758789, 0.019637107849121094, 0.020217418670654297, 0.0207977294921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 11.0, 14.0, 16.0, 40.0, 41.0, 94.0, 139.0, 183.0, 328.0, 472.0, 841.0, 1406.0, 2538.0, 5225.0, 13498.0, 45570.0, 313302.0, 3537283.0, 214424.0, 36902.0, 11630.0, 4787.0, 2283.0, 1239.0, 752.0, 454.0, 269.0, 180.0, 120.0, 82.0, 47.0, 32.0, 33.0, 12.0, 11.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05023193359375, -0.04852485656738281, -0.046817779541015625, -0.04511070251464844, -0.04340362548828125, -0.04169654846191406, -0.039989471435546875, -0.03828239440917969, -0.0365753173828125, -0.03486824035644531, -0.033161163330078125, -0.03145408630371094, -0.02974700927734375, -0.028039932250976562, -0.026332855224609375, -0.024625778198242188, -0.022918701171875, -0.021211624145507812, -0.019504547119140625, -0.017797470092773438, -0.01609039306640625, -0.014383316040039062, -0.012676239013671875, -0.010969161987304688, -0.0092620849609375, -0.0075550079345703125, -0.005847930908203125, -0.0041408538818359375, -0.00243377685546875, -0.0007266998291015625, 0.000980377197265625, 0.0026874542236328125, 0.00439453125, 0.0061016082763671875, 0.007808685302734375, 0.009515762329101562, 0.01122283935546875, 0.012929916381835938, 0.014636993408203125, 0.016344070434570312, 0.0180511474609375, 0.019758224487304688, 0.021465301513671875, 0.023172378540039062, 0.02487945556640625, 0.026586532592773438, 0.028293609619140625, 0.030000686645507812, 0.031707763671875, 0.03341484069824219, 0.035121917724609375, 0.03682899475097656, 0.03853607177734375, 0.04024314880371094, 0.041950225830078125, 0.04365730285644531, 0.0453643798828125, 0.04707145690917969, 0.048778533935546875, 0.05048561096191406, 0.05219268798828125, 0.05389976501464844, 0.055606842041015625, 0.05731391906738281, 0.05902099609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 5.0, 5.0, 3.0, 6.0, 14.0, 12.0, 29.0, 22.0, 47.0, 87.0, 182.0, 497.0, 1931.0, 699.0, 224.0, 107.0, 66.0, 39.0, 34.0, 17.0, 17.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0369873046875, -0.03603053092956543, -0.03507375717163086, -0.03411698341369629, -0.03316020965576172, -0.03220343589782715, -0.031246662139892578, -0.030289888381958008, -0.029333114624023438, -0.028376340866088867, -0.027419567108154297, -0.026462793350219727, -0.025506019592285156, -0.024549245834350586, -0.023592472076416016, -0.022635698318481445, -0.021678924560546875, -0.020722150802612305, -0.019765377044677734, -0.018808603286743164, -0.017851829528808594, -0.016895055770874023, -0.015938282012939453, -0.014981508255004883, -0.014024734497070312, -0.013067960739135742, -0.012111186981201172, -0.011154413223266602, -0.010197639465332031, -0.009240865707397461, -0.00828409194946289, -0.00732731819152832, -0.00637054443359375, -0.00541377067565918, -0.004456996917724609, -0.003500223159790039, -0.0025434494018554688, -0.0015866756439208984, -0.0006299018859863281, 0.0003268718719482422, 0.0012836456298828125, 0.002240419387817383, 0.003197193145751953, 0.0041539669036865234, 0.005110740661621094, 0.006067514419555664, 0.007024288177490234, 0.007981061935424805, 0.008937835693359375, 0.009894609451293945, 0.010851383209228516, 0.011808156967163086, 0.012764930725097656, 0.013721704483032227, 0.014678478240966797, 0.015635251998901367, 0.016592025756835938, 0.017548799514770508, 0.018505573272705078, 0.01946234703063965, 0.02041912078857422, 0.02137589454650879, 0.02233266830444336, 0.02328944206237793, 0.0242462158203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 11.0, 27.0, 86.0, 185.0, 269.0, 223.0, 106.0, 57.0, 16.0, 8.0, 1.0, 2.0, 1.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14779752492904663, -0.13767382502555847, -0.1275501400232315, -0.11742644757032394, -0.10730275511741638, -0.09717906266450882, -0.08705537021160126, -0.0769316777586937, -0.06680798530578613, -0.05668429285287857, -0.04656060039997101, -0.036436907947063446, -0.026313215494155884, -0.01618952304124832, -0.006065830588340759, 0.004057861864566803, 0.014181554317474365, 0.024305246770381927, 0.03442893922328949, 0.04455263167619705, 0.054676324129104614, 0.06480001658201218, 0.07492370903491974, 0.0850474014878273, 0.09517109394073486, 0.10529478639364243, 0.11541847884654999, 0.12554216384887695, 0.1356658637523651, 0.14578956365585327, 0.15591324865818024, 0.1660369336605072, 0.17616063356399536, 0.18628433346748352, 0.19640801846981049, 0.20653170347213745, 0.2166554033756256, 0.22677910327911377, 0.23690278828144073, 0.2470264732837677, 0.25715017318725586, 0.267273873090744, 0.2773975729942322, 0.28752124309539795, 0.2976449429988861, 0.30776864290237427, 0.31789231300354004, 0.3280160129070282, 0.33813971281051636, 0.3482634127140045, 0.3583871126174927, 0.36851078271865845, 0.3786344826221466, 0.38875818252563477, 0.39888185262680054, 0.4090055525302887, 0.41912925243377686, 0.429252952337265, 0.4393766522407532, 0.44950032234191895, 0.4596240222454071, 0.46974772214889526, 0.47987139225006104, 0.4899950921535492, 0.5001187920570374]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 3.0, 5.0, 7.0, 14.0, 13.0, 14.0, 16.0, 26.0, 11.0, 32.0, 39.0, 31.0, 37.0, 39.0, 40.0, 40.0, 36.0, 43.0, 53.0, 45.0, 47.0, 45.0, 50.0, 55.0, 46.0, 27.0, 25.0, 28.0, 14.0, 21.0, 16.0, 19.0, 15.0, 13.0, 13.0, 5.0, 5.0, 2.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08048182725906372, -0.07811357080936432, -0.07574531435966492, -0.07337705045938492, -0.07100879400968552, -0.06864053755998611, -0.06627227365970612, -0.06390401721000671, -0.06153576076030731, -0.05916750431060791, -0.05679924413561821, -0.05443098396062851, -0.05206272751092911, -0.049694471061229706, -0.047326210886240005, -0.044957950711250305, -0.0425896942615509, -0.0402214378118515, -0.0378531776368618, -0.0354849174618721, -0.0331166610121727, -0.030748402699828148, -0.028380144387483597, -0.026011886075139046, -0.023643627762794495, -0.021275369450449944, -0.018907111138105392, -0.01653885282576084, -0.01417059451341629, -0.01180233620107174, -0.009434077888727188, -0.007065819576382637, -0.004697561264038086, -0.002329302951693535, 3.8955360651016235e-05, 0.0024072136729955673, 0.004775471985340118, 0.0071437302976846695, 0.00951198861002922, 0.011880246922373772, 0.014248505234718323, 0.016616763547062874, 0.018985021859407425, 0.021353280171751976, 0.023721538484096527, 0.026089796796441078, 0.02845805510878563, 0.03082631342113018, 0.03319457173347473, 0.03556282818317413, 0.037931088358163834, 0.040299348533153534, 0.042667604982852936, 0.04503586143255234, 0.04740412160754204, 0.04977238178253174, 0.05214063823223114, 0.05450889468193054, 0.05687715485692024, 0.05924541503190994, 0.061613671481609344, 0.06398192793130875, 0.06635019183158875, 0.06871844828128815, 0.07108670473098755]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 13.0, 10.0, 10.0, 12.0, 21.0, 29.0, 38.0, 67.0, 126.0, 169.0, 316.0, 643.0, 1181.0, 2361.0, 5424.0, 14712.0, 44939.0, 141126.0, 351363.0, 313862.0, 114902.0, 36077.0, 12276.0, 4624.0, 2007.0, 955.0, 526.0, 291.0, 171.0, 108.0, 59.0, 53.0, 20.0, 21.0, 8.0, 9.0, 7.0, 9.0, 8.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04559326171875, -0.04406881332397461, -0.04254436492919922, -0.04101991653442383, -0.03949546813964844, -0.03797101974487305, -0.036446571350097656, -0.034922122955322266, -0.033397674560546875, -0.031873226165771484, -0.030348777770996094, -0.028824329376220703, -0.027299880981445312, -0.025775432586669922, -0.02425098419189453, -0.02272653579711914, -0.02120208740234375, -0.01967763900756836, -0.01815319061279297, -0.016628742218017578, -0.015104293823242188, -0.013579845428466797, -0.012055397033691406, -0.010530948638916016, -0.009006500244140625, -0.007482051849365234, -0.005957603454589844, -0.004433155059814453, -0.0029087066650390625, -0.0013842582702636719, 0.00014019012451171875, 0.0016646385192871094, 0.0031890869140625, 0.004713535308837891, 0.006237983703613281, 0.007762432098388672, 0.009286880493164062, 0.010811328887939453, 0.012335777282714844, 0.013860225677490234, 0.015384674072265625, 0.016909122467041016, 0.018433570861816406, 0.019958019256591797, 0.021482467651367188, 0.023006916046142578, 0.02453136444091797, 0.02605581283569336, 0.02758026123046875, 0.02910470962524414, 0.03062915802001953, 0.03215360641479492, 0.03367805480957031, 0.0352025032043457, 0.036726951599121094, 0.038251399993896484, 0.039775848388671875, 0.041300296783447266, 0.042824745178222656, 0.04434919357299805, 0.04587364196777344, 0.04739809036254883, 0.04892253875732422, 0.05044698715209961, 0.051971435546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 10.0, 13.0, 11.0, 25.0, 44.0, 26.0, 34.0, 23.0, 54.0, 39.0, 50.0, 52.0, 62.0, 51.0, 47.0, 56.0, 58.0, 61.0, 53.0, 28.0, 46.0, 26.0, 29.0, 19.0, 15.0, 14.0, 9.0, 4.0, 6.0, 3.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017059326171875, -0.01646733283996582, -0.01587533950805664, -0.015283346176147461, -0.014691352844238281, -0.014099359512329102, -0.013507366180419922, -0.012915372848510742, -0.012323379516601562, -0.011731386184692383, -0.011139392852783203, -0.010547399520874023, -0.009955406188964844, -0.009363412857055664, -0.008771419525146484, -0.008179426193237305, -0.007587432861328125, -0.006995439529418945, -0.006403446197509766, -0.005811452865600586, -0.005219459533691406, -0.0046274662017822266, -0.004035472869873047, -0.003443479537963867, -0.0028514862060546875, -0.002259492874145508, -0.0016674995422363281, -0.0010755062103271484, -0.00048351287841796875, 0.00010848045349121094, 0.0007004737854003906, 0.0012924671173095703, 0.00188446044921875, 0.0024764537811279297, 0.0030684471130371094, 0.003660440444946289, 0.004252433776855469, 0.0048444271087646484, 0.005436420440673828, 0.006028413772583008, 0.0066204071044921875, 0.007212400436401367, 0.007804393768310547, 0.008396387100219727, 0.008988380432128906, 0.009580373764038086, 0.010172367095947266, 0.010764360427856445, 0.011356353759765625, 0.011948347091674805, 0.012540340423583984, 0.013132333755493164, 0.013724327087402344, 0.014316320419311523, 0.014908313751220703, 0.015500307083129883, 0.016092300415039062, 0.016684293746948242, 0.017276287078857422, 0.0178682804107666, 0.01846027374267578, 0.01905226707458496, 0.01964426040649414, 0.02023625373840332, 0.0208282470703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 9.0, 6.0, 13.0, 13.0, 22.0, 23.0, 39.0, 40.0, 67.0, 83.0, 110.0, 127.0, 258.0, 420.0, 759.0, 1775.0, 5058.0, 17306.0, 72018.0, 324899.0, 464859.0, 120377.0, 27782.0, 7542.0, 2496.0, 993.0, 526.0, 287.0, 187.0, 114.0, 84.0, 57.0, 42.0, 37.0, 24.0, 23.0, 17.0, 11.0, 13.0, 11.0, 5.0, 5.0, 3.0, 9.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.054718017578125, -0.05301713943481445, -0.051316261291503906, -0.04961538314819336, -0.04791450500488281, -0.046213626861572266, -0.04451274871826172, -0.04281187057495117, -0.041110992431640625, -0.03941011428833008, -0.03770923614501953, -0.036008358001708984, -0.03430747985839844, -0.03260660171508789, -0.030905723571777344, -0.029204845428466797, -0.02750396728515625, -0.025803089141845703, -0.024102210998535156, -0.02240133285522461, -0.020700454711914062, -0.018999576568603516, -0.01729869842529297, -0.015597820281982422, -0.013896942138671875, -0.012196063995361328, -0.010495185852050781, -0.008794307708740234, -0.0070934295654296875, -0.005392551422119141, -0.0036916732788085938, -0.001990795135498047, -0.0002899169921875, 0.0014109611511230469, 0.0031118392944335938, 0.004812717437744141, 0.0065135955810546875, 0.008214473724365234, 0.009915351867675781, 0.011616230010986328, 0.013317108154296875, 0.015017986297607422, 0.01671886444091797, 0.018419742584228516, 0.020120620727539062, 0.02182149887084961, 0.023522377014160156, 0.025223255157470703, 0.02692413330078125, 0.028625011444091797, 0.030325889587402344, 0.03202676773071289, 0.03372764587402344, 0.035428524017333984, 0.03712940216064453, 0.03883028030395508, 0.040531158447265625, 0.04223203659057617, 0.04393291473388672, 0.045633792877197266, 0.04733467102050781, 0.04903554916381836, 0.050736427307128906, 0.05243730545043945, 0.05413818359375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 5.0, 13.0, 10.0, 15.0, 13.0, 23.0, 26.0, 26.0, 27.0, 35.0, 42.0, 35.0, 36.0, 38.0, 38.0, 45.0, 43.0, 49.0, 48.0, 43.0, 48.0, 46.0, 39.0, 32.0, 44.0, 31.0, 27.0, 24.0, 22.0, 16.0, 9.0, 11.0, 7.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072509765625, -0.07020759582519531, -0.06790542602539062, -0.06560325622558594, -0.06330108642578125, -0.06099891662597656, -0.058696746826171875, -0.05639457702636719, -0.0540924072265625, -0.05179023742675781, -0.049488067626953125, -0.04718589782714844, -0.04488372802734375, -0.04258155822753906, -0.040279388427734375, -0.03797721862792969, -0.035675048828125, -0.03337287902832031, -0.031070709228515625, -0.028768539428710938, -0.02646636962890625, -0.024164199829101562, -0.021862030029296875, -0.019559860229492188, -0.0172576904296875, -0.014955520629882812, -0.012653350830078125, -0.010351181030273438, -0.00804901123046875, -0.0057468414306640625, -0.003444671630859375, -0.0011425018310546875, 0.00115966796875, 0.0034618377685546875, 0.005764007568359375, 0.008066177368164062, 0.01036834716796875, 0.012670516967773438, 0.014972686767578125, 0.017274856567382812, 0.0195770263671875, 0.021879196166992188, 0.024181365966796875, 0.026483535766601562, 0.02878570556640625, 0.031087875366210938, 0.033390045166015625, 0.03569221496582031, 0.037994384765625, 0.04029655456542969, 0.042598724365234375, 0.04490089416503906, 0.04720306396484375, 0.04950523376464844, 0.051807403564453125, 0.05410957336425781, 0.0564117431640625, 0.05871391296386719, 0.061016082763671875, 0.06331825256347656, 0.06562042236328125, 0.06792259216308594, 0.07022476196289062, 0.07252693176269531, 0.0748291015625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 2.0, 14.0, 17.0, 24.0, 43.0, 39.0, 75.0, 135.0, 188.0, 327.0, 618.0, 1045.0, 1836.0, 3797.0, 8566.0, 30185.0, 294625.0, 633059.0, 51876.0, 12102.0, 4695.0, 2292.0, 1253.0, 656.0, 406.0, 251.0, 142.0, 105.0, 64.0, 35.0, 33.0, 15.0, 10.0, 10.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.047393798828125, -0.046045780181884766, -0.04469776153564453, -0.0433497428894043, -0.04200172424316406, -0.04065370559692383, -0.039305686950683594, -0.03795766830444336, -0.036609649658203125, -0.03526163101196289, -0.033913612365722656, -0.03256559371948242, -0.031217575073242188, -0.029869556427001953, -0.02852153778076172, -0.027173519134521484, -0.02582550048828125, -0.024477481842041016, -0.02312946319580078, -0.021781444549560547, -0.020433425903320312, -0.019085407257080078, -0.017737388610839844, -0.01638936996459961, -0.015041351318359375, -0.01369333267211914, -0.012345314025878906, -0.010997295379638672, -0.009649276733398438, -0.008301258087158203, -0.006953239440917969, -0.005605220794677734, -0.0042572021484375, -0.0029091835021972656, -0.0015611648559570312, -0.00021314620971679688, 0.0011348724365234375, 0.002482891082763672, 0.0038309097290039062, 0.005178928375244141, 0.006526947021484375, 0.00787496566772461, 0.009222984313964844, 0.010571002960205078, 0.011919021606445312, 0.013267040252685547, 0.014615058898925781, 0.015963077545166016, 0.01731109619140625, 0.018659114837646484, 0.02000713348388672, 0.021355152130126953, 0.022703170776367188, 0.024051189422607422, 0.025399208068847656, 0.02674722671508789, 0.028095245361328125, 0.02944326400756836, 0.030791282653808594, 0.03213930130004883, 0.03348731994628906, 0.0348353385925293, 0.03618335723876953, 0.037531375885009766, 0.03887939453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 21.0, 49.0, 59.0, 105.0, 187.0, 159.0, 138.0, 110.0, 68.0, 32.0, 32.0, 12.0, 8.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.710653305053711e-05, -1.6526319086551666e-05, -1.5946105122566223e-05, -1.536589115858078e-05, -1.4785677194595337e-05, -1.4205463230609894e-05, -1.362524926662445e-05, -1.3045035302639008e-05, -1.2464821338653564e-05, -1.1884607374668121e-05, -1.1304393410682678e-05, -1.0724179446697235e-05, -1.0143965482711792e-05, -9.563751518726349e-06, -8.983537554740906e-06, -8.403323590755463e-06, -7.82310962677002e-06, -7.242895662784576e-06, -6.662681698799133e-06, -6.08246773481369e-06, -5.502253770828247e-06, -4.922039806842804e-06, -4.341825842857361e-06, -3.7616118788719177e-06, -3.1813979148864746e-06, -2.6011839509010315e-06, -2.0209699869155884e-06, -1.4407560229301453e-06, -8.605420589447021e-07, -2.8032809495925903e-07, 2.998858690261841e-07, 8.800998330116272e-07, 1.4603137969970703e-06, 2.0405277609825134e-06, 2.6207417249679565e-06, 3.2009556889533997e-06, 3.7811696529388428e-06, 4.361383616924286e-06, 4.941597580909729e-06, 5.521811544895172e-06, 6.102025508880615e-06, 6.682239472866058e-06, 7.2624534368515015e-06, 7.842667400836945e-06, 8.422881364822388e-06, 9.00309532880783e-06, 9.583309292793274e-06, 1.0163523256778717e-05, 1.074373722076416e-05, 1.1323951184749603e-05, 1.1904165148735046e-05, 1.248437911272049e-05, 1.3064593076705933e-05, 1.3644807040691376e-05, 1.4225021004676819e-05, 1.4805234968662262e-05, 1.5385448932647705e-05, 1.5965662896633148e-05, 1.654587686061859e-05, 1.7126090824604034e-05, 1.7706304788589478e-05, 1.828651875257492e-05, 1.8866732716560364e-05, 1.9446946680545807e-05, 2.002716064453125e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 2.0, 11.0, 3.0, 10.0, 21.0, 39.0, 58.0, 88.0, 155.0, 271.0, 450.0, 849.0, 1632.0, 3502.0, 8193.0, 23581.0, 116809.0, 648870.0, 194020.0, 31599.0, 9914.0, 4141.0, 2004.0, 1018.0, 566.0, 294.0, 190.0, 94.0, 63.0, 31.0, 33.0, 20.0, 9.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040740966796875, -0.0396578311920166, -0.0385746955871582, -0.037491559982299805, -0.036408424377441406, -0.03532528877258301, -0.03424215316772461, -0.03315901756286621, -0.03207588195800781, -0.030992746353149414, -0.029909610748291016, -0.028826475143432617, -0.02774333953857422, -0.02666020393371582, -0.025577068328857422, -0.024493932723999023, -0.023410797119140625, -0.022327661514282227, -0.021244525909423828, -0.02016139030456543, -0.01907825469970703, -0.017995119094848633, -0.016911983489990234, -0.015828847885131836, -0.014745712280273438, -0.013662576675415039, -0.01257944107055664, -0.011496305465698242, -0.010413169860839844, -0.009330034255981445, -0.008246898651123047, -0.0071637630462646484, -0.00608062744140625, -0.0049974918365478516, -0.003914356231689453, -0.0028312206268310547, -0.0017480850219726562, -0.0006649494171142578, 0.0004181861877441406, 0.001501321792602539, 0.0025844573974609375, 0.003667593002319336, 0.004750728607177734, 0.005833864212036133, 0.006916999816894531, 0.00800013542175293, 0.009083271026611328, 0.010166406631469727, 0.011249542236328125, 0.012332677841186523, 0.013415813446044922, 0.01449894905090332, 0.015582084655761719, 0.016665220260620117, 0.017748355865478516, 0.018831491470336914, 0.019914627075195312, 0.02099776268005371, 0.02208089828491211, 0.023164033889770508, 0.024247169494628906, 0.025330305099487305, 0.026413440704345703, 0.0274965763092041, 0.0285797119140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 7.0, 13.0, 6.0, 23.0, 25.0, 33.0, 32.0, 60.0, 87.0, 112.0, 121.0, 128.0, 87.0, 84.0, 43.0, 44.0, 33.0, 17.0, 10.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04290771484375, -0.041768550872802734, -0.04062938690185547, -0.0394902229309082, -0.03835105895996094, -0.03721189498901367, -0.036072731018066406, -0.03493356704711914, -0.033794403076171875, -0.03265523910522461, -0.031516075134277344, -0.030376911163330078, -0.029237747192382812, -0.028098583221435547, -0.02695941925048828, -0.025820255279541016, -0.02468109130859375, -0.023541927337646484, -0.02240276336669922, -0.021263599395751953, -0.020124435424804688, -0.018985271453857422, -0.017846107482910156, -0.01670694351196289, -0.015567779541015625, -0.01442861557006836, -0.013289451599121094, -0.012150287628173828, -0.011011123657226562, -0.009871959686279297, -0.008732795715332031, -0.007593631744384766, -0.0064544677734375, -0.005315303802490234, -0.004176139831542969, -0.003036975860595703, -0.0018978118896484375, -0.0007586479187011719, 0.00038051605224609375, 0.0015196800231933594, 0.002658843994140625, 0.0037980079650878906, 0.004937171936035156, 0.006076335906982422, 0.0072154998779296875, 0.008354663848876953, 0.009493827819824219, 0.010632991790771484, 0.01177215576171875, 0.012911319732666016, 0.014050483703613281, 0.015189647674560547, 0.016328811645507812, 0.017467975616455078, 0.018607139587402344, 0.01974630355834961, 0.020885467529296875, 0.02202463150024414, 0.023163795471191406, 0.024302959442138672, 0.025442123413085938, 0.026581287384033203, 0.02772045135498047, 0.028859615325927734, 0.029998779296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 11.0, 20.0, 47.0, 70.0, 142.0, 192.0, 186.0, 152.0, 95.0, 40.0, 25.0, 15.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.874065637588501, -0.8530946373939514, -0.8321236371994019, -0.8111525774002075, -0.790181577205658, -0.7692105770111084, -0.7482395768165588, -0.7272685766220093, -0.7062975168228149, -0.6853265166282654, -0.6643555164337158, -0.6433844566345215, -0.6224134564399719, -0.6014424562454224, -0.5804714560508728, -0.5595004558563232, -0.5385294556617737, -0.5175584554672241, -0.4965874254703522, -0.4756164252758026, -0.45464539527893066, -0.4336743950843811, -0.41270339488983154, -0.391732394695282, -0.37076136469841003, -0.3497903645038605, -0.3288193345069885, -0.30784833431243896, -0.2868773341178894, -0.26590630412101746, -0.2449353039264679, -0.22396428883075714, -0.2029932141304016, -0.18202219903469086, -0.1610511839389801, -0.14008018374443054, -0.11910916864871979, -0.09813815355300903, -0.07716715335845947, -0.05619613826274872, -0.035225123167037964, -0.014254111796617508, 0.006716899573802948, 0.027687907218933105, 0.04865892231464386, 0.06962993741035461, 0.09060093760490417, 0.11157195270061493, 0.13254296779632568, 0.15351398289203644, 0.1744849979877472, 0.19545599818229675, 0.2164270132780075, 0.23739802837371826, 0.2583690285682678, 0.2793400287628174, 0.30031105875968933, 0.3212820589542389, 0.34225308895111084, 0.3632240891456604, 0.38419508934020996, 0.4051661193370819, 0.42613711953163147, 0.4471081495285034, 0.468079149723053]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 14.0, 14.0, 13.0, 14.0, 19.0, 26.0, 24.0, 29.0, 34.0, 24.0, 38.0, 33.0, 38.0, 37.0, 45.0, 39.0, 52.0, 36.0, 38.0, 44.0, 51.0, 40.0, 35.0, 30.0, 26.0, 14.0, 22.0, 24.0, 24.0, 18.0, 17.0, 11.0, 11.0, 10.0, 15.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3077883720397949, -0.297630250453949, -0.287472128868103, -0.2773140072822571, -0.26715588569641113, -0.2569977343082428, -0.24683961272239685, -0.2366814911365509, -0.22652336955070496, -0.216365247964859, -0.20620712637901306, -0.19604898989200592, -0.18589086830615997, -0.17573274672031403, -0.16557461023330688, -0.15541648864746094, -0.145258367061615, -0.13510024547576904, -0.1249421164393425, -0.11478398740291595, -0.10462586581707001, -0.09446774423122406, -0.08430961519479752, -0.07415148615837097, -0.06399336457252502, -0.05383523926138878, -0.04367711395025253, -0.03351898863911629, -0.02336086332798004, -0.013202738016843796, -0.00304461270570755, 0.007113516330718994, 0.01727163791656494, 0.027429763227701187, 0.03758788853883743, 0.04774601384997368, 0.057904139161109924, 0.06806226074695587, 0.07822038978338242, 0.08837851881980896, 0.09853664040565491, 0.10869476199150085, 0.1188528910279274, 0.12901102006435394, 0.1391691416501999, 0.14932726323604584, 0.15948539972305298, 0.16964352130889893, 0.17980164289474487, 0.18995976448059082, 0.20011788606643677, 0.2102760225534439, 0.22043414413928986, 0.2305922657251358, 0.24075040221214294, 0.2509085237979889, 0.26106664538383484, 0.2712247669696808, 0.28138288855552673, 0.2915410101413727, 0.301699161529541, 0.31185728311538696, 0.3220154047012329, 0.33217352628707886, 0.3423316478729248]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 19.0, 25.0, 47.0, 115.0, 236.0, 923.0, 10207.0, 4170529.0, 10735.0, 1008.0, 210.0, 109.0, 50.0, 29.0, 17.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.333740234375, -0.3260688781738281, -0.31839752197265625, -0.3107261657714844, -0.3030548095703125, -0.2953834533691406, -0.28771209716796875, -0.2800407409667969, -0.272369384765625, -0.2646980285644531, -0.25702667236328125, -0.24935531616210938, -0.2416839599609375, -0.23401260375976562, -0.22634124755859375, -0.21866989135742188, -0.21099853515625, -0.20332717895507812, -0.19565582275390625, -0.18798446655273438, -0.1803131103515625, -0.17264175415039062, -0.16497039794921875, -0.15729904174804688, -0.149627685546875, -0.14195632934570312, -0.13428497314453125, -0.12661361694335938, -0.1189422607421875, -0.11127090454101562, -0.10359954833984375, -0.09592819213867188, -0.0882568359375, -0.08058547973632812, -0.07291412353515625, -0.06524276733398438, -0.0575714111328125, -0.049900054931640625, -0.04222869873046875, -0.034557342529296875, -0.026885986328125, -0.019214630126953125, -0.01154327392578125, -0.003871917724609375, 0.0037994384765625, 0.011470794677734375, 0.01914215087890625, 0.026813507080078125, 0.03448486328125, 0.042156219482421875, 0.04982757568359375, 0.057498931884765625, 0.0651702880859375, 0.07284164428710938, 0.08051300048828125, 0.08818435668945312, 0.095855712890625, 0.10352706909179688, 0.11119842529296875, 0.11886978149414062, 0.1265411376953125, 0.13421249389648438, 0.14188385009765625, 0.14955520629882812, 0.1572265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 8.0, 9.0, 9.0, 19.0, 19.0, 25.0, 31.0, 33.0, 36.0, 39.0, 35.0, 50.0, 43.0, 55.0, 53.0, 53.0, 52.0, 49.0, 51.0, 46.0, 44.0, 36.0, 31.0, 34.0, 23.0, 16.0, 23.0, 13.0, 12.0, 13.0, 6.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.019012451171875, -0.018410205841064453, -0.017807960510253906, -0.01720571517944336, -0.016603469848632812, -0.016001224517822266, -0.015398979187011719, -0.014796733856201172, -0.014194488525390625, -0.013592243194580078, -0.012989997863769531, -0.012387752532958984, -0.011785507202148438, -0.01118326187133789, -0.010581016540527344, -0.009978771209716797, -0.00937652587890625, -0.008774280548095703, -0.008172035217285156, -0.007569789886474609, -0.0069675445556640625, -0.006365299224853516, -0.005763053894042969, -0.005160808563232422, -0.004558563232421875, -0.003956317901611328, -0.0033540725708007812, -0.0027518272399902344, -0.0021495819091796875, -0.0015473365783691406, -0.0009450912475585938, -0.0003428459167480469, 0.0002593994140625, 0.0008616447448730469, 0.0014638900756835938, 0.0020661354064941406, 0.0026683807373046875, 0.0032706260681152344, 0.0038728713989257812, 0.004475116729736328, 0.005077362060546875, 0.005679607391357422, 0.006281852722167969, 0.006884098052978516, 0.0074863433837890625, 0.00808858871459961, 0.008690834045410156, 0.009293079376220703, 0.00989532470703125, 0.010497570037841797, 0.011099815368652344, 0.01170206069946289, 0.012304306030273438, 0.012906551361083984, 0.013508796691894531, 0.014111042022705078, 0.014713287353515625, 0.015315532684326172, 0.01591777801513672, 0.016520023345947266, 0.017122268676757812, 0.01772451400756836, 0.018326759338378906, 0.018929004669189453, 0.01953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 6.0, 6.0, 11.0, 13.0, 18.0, 25.0, 29.0, 19.0, 37.0, 43.0, 73.0, 126.0, 247.0, 440.0, 964.0, 2385.0, 8887.0, 182107.0, 3979218.0, 13987.0, 3210.0, 1121.0, 534.0, 269.0, 157.0, 81.0, 51.0, 45.0, 28.0, 20.0, 24.0, 23.0, 16.0, 15.0, 8.0, 7.0, 4.0, 6.0, 2.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093994140625, -0.09052848815917969, -0.08706283569335938, -0.08359718322753906, -0.08013153076171875, -0.07666587829589844, -0.07320022583007812, -0.06973457336425781, -0.0662689208984375, -0.06280326843261719, -0.059337615966796875, -0.05587196350097656, -0.05240631103515625, -0.04894065856933594, -0.045475006103515625, -0.04200935363769531, -0.038543701171875, -0.03507804870605469, -0.031612396240234375, -0.028146743774414062, -0.02468109130859375, -0.021215438842773438, -0.017749786376953125, -0.014284133911132812, -0.0108184814453125, -0.0073528289794921875, -0.003887176513671875, -0.0004215240478515625, 0.00304412841796875, 0.0065097808837890625, 0.009975433349609375, 0.013441085815429688, 0.01690673828125, 0.020372390747070312, 0.023838043212890625, 0.027303695678710938, 0.03076934814453125, 0.03423500061035156, 0.037700653076171875, 0.04116630554199219, 0.0446319580078125, 0.04809761047363281, 0.051563262939453125, 0.05502891540527344, 0.05849456787109375, 0.06196022033691406, 0.06542587280273438, 0.06889152526855469, 0.072357177734375, 0.07582283020019531, 0.07928848266601562, 0.08275413513183594, 0.08621978759765625, 0.08968544006347656, 0.09315109252929688, 0.09661674499511719, 0.1000823974609375, 0.10354804992675781, 0.10701370239257812, 0.11047935485839844, 0.11394500732421875, 0.11741065979003906, 0.12087631225585938, 0.12434196472167969, 0.1278076171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 17.0, 15.0, 52.0, 132.0, 3455.0, 261.0, 72.0, 28.0, 11.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00844573974609375, -0.00791013240814209, -0.00737452507019043, -0.0068389177322387695, -0.006303310394287109, -0.005767703056335449, -0.005232095718383789, -0.004696488380432129, -0.004160881042480469, -0.0036252737045288086, -0.0030896663665771484, -0.0025540590286254883, -0.002018451690673828, -0.001482844352722168, -0.0009472370147705078, -0.00041162967681884766, 0.0001239776611328125, 0.0006595849990844727, 0.0011951923370361328, 0.001730799674987793, 0.002266407012939453, 0.0028020143508911133, 0.0033376216888427734, 0.0038732290267944336, 0.004408836364746094, 0.004944443702697754, 0.005480051040649414, 0.006015658378601074, 0.006551265716552734, 0.0070868730545043945, 0.007622480392456055, 0.008158087730407715, 0.008693695068359375, 0.009229302406311035, 0.009764909744262695, 0.010300517082214355, 0.010836124420166016, 0.011371731758117676, 0.011907339096069336, 0.012442946434020996, 0.012978553771972656, 0.013514161109924316, 0.014049768447875977, 0.014585375785827637, 0.015120983123779297, 0.015656590461730957, 0.016192197799682617, 0.016727805137634277, 0.017263412475585938, 0.017799019813537598, 0.018334627151489258, 0.018870234489440918, 0.019405841827392578, 0.01994144916534424, 0.0204770565032959, 0.02101266384124756, 0.02154827117919922, 0.02208387851715088, 0.02261948585510254, 0.0231550931930542, 0.02369070053100586, 0.02422630786895752, 0.02476191520690918, 0.02529752254486084, 0.0258331298828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 17.0, 13.0, 24.0, 41.0, 63.0, 113.0, 116.0, 131.0, 110.0, 126.0, 77.0, 57.0, 40.0, 23.0, 15.0, 7.0, 8.0, 5.0, 10.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07439583539962769, -0.07263271510601044, -0.07086958736181259, -0.06910646706819534, -0.0673433467745781, -0.06558021903038025, -0.063817098736763, -0.06205397844314575, -0.060290854424238205, -0.05852773040533066, -0.05676461011171341, -0.05500148609280586, -0.053238362073898315, -0.05147524178028107, -0.04971211776137352, -0.04794899374246597, -0.046185873448848724, -0.04442274942994118, -0.04265962913632393, -0.04089650511741638, -0.03913338482379913, -0.037370260804891586, -0.03560713678598404, -0.03384401649236679, -0.032080892473459244, -0.030317770317196846, -0.028554648160934448, -0.0267915241420269, -0.025028401985764503, -0.023265279829502106, -0.02150215581059456, -0.01973903365433216, -0.017975911498069763, -0.016212789341807365, -0.014449666254222393, -0.01268654316663742, -0.010923421010375023, -0.009160298854112625, -0.007397175766527653, -0.00563405267894268, -0.0038709305226802826, -0.0021078079007565975, -0.00034468527883291245, 0.0014184373430907726, 0.0031815599650144577, 0.0049446821212768555, 0.006707805208861828, 0.0084709282964468, 0.010234050452709198, 0.011997172608971596, 0.013760295696556568, 0.01552341878414154, 0.01728654094040394, 0.019049663096666336, 0.020812787115573883, 0.02257590927183628, 0.02433903142809868, 0.026102153584361076, 0.027865275740623474, 0.02962839975953102, 0.03139152377843857, 0.03315464407205582, 0.034917768090963364, 0.03668089210987091, 0.03844401240348816]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 2.0, 8.0, 7.0, 16.0, 19.0, 18.0, 17.0, 19.0, 23.0, 20.0, 32.0, 36.0, 46.0, 36.0, 37.0, 53.0, 41.0, 38.0, 28.0, 43.0, 47.0, 35.0, 31.0, 32.0, 35.0, 27.0, 32.0, 41.0, 22.0, 26.0, 18.0, 15.0, 26.0, 14.0, 12.0, 9.0, 6.0, 7.0, 6.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.023025810718536377, -0.022339005023241043, -0.02165219932794571, -0.020965393632650375, -0.02027858793735504, -0.019591782242059708, -0.018904976546764374, -0.01821817085146904, -0.017531365156173706, -0.016844559460878372, -0.01615775376558304, -0.015470948070287704, -0.01478414237499237, -0.014097336679697037, -0.013410530984401703, -0.012723725289106369, -0.012036919593811035, -0.011350113898515701, -0.010663308203220367, -0.009976502507925034, -0.0092896968126297, -0.008602891117334366, -0.007916085422039032, -0.007229279726743698, -0.006542474031448364, -0.00585566833615303, -0.0051688626408576965, -0.004482056945562363, -0.003795251250267029, -0.003108445554971695, -0.002421639859676361, -0.0017348341643810272, -0.0010480284690856934, -0.0003612227737903595, 0.00032558292150497437, 0.0010123886168003082, 0.001699194312095642, 0.002386000007390976, 0.00307280570268631, 0.0037596113979816437, 0.0044464170932769775, 0.005133222788572311, 0.005820028483867645, 0.006506834179162979, 0.007193639874458313, 0.007880445569753647, 0.00856725126504898, 0.009254056960344315, 0.009940862655639648, 0.010627668350934982, 0.011314474046230316, 0.01200127974152565, 0.012688085436820984, 0.013374891132116318, 0.014061696827411652, 0.014748502522706985, 0.01543530821800232, 0.016122113913297653, 0.016808919608592987, 0.01749572530388832, 0.018182530999183655, 0.01886933669447899, 0.019556142389774323, 0.020242948085069656, 0.02092975378036499]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 8.0, 14.0, 30.0, 37.0, 58.0, 91.0, 133.0, 180.0, 350.0, 571.0, 1087.0, 1945.0, 3958.0, 8341.0, 18768.0, 44802.0, 108622.0, 235136.0, 301847.0, 183906.0, 79409.0, 32214.0, 13845.0, 6330.0, 3149.0, 1619.0, 802.0, 476.0, 286.0, 171.0, 103.0, 83.0, 47.0, 35.0, 30.0, 18.0, 16.0, 10.0, 8.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.042694091796875, -0.04148530960083008, -0.040276527404785156, -0.039067745208740234, -0.03785896301269531, -0.03665018081665039, -0.03544139862060547, -0.03423261642456055, -0.033023834228515625, -0.0318150520324707, -0.03060626983642578, -0.02939748764038086, -0.028188705444335938, -0.026979923248291016, -0.025771141052246094, -0.024562358856201172, -0.02335357666015625, -0.022144794464111328, -0.020936012268066406, -0.019727230072021484, -0.018518447875976562, -0.01730966567993164, -0.01610088348388672, -0.014892101287841797, -0.013683319091796875, -0.012474536895751953, -0.011265754699707031, -0.01005697250366211, -0.008848190307617188, -0.007639408111572266, -0.006430625915527344, -0.005221843719482422, -0.0040130615234375, -0.002804279327392578, -0.0015954971313476562, -0.0003867149353027344, 0.0008220672607421875, 0.0020308494567871094, 0.0032396316528320312, 0.004448413848876953, 0.005657196044921875, 0.006865978240966797, 0.008074760437011719, 0.00928354263305664, 0.010492324829101562, 0.011701107025146484, 0.012909889221191406, 0.014118671417236328, 0.01532745361328125, 0.016536235809326172, 0.017745018005371094, 0.018953800201416016, 0.020162582397460938, 0.02137136459350586, 0.02258014678955078, 0.023788928985595703, 0.024997711181640625, 0.026206493377685547, 0.02741527557373047, 0.02862405776977539, 0.029832839965820312, 0.031041622161865234, 0.032250404357910156, 0.03345918655395508, 0.03466796875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 7.0, 10.0, 5.0, 9.0, 12.0, 17.0, 20.0, 28.0, 33.0, 36.0, 37.0, 46.0, 40.0, 35.0, 45.0, 46.0, 56.0, 37.0, 48.0, 60.0, 45.0, 42.0, 41.0, 33.0, 38.0, 26.0, 31.0, 27.0, 8.0, 18.0, 14.0, 6.0, 9.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0186614990234375, -0.018048524856567383, -0.017435550689697266, -0.01682257652282715, -0.01620960235595703, -0.015596628189086914, -0.014983654022216797, -0.01437067985534668, -0.013757705688476562, -0.013144731521606445, -0.012531757354736328, -0.011918783187866211, -0.011305809020996094, -0.010692834854125977, -0.01007986068725586, -0.009466886520385742, -0.008853912353515625, -0.008240938186645508, -0.007627964019775391, -0.0070149898529052734, -0.006402015686035156, -0.005789041519165039, -0.005176067352294922, -0.004563093185424805, -0.0039501190185546875, -0.0033371448516845703, -0.002724170684814453, -0.002111196517944336, -0.0014982223510742188, -0.0008852481842041016, -0.0002722740173339844, 0.0003407001495361328, 0.00095367431640625, 0.0015666484832763672, 0.0021796226501464844, 0.0027925968170166016, 0.0034055709838867188, 0.004018545150756836, 0.004631519317626953, 0.00524449348449707, 0.0058574676513671875, 0.006470441818237305, 0.007083415985107422, 0.007696390151977539, 0.008309364318847656, 0.008922338485717773, 0.00953531265258789, 0.010148286819458008, 0.010761260986328125, 0.011374235153198242, 0.01198720932006836, 0.012600183486938477, 0.013213157653808594, 0.013826131820678711, 0.014439105987548828, 0.015052080154418945, 0.015665054321289062, 0.01627802848815918, 0.016891002655029297, 0.017503976821899414, 0.01811695098876953, 0.01872992515563965, 0.019342899322509766, 0.019955873489379883, 0.02056884765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 6.0, 8.0, 17.0, 17.0, 25.0, 35.0, 29.0, 41.0, 45.0, 68.0, 102.0, 190.0, 275.0, 575.0, 1148.0, 2856.0, 8286.0, 30320.0, 152453.0, 563724.0, 227894.0, 42689.0, 11146.0, 3641.0, 1379.0, 637.0, 342.0, 180.0, 108.0, 99.0, 48.0, 33.0, 30.0, 25.0, 20.0, 14.0, 11.0, 16.0, 5.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05731201171875, -0.05543994903564453, -0.05356788635253906, -0.051695823669433594, -0.049823760986328125, -0.047951698303222656, -0.04607963562011719, -0.04420757293701172, -0.04233551025390625, -0.04046344757080078, -0.03859138488769531, -0.036719322204589844, -0.034847259521484375, -0.032975196838378906, -0.031103134155273438, -0.02923107147216797, -0.0273590087890625, -0.02548694610595703, -0.023614883422851562, -0.021742820739746094, -0.019870758056640625, -0.017998695373535156, -0.016126632690429688, -0.014254570007324219, -0.01238250732421875, -0.010510444641113281, -0.008638381958007812, -0.006766319274902344, -0.004894256591796875, -0.0030221939086914062, -0.0011501312255859375, 0.0007219314575195312, 0.002593994140625, 0.004466056823730469, 0.0063381195068359375, 0.008210182189941406, 0.010082244873046875, 0.011954307556152344, 0.013826370239257812, 0.01569843292236328, 0.01757049560546875, 0.01944255828857422, 0.021314620971679688, 0.023186683654785156, 0.025058746337890625, 0.026930809020996094, 0.028802871704101562, 0.03067493438720703, 0.0325469970703125, 0.03441905975341797, 0.03629112243652344, 0.038163185119628906, 0.040035247802734375, 0.041907310485839844, 0.04377937316894531, 0.04565143585205078, 0.04752349853515625, 0.04939556121826172, 0.05126762390136719, 0.053139686584472656, 0.055011749267578125, 0.056883811950683594, 0.05875587463378906, 0.06062793731689453, 0.0625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 4.0, 5.0, 16.0, 9.0, 10.0, 17.0, 18.0, 20.0, 26.0, 28.0, 31.0, 32.0, 25.0, 41.0, 34.0, 47.0, 50.0, 45.0, 41.0, 39.0, 39.0, 52.0, 40.0, 41.0, 26.0, 42.0, 31.0, 31.0, 12.0, 27.0, 21.0, 14.0, 19.0, 13.0, 5.0, 9.0, 7.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.07916259765625, -0.07684516906738281, -0.07452774047851562, -0.07221031188964844, -0.06989288330078125, -0.06757545471191406, -0.06525802612304688, -0.06294059753417969, -0.0606231689453125, -0.05830574035644531, -0.055988311767578125, -0.05367088317871094, -0.05135345458984375, -0.04903602600097656, -0.046718597412109375, -0.04440116882324219, -0.042083740234375, -0.03976631164550781, -0.037448883056640625, -0.03513145446777344, -0.03281402587890625, -0.030496597290039062, -0.028179168701171875, -0.025861740112304688, -0.0235443115234375, -0.021226882934570312, -0.018909454345703125, -0.016592025756835938, -0.01427459716796875, -0.011957168579101562, -0.009639739990234375, -0.0073223114013671875, -0.0050048828125, -0.0026874542236328125, -0.000370025634765625, 0.0019474029541015625, 0.00426483154296875, 0.0065822601318359375, 0.008899688720703125, 0.011217117309570312, 0.0135345458984375, 0.015851974487304688, 0.018169403076171875, 0.020486831665039062, 0.02280426025390625, 0.025121688842773438, 0.027439117431640625, 0.029756546020507812, 0.032073974609375, 0.03439140319824219, 0.036708831787109375, 0.03902626037597656, 0.04134368896484375, 0.04366111755371094, 0.045978546142578125, 0.04829597473144531, 0.0506134033203125, 0.05293083190917969, 0.055248260498046875, 0.05756568908691406, 0.05988311767578125, 0.06220054626464844, 0.06451797485351562, 0.06683540344238281, 0.06915283203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 16.0, 15.0, 17.0, 37.0, 66.0, 116.0, 235.0, 641.0, 1940.0, 6125.0, 25670.0, 193889.0, 694576.0, 102180.0, 16455.0, 4296.0, 1330.0, 485.0, 223.0, 94.0, 44.0, 25.0, 26.0, 18.0, 11.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0283660888671875, -0.027365922927856445, -0.02636575698852539, -0.025365591049194336, -0.02436542510986328, -0.023365259170532227, -0.022365093231201172, -0.021364927291870117, -0.020364761352539062, -0.019364595413208008, -0.018364429473876953, -0.0173642635345459, -0.016364097595214844, -0.015363931655883789, -0.014363765716552734, -0.01336359977722168, -0.012363433837890625, -0.01136326789855957, -0.010363101959228516, -0.009362936019897461, -0.008362770080566406, -0.0073626041412353516, -0.006362438201904297, -0.005362272262573242, -0.0043621063232421875, -0.003361940383911133, -0.002361774444580078, -0.0013616085052490234, -0.00036144256591796875, 0.0006387233734130859, 0.0016388893127441406, 0.0026390552520751953, 0.00363922119140625, 0.004639387130737305, 0.005639553070068359, 0.006639719009399414, 0.007639884948730469, 0.008640050888061523, 0.009640216827392578, 0.010640382766723633, 0.011640548706054688, 0.012640714645385742, 0.013640880584716797, 0.014641046524047852, 0.015641212463378906, 0.01664137840270996, 0.017641544342041016, 0.01864171028137207, 0.019641876220703125, 0.02064204216003418, 0.021642208099365234, 0.02264237403869629, 0.023642539978027344, 0.0246427059173584, 0.025642871856689453, 0.026643037796020508, 0.027643203735351562, 0.028643369674682617, 0.029643535614013672, 0.030643701553344727, 0.03164386749267578, 0.032644033432006836, 0.03364419937133789, 0.034644365310668945, 0.03564453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 7.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 16.0, 16.0, 23.0, 36.0, 23.0, 34.0, 46.0, 40.0, 55.0, 56.0, 63.0, 74.0, 49.0, 67.0, 56.0, 37.0, 60.0, 30.0, 32.0, 34.0, 18.0, 17.0, 21.0, 11.0, 8.0, 2.0, 7.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.67572021484375e-06, -6.4782798290252686e-06, -6.280839443206787e-06, -6.083399057388306e-06, -5.885958671569824e-06, -5.688518285751343e-06, -5.491077899932861e-06, -5.29363751411438e-06, -5.0961971282958984e-06, -4.898756742477417e-06, -4.7013163566589355e-06, -4.503875970840454e-06, -4.306435585021973e-06, -4.108995199203491e-06, -3.91155481338501e-06, -3.7141144275665283e-06, -3.516674041748047e-06, -3.3192336559295654e-06, -3.121793270111084e-06, -2.9243528842926025e-06, -2.726912498474121e-06, -2.5294721126556396e-06, -2.332031726837158e-06, -2.1345913410186768e-06, -1.9371509552001953e-06, -1.7397105693817139e-06, -1.5422701835632324e-06, -1.344829797744751e-06, -1.1473894119262695e-06, -9.499490261077881e-07, -7.525086402893066e-07, -5.550682544708252e-07, -3.5762786865234375e-07, -1.601874828338623e-07, 3.725290298461914e-08, 2.3469328880310059e-07, 4.3213367462158203e-07, 6.295740604400635e-07, 8.270144462585449e-07, 1.0244548320770264e-06, 1.2218952178955078e-06, 1.4193356037139893e-06, 1.6167759895324707e-06, 1.8142163753509521e-06, 2.0116567611694336e-06, 2.209097146987915e-06, 2.4065375328063965e-06, 2.603977918624878e-06, 2.8014183044433594e-06, 2.998858690261841e-06, 3.1962990760803223e-06, 3.3937394618988037e-06, 3.591179847717285e-06, 3.7886202335357666e-06, 3.986060619354248e-06, 4.1835010051727295e-06, 4.380941390991211e-06, 4.578381776809692e-06, 4.775822162628174e-06, 4.973262548446655e-06, 5.170702934265137e-06, 5.368143320083618e-06, 5.5655837059021e-06, 5.763024091720581e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 3.0, 4.0, 13.0, 16.0, 11.0, 32.0, 59.0, 72.0, 154.0, 319.0, 737.0, 1582.0, 3657.0, 9373.0, 26616.0, 91826.0, 349333.0, 405304.0, 110304.0, 31169.0, 10530.0, 4195.0, 1673.0, 788.0, 372.0, 176.0, 102.0, 48.0, 33.0, 24.0, 9.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0222625732421875, -0.021645307540893555, -0.02102804183959961, -0.020410776138305664, -0.01979351043701172, -0.019176244735717773, -0.018558979034423828, -0.017941713333129883, -0.017324447631835938, -0.016707181930541992, -0.016089916229248047, -0.015472650527954102, -0.014855384826660156, -0.014238119125366211, -0.013620853424072266, -0.01300358772277832, -0.012386322021484375, -0.01176905632019043, -0.011151790618896484, -0.010534524917602539, -0.009917259216308594, -0.009299993515014648, -0.008682727813720703, -0.008065462112426758, -0.0074481964111328125, -0.006830930709838867, -0.006213665008544922, -0.0055963993072509766, -0.004979133605957031, -0.004361867904663086, -0.0037446022033691406, -0.0031273365020751953, -0.00251007080078125, -0.0018928050994873047, -0.0012755393981933594, -0.0006582736968994141, -4.100799560546875e-05, 0.0005762577056884766, 0.0011935234069824219, 0.0018107891082763672, 0.0024280548095703125, 0.003045320510864258, 0.003662586212158203, 0.0042798519134521484, 0.004897117614746094, 0.005514383316040039, 0.006131649017333984, 0.00674891471862793, 0.007366180419921875, 0.00798344612121582, 0.008600711822509766, 0.009217977523803711, 0.009835243225097656, 0.010452508926391602, 0.011069774627685547, 0.011687040328979492, 0.012304306030273438, 0.012921571731567383, 0.013538837432861328, 0.014156103134155273, 0.014773368835449219, 0.015390634536743164, 0.01600790023803711, 0.016625165939331055, 0.017242431640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 4.0, 10.0, 18.0, 19.0, 18.0, 20.0, 30.0, 44.0, 49.0, 63.0, 75.0, 70.0, 85.0, 90.0, 72.0, 45.0, 54.0, 43.0, 42.0, 27.0, 28.0, 21.0, 21.0, 6.0, 8.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184326171875, -0.017811059951782227, -0.017189502716064453, -0.01656794548034668, -0.015946388244628906, -0.015324831008911133, -0.01470327377319336, -0.014081716537475586, -0.013460159301757812, -0.012838602066040039, -0.012217044830322266, -0.011595487594604492, -0.010973930358886719, -0.010352373123168945, -0.009730815887451172, -0.009109258651733398, -0.008487701416015625, -0.007866144180297852, -0.007244586944580078, -0.006623029708862305, -0.006001472473144531, -0.005379915237426758, -0.004758358001708984, -0.004136800765991211, -0.0035152435302734375, -0.002893686294555664, -0.0022721290588378906, -0.0016505718231201172, -0.0010290145874023438, -0.0004074573516845703, 0.00021409988403320312, 0.0008356571197509766, 0.00145721435546875, 0.0020787715911865234, 0.002700328826904297, 0.0033218860626220703, 0.003943443298339844, 0.004565000534057617, 0.005186557769775391, 0.005808115005493164, 0.0064296722412109375, 0.007051229476928711, 0.007672786712646484, 0.008294343948364258, 0.008915901184082031, 0.009537458419799805, 0.010159015655517578, 0.010780572891235352, 0.011402130126953125, 0.012023687362670898, 0.012645244598388672, 0.013266801834106445, 0.013888359069824219, 0.014509916305541992, 0.015131473541259766, 0.01575303077697754, 0.016374588012695312, 0.016996145248413086, 0.01761770248413086, 0.018239259719848633, 0.018860816955566406, 0.01948237419128418, 0.020103931427001953, 0.020725488662719727, 0.0213470458984375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 12.0, 29.0, 140.0, 361.0, 319.0, 112.0, 26.0, 9.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.554503321647644, -0.5115044116973877, -0.46850547194480896, -0.4255065321922302, -0.3825076222419739, -0.33950871229171753, -0.2965097725391388, -0.25351083278656006, -0.2105119228363037, -0.16751299798488617, -0.12451407313346863, -0.08151514828205109, -0.038516223430633545, 0.004482701420783997, 0.04748162627220154, 0.09048056602478027, 0.13347947597503662, 0.17647840082645416, 0.2194773256778717, 0.26247626543045044, 0.3054751753807068, 0.34847408533096313, 0.39147302508354187, 0.4344719648361206, 0.47747087478637695, 0.5204697847366333, 0.5634686946868896, 0.6064676642417908, 0.6494665741920471, 0.6924654841423035, 0.7354644536972046, 0.7784633636474609, 0.8214621543884277, 0.8644610643386841, 0.9074599742889404, 0.9504589438438416, 0.9934578537940979, 1.036456823348999, 1.0794557332992554, 1.1224546432495117, 1.165453553199768, 1.2084524631500244, 1.2514513731002808, 1.294450283050537, 1.337449312210083, 1.3804482221603394, 1.4234471321105957, 1.466446042060852, 1.5094449520111084, 1.5524438619613647, 1.595442771911621, 1.6384416818618774, 1.6814405918121338, 1.7244396209716797, 1.767438530921936, 1.8104374408721924, 1.8534363508224487, 1.896435260772705, 1.9394341707229614, 1.9824330806732178, 2.0254321098327637, 2.0684309005737305, 2.1114299297332764, 2.1544289588928223, 2.197427749633789]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 7.0, 5.0, 14.0, 10.0, 12.0, 15.0, 22.0, 17.0, 29.0, 19.0, 36.0, 31.0, 36.0, 37.0, 41.0, 49.0, 49.0, 52.0, 64.0, 49.0, 41.0, 43.0, 34.0, 42.0, 24.0, 37.0, 30.0, 25.0, 21.0, 18.0, 19.0, 12.0, 12.0, 10.0, 7.0, 6.0, 7.0, 7.0, 8.0, 2.0, 4.0, 1.0, 4.0], "bins": [-0.4827003479003906, -0.47040027379989624, -0.45810016989707947, -0.4458000957965851, -0.4334999918937683, -0.4211999177932739, -0.40889984369277954, -0.39659976959228516, -0.3842996656894684, -0.371999591588974, -0.3596994876861572, -0.34739941358566284, -0.33509933948516846, -0.3227992355823517, -0.3104991614818573, -0.2981990575790405, -0.28589898347854614, -0.27359890937805176, -0.261298805475235, -0.2489987313747406, -0.23669864237308502, -0.22439855337142944, -0.21209847927093506, -0.19979839026927948, -0.1874983012676239, -0.17519821226596832, -0.16289812326431274, -0.15059804916381836, -0.13829796016216278, -0.1259978711605072, -0.11369778960943222, -0.10139770805835724, -0.08909761905670166, -0.07679753005504608, -0.0644974485039711, -0.05219736322760582, -0.03989727795124054, -0.02759719267487526, -0.01529710739850998, -0.0029970258474349976, 0.009303063154220581, 0.02160314843058586, 0.03390323370695114, 0.04620331898331642, 0.0585034042596817, 0.07080349326133728, 0.08310357481241226, 0.09540365636348724, 0.10770374536514282, 0.1200038343667984, 0.13230392336845398, 0.14460399746894836, 0.15690408647060394, 0.16920417547225952, 0.1815042495727539, 0.19380433857440948, 0.20610442757606506, 0.21840451657772064, 0.23070460557937622, 0.2430046796798706, 0.255304753780365, 0.26760485768318176, 0.27990493178367615, 0.2922050356864929, 0.3045051097869873]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 9.0, 10.0, 19.0, 18.0, 42.0, 66.0, 136.0, 210.0, 431.0, 931.0, 2404.0, 10315.0, 3918412.0, 248723.0, 8631.0, 2150.0, 865.0, 372.0, 215.0, 109.0, 80.0, 49.0, 24.0, 21.0, 11.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1280517578125, -0.1249246597290039, -0.12179756164550781, -0.11867046356201172, -0.11554336547851562, -0.11241626739501953, -0.10928916931152344, -0.10616207122802734, -0.10303497314453125, -0.09990787506103516, -0.09678077697753906, -0.09365367889404297, -0.09052658081054688, -0.08739948272705078, -0.08427238464355469, -0.0811452865600586, -0.0780181884765625, -0.0748910903930664, -0.07176399230957031, -0.06863689422607422, -0.06550979614257812, -0.06238269805908203, -0.05925559997558594, -0.056128501892089844, -0.05300140380859375, -0.049874305725097656, -0.04674720764160156, -0.04362010955810547, -0.040493011474609375, -0.03736591339111328, -0.03423881530761719, -0.031111717224121094, -0.027984619140625, -0.024857521057128906, -0.021730422973632812, -0.01860332489013672, -0.015476226806640625, -0.012349128723144531, -0.009222030639648438, -0.006094932556152344, -0.00296783447265625, 0.00015926361083984375, 0.0032863616943359375, 0.006413459777832031, 0.009540557861328125, 0.012667655944824219, 0.015794754028320312, 0.018921852111816406, 0.0220489501953125, 0.025176048278808594, 0.028303146362304688, 0.03143024444580078, 0.034557342529296875, 0.03768444061279297, 0.04081153869628906, 0.043938636779785156, 0.04706573486328125, 0.050192832946777344, 0.05331993103027344, 0.05644702911376953, 0.059574127197265625, 0.06270122528076172, 0.06582832336425781, 0.0689554214477539, 0.07208251953125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 10.0, 5.0, 3.0, 7.0, 16.0, 17.0, 29.0, 22.0, 38.0, 36.0, 41.0, 28.0, 40.0, 50.0, 49.0, 38.0, 53.0, 49.0, 46.0, 57.0, 39.0, 44.0, 56.0, 35.0, 37.0, 33.0, 17.0, 22.0, 11.0, 8.0, 14.0, 3.0, 13.0, 8.0, 9.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0185546875, -0.017944812774658203, -0.017334938049316406, -0.01672506332397461, -0.016115188598632812, -0.015505313873291016, -0.014895439147949219, -0.014285564422607422, -0.013675689697265625, -0.013065814971923828, -0.012455940246582031, -0.011846065521240234, -0.011236190795898438, -0.01062631607055664, -0.010016441345214844, -0.009406566619873047, -0.00879669189453125, -0.008186817169189453, -0.007576942443847656, -0.006967067718505859, -0.0063571929931640625, -0.005747318267822266, -0.005137443542480469, -0.004527568817138672, -0.003917694091796875, -0.003307819366455078, -0.0026979446411132812, -0.0020880699157714844, -0.0014781951904296875, -0.0008683204650878906, -0.00025844573974609375, 0.0003514289855957031, 0.0009613037109375, 0.0015711784362792969, 0.0021810531616210938, 0.0027909278869628906, 0.0034008026123046875, 0.004010677337646484, 0.004620552062988281, 0.005230426788330078, 0.005840301513671875, 0.006450176239013672, 0.007060050964355469, 0.007669925689697266, 0.008279800415039062, 0.00888967514038086, 0.009499549865722656, 0.010109424591064453, 0.01071929931640625, 0.011329174041748047, 0.011939048767089844, 0.01254892349243164, 0.013158798217773438, 0.013768672943115234, 0.014378547668457031, 0.014988422393798828, 0.015598297119140625, 0.016208171844482422, 0.01681804656982422, 0.017427921295166016, 0.018037796020507812, 0.01864767074584961, 0.019257545471191406, 0.019867420196533203, 0.020477294921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 12.0, 14.0, 13.0, 18.0, 22.0, 33.0, 44.0, 51.0, 59.0, 101.0, 117.0, 152.0, 208.0, 255.0, 381.0, 532.0, 742.0, 1209.0, 2063.0, 3886.0, 8001.0, 21294.0, 85599.0, 3822450.0, 189099.0, 34290.0, 11232.0, 5051.0, 2607.0, 1460.0, 925.0, 662.0, 431.0, 309.0, 237.0, 187.0, 106.0, 117.0, 74.0, 63.0, 35.0, 44.0, 25.0, 17.0, 16.0, 11.0, 11.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.031646728515625, -0.030678749084472656, -0.029710769653320312, -0.02874279022216797, -0.027774810791015625, -0.02680683135986328, -0.025838851928710938, -0.024870872497558594, -0.02390289306640625, -0.022934913635253906, -0.021966934204101562, -0.02099895477294922, -0.020030975341796875, -0.01906299591064453, -0.018095016479492188, -0.017127037048339844, -0.0161590576171875, -0.015191078186035156, -0.014223098754882812, -0.013255119323730469, -0.012287139892578125, -0.011319160461425781, -0.010351181030273438, -0.009383201599121094, -0.00841522216796875, -0.007447242736816406, -0.0064792633056640625, -0.005511283874511719, -0.004543304443359375, -0.0035753250122070312, -0.0026073455810546875, -0.0016393661499023438, -0.00067138671875, 0.00029659271240234375, 0.0012645721435546875, 0.0022325515747070312, 0.003200531005859375, 0.004168510437011719, 0.0051364898681640625, 0.006104469299316406, 0.00707244873046875, 0.008040428161621094, 0.009008407592773438, 0.009976387023925781, 0.010944366455078125, 0.011912345886230469, 0.012880325317382812, 0.013848304748535156, 0.0148162841796875, 0.015784263610839844, 0.016752243041992188, 0.01772022247314453, 0.018688201904296875, 0.01965618133544922, 0.020624160766601562, 0.021592140197753906, 0.02256011962890625, 0.023528099060058594, 0.024496078491210938, 0.02546405792236328, 0.026432037353515625, 0.02740001678466797, 0.028367996215820312, 0.029335975646972656, 0.030303955078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 16.0, 9.0, 16.0, 31.0, 66.0, 113.0, 365.0, 3133.0, 135.0, 54.0, 47.0, 17.0, 13.0, 12.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01078033447265625, -0.010464191436767578, -0.010148048400878906, -0.009831905364990234, -0.009515762329101562, -0.00919961929321289, -0.008883476257324219, -0.008567333221435547, -0.008251190185546875, -0.007935047149658203, -0.007618904113769531, -0.007302761077880859, -0.0069866180419921875, -0.006670475006103516, -0.006354331970214844, -0.006038188934326172, -0.0057220458984375, -0.005405902862548828, -0.005089759826660156, -0.004773616790771484, -0.0044574737548828125, -0.004141330718994141, -0.0038251876831054688, -0.003509044647216797, -0.003192901611328125, -0.002876758575439453, -0.0025606155395507812, -0.0022444725036621094, -0.0019283294677734375, -0.0016121864318847656, -0.0012960433959960938, -0.0009799003601074219, -0.00066375732421875, -0.0003476142883300781, -3.147125244140625e-05, 0.0002846717834472656, 0.0006008148193359375, 0.0009169578552246094, 0.0012331008911132812, 0.0015492439270019531, 0.001865386962890625, 0.002181529998779297, 0.0024976730346679688, 0.0028138160705566406, 0.0031299591064453125, 0.0034461021423339844, 0.0037622451782226562, 0.004078388214111328, 0.00439453125, 0.004710674285888672, 0.005026817321777344, 0.005342960357666016, 0.0056591033935546875, 0.005975246429443359, 0.006291389465332031, 0.006607532501220703, 0.006923675537109375, 0.007239818572998047, 0.007555961608886719, 0.00787210464477539, 0.008188247680664062, 0.008504390716552734, 0.008820533752441406, 0.009136676788330078, 0.00945281982421875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 15.0, 15.0, 35.0, 52.0, 71.0, 102.0, 129.0, 141.0, 142.0, 107.0, 83.0, 39.0, 27.0, 12.0, 12.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06282146275043488, -0.061213742941617966, -0.059606023132801056, -0.057998303323984146, -0.056390583515167236, -0.054782867431640625, -0.05317514389753342, -0.051567427814006805, -0.049959708005189896, -0.048351988196372986, -0.046744268387556076, -0.045136548578739166, -0.043528828769922256, -0.04192110896110535, -0.040313392877578735, -0.038705673068761826, -0.037097953259944916, -0.035490233451128006, -0.033882513642311096, -0.032274793833494186, -0.030667075887322426, -0.029059356078505516, -0.027451636269688606, -0.025843918323516846, -0.024236194789409637, -0.022628474980592728, -0.021020755171775818, -0.019413035362958908, -0.017805317416787148, -0.016197597607970238, -0.014589877799153328, -0.012982158921658993, -0.011374440044164658, -0.009766720235347748, -0.008159001357853413, -0.006551281549036503, -0.00494356220588088, -0.003335842862725258, -0.001728123053908348, -0.00012040417641401291, 0.0014873156324028969, 0.0030950349755585194, 0.004702754318714142, 0.006310474127531052, 0.007918193936347961, 0.009525912813842297, 0.011133632622659206, 0.012741351500153542, 0.014349071308970451, 0.01595679111778736, 0.01756451092660427, 0.01917222887277603, 0.02077994868159294, 0.02238766849040985, 0.02399538829922676, 0.02560310810804367, 0.02721082791686058, 0.02881854772567749, 0.0304262675344944, 0.03203398734331131, 0.03364170715212822, 0.03524942696094513, 0.03685714304447174, 0.03846486285328865, 0.04007258266210556]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 9.0, 5.0, 15.0, 12.0, 16.0, 17.0, 21.0, 26.0, 25.0, 31.0, 27.0, 31.0, 23.0, 36.0, 39.0, 29.0, 35.0, 53.0, 39.0, 42.0, 53.0, 33.0, 34.0, 32.0, 34.0, 36.0, 31.0, 31.0, 20.0, 28.0, 23.0, 18.0, 20.0, 20.0, 10.0, 11.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.021174967288970947, -0.020530428737401962, -0.019885890185832977, -0.019241351634263992, -0.018596813082695007, -0.017952274531126022, -0.017307735979557037, -0.016663197427988052, -0.016018658876419067, -0.015374120324850082, -0.014729581773281097, -0.014085043221712112, -0.013440504670143127, -0.012795966118574142, -0.012151427567005157, -0.011506889015436172, -0.010862350463867188, -0.010217811912298203, -0.009573273360729218, -0.008928734809160233, -0.008284196257591248, -0.007639657706022263, -0.006995119154453278, -0.006350580602884293, -0.005706042051315308, -0.005061503499746323, -0.004416964948177338, -0.0037724263966083527, -0.0031278878450393677, -0.0024833492934703827, -0.0018388107419013977, -0.0011942721903324127, -0.0005497336387634277, 9.480491280555725e-05, 0.0007393434643745422, 0.0013838820159435272, 0.002028420567512512, 0.002672959119081497, 0.003317497670650482, 0.003962036222219467, 0.004606574773788452, 0.005251113325357437, 0.005895651876926422, 0.006540190428495407, 0.007184728980064392, 0.007829267531633377, 0.008473806083202362, 0.009118344634771347, 0.009762883186340332, 0.010407421737909317, 0.011051960289478302, 0.011696498841047287, 0.012341037392616272, 0.012985575944185257, 0.013630114495754242, 0.014274653047323227, 0.014919191598892212, 0.015563730150461197, 0.016208268702030182, 0.016852807253599167, 0.017497345805168152, 0.018141884356737137, 0.018786422908306122, 0.019430961459875107, 0.020075500011444092]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 18.0, 20.0, 15.0, 49.0, 80.0, 115.0, 179.0, 332.0, 649.0, 1246.0, 2809.0, 6777.0, 18764.0, 56488.0, 184928.0, 406313.0, 250590.0, 78009.0, 25210.0, 9075.0, 3604.0, 1547.0, 731.0, 403.0, 234.0, 107.0, 84.0, 57.0, 32.0, 31.0, 11.0, 7.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04290771484375, -0.04140949249267578, -0.03991127014160156, -0.038413047790527344, -0.036914825439453125, -0.035416603088378906, -0.03391838073730469, -0.03242015838623047, -0.03092193603515625, -0.02942371368408203, -0.027925491333007812, -0.026427268981933594, -0.024929046630859375, -0.023430824279785156, -0.021932601928710938, -0.02043437957763672, -0.0189361572265625, -0.01743793487548828, -0.015939712524414062, -0.014441490173339844, -0.012943267822265625, -0.011445045471191406, -0.009946823120117188, -0.008448600769042969, -0.00695037841796875, -0.005452156066894531, -0.0039539337158203125, -0.0024557113647460938, -0.000957489013671875, 0.0005407333374023438, 0.0020389556884765625, 0.0035371780395507812, 0.005035400390625, 0.006533622741699219, 0.008031845092773438, 0.009530067443847656, 0.011028289794921875, 0.012526512145996094, 0.014024734497070312, 0.015522956848144531, 0.01702117919921875, 0.01851940155029297, 0.020017623901367188, 0.021515846252441406, 0.023014068603515625, 0.024512290954589844, 0.026010513305664062, 0.02750873565673828, 0.0290069580078125, 0.03050518035888672, 0.03200340270996094, 0.033501625061035156, 0.034999847412109375, 0.036498069763183594, 0.03799629211425781, 0.03949451446533203, 0.04099273681640625, 0.04249095916748047, 0.04398918151855469, 0.045487403869628906, 0.046985626220703125, 0.048483848571777344, 0.04998207092285156, 0.05148029327392578, 0.052978515625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 7.0, 14.0, 24.0, 15.0, 34.0, 28.0, 30.0, 43.0, 36.0, 52.0, 47.0, 45.0, 52.0, 44.0, 44.0, 47.0, 53.0, 55.0, 39.0, 44.0, 34.0, 44.0, 27.0, 10.0, 16.0, 18.0, 13.0, 12.0, 9.0, 12.0, 11.0, 5.0, 3.0, 6.0, 4.0, 4.0, 0.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0192108154296875, -0.018580198287963867, -0.017949581146240234, -0.0173189640045166, -0.01668834686279297, -0.016057729721069336, -0.015427112579345703, -0.01479649543762207, -0.014165878295898438, -0.013535261154174805, -0.012904644012451172, -0.012274026870727539, -0.011643409729003906, -0.011012792587280273, -0.01038217544555664, -0.009751558303833008, -0.009120941162109375, -0.008490324020385742, -0.00785970687866211, -0.0072290897369384766, -0.006598472595214844, -0.005967855453491211, -0.005337238311767578, -0.004706621170043945, -0.0040760040283203125, -0.0034453868865966797, -0.002814769744873047, -0.002184152603149414, -0.0015535354614257812, -0.0009229183197021484, -0.0002923011779785156, 0.0003383159637451172, 0.00096893310546875, 0.0015995502471923828, 0.0022301673889160156, 0.0028607845306396484, 0.0034914016723632812, 0.004122018814086914, 0.004752635955810547, 0.00538325309753418, 0.0060138702392578125, 0.006644487380981445, 0.007275104522705078, 0.007905721664428711, 0.008536338806152344, 0.009166955947875977, 0.00979757308959961, 0.010428190231323242, 0.011058807373046875, 0.011689424514770508, 0.01232004165649414, 0.012950658798217773, 0.013581275939941406, 0.014211893081665039, 0.014842510223388672, 0.015473127365112305, 0.016103744506835938, 0.01673436164855957, 0.017364978790283203, 0.017995595932006836, 0.01862621307373047, 0.0192568302154541, 0.019887447357177734, 0.020518064498901367, 0.021148681640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 9.0, 15.0, 20.0, 12.0, 32.0, 40.0, 36.0, 54.0, 125.0, 175.0, 312.0, 608.0, 1661.0, 5057.0, 19459.0, 106178.0, 621306.0, 244513.0, 36107.0, 8387.0, 2554.0, 853.0, 385.0, 187.0, 113.0, 95.0, 68.0, 36.0, 29.0, 23.0, 15.0, 22.0, 12.0, 12.0, 11.0, 6.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055938720703125, -0.053919315338134766, -0.05189990997314453, -0.0498805046081543, -0.04786109924316406, -0.04584169387817383, -0.043822288513183594, -0.04180288314819336, -0.039783477783203125, -0.03776407241821289, -0.035744667053222656, -0.03372526168823242, -0.03170585632324219, -0.029686450958251953, -0.02766704559326172, -0.025647640228271484, -0.02362823486328125, -0.021608829498291016, -0.01958942413330078, -0.017570018768310547, -0.015550613403320312, -0.013531208038330078, -0.011511802673339844, -0.00949239730834961, -0.007472991943359375, -0.005453586578369141, -0.0034341812133789062, -0.0014147758483886719, 0.0006046295166015625, 0.002624034881591797, 0.004643440246582031, 0.006662845611572266, 0.0086822509765625, 0.010701656341552734, 0.012721061706542969, 0.014740467071533203, 0.016759872436523438, 0.018779277801513672, 0.020798683166503906, 0.02281808853149414, 0.024837493896484375, 0.02685689926147461, 0.028876304626464844, 0.030895709991455078, 0.03291511535644531, 0.03493452072143555, 0.03695392608642578, 0.038973331451416016, 0.04099273681640625, 0.043012142181396484, 0.04503154754638672, 0.04705095291137695, 0.04907035827636719, 0.05108976364135742, 0.053109169006347656, 0.05512857437133789, 0.057147979736328125, 0.05916738510131836, 0.061186790466308594, 0.06320619583129883, 0.06522560119628906, 0.0672450065612793, 0.06926441192626953, 0.07128381729125977, 0.07330322265625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 7.0, 10.0, 18.0, 20.0, 29.0, 20.0, 25.0, 30.0, 35.0, 40.0, 35.0, 44.0, 42.0, 49.0, 43.0, 51.0, 45.0, 50.0, 41.0, 55.0, 37.0, 37.0, 34.0, 27.0, 25.0, 27.0, 19.0, 21.0, 12.0, 10.0, 12.0, 12.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0863037109375, -0.08392143249511719, -0.08153915405273438, -0.07915687561035156, -0.07677459716796875, -0.07439231872558594, -0.07201004028320312, -0.06962776184082031, -0.0672454833984375, -0.06486320495605469, -0.062480926513671875, -0.06009864807128906, -0.05771636962890625, -0.05533409118652344, -0.052951812744140625, -0.05056953430175781, -0.048187255859375, -0.04580497741699219, -0.043422698974609375, -0.04104042053222656, -0.03865814208984375, -0.03627586364746094, -0.033893585205078125, -0.03151130676269531, -0.0291290283203125, -0.026746749877929688, -0.024364471435546875, -0.021982192993164062, -0.01959991455078125, -0.017217636108398438, -0.014835357666015625, -0.012453079223632812, -0.01007080078125, -0.0076885223388671875, -0.005306243896484375, -0.0029239654541015625, -0.00054168701171875, 0.0018405914306640625, 0.004222869873046875, 0.0066051483154296875, 0.0089874267578125, 0.011369705200195312, 0.013751983642578125, 0.016134262084960938, 0.01851654052734375, 0.020898818969726562, 0.023281097412109375, 0.025663375854492188, 0.028045654296875, 0.030427932739257812, 0.032810211181640625, 0.03519248962402344, 0.03757476806640625, 0.03995704650878906, 0.042339324951171875, 0.04472160339355469, 0.0471038818359375, 0.04948616027832031, 0.051868438720703125, 0.05425071716308594, 0.05663299560546875, 0.05901527404785156, 0.061397552490234375, 0.06377983093261719, 0.066162109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 11.0, 22.0, 38.0, 61.0, 114.0, 176.0, 275.0, 551.0, 1143.0, 2730.0, 9003.0, 57146.0, 671603.0, 272805.0, 24061.0, 5180.0, 1788.0, 829.0, 418.0, 219.0, 126.0, 96.0, 60.0, 39.0, 19.0, 11.0, 6.0, 0.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.036651611328125, -0.035730600357055664, -0.03480958938598633, -0.03388857841491699, -0.032967567443847656, -0.03204655647277832, -0.031125545501708984, -0.03020453453063965, -0.029283523559570312, -0.028362512588500977, -0.02744150161743164, -0.026520490646362305, -0.02559947967529297, -0.024678468704223633, -0.023757457733154297, -0.02283644676208496, -0.021915435791015625, -0.02099442481994629, -0.020073413848876953, -0.019152402877807617, -0.01823139190673828, -0.017310380935668945, -0.01638936996459961, -0.015468358993530273, -0.014547348022460938, -0.013626337051391602, -0.012705326080322266, -0.01178431510925293, -0.010863304138183594, -0.009942293167114258, -0.009021282196044922, -0.008100271224975586, -0.00717926025390625, -0.006258249282836914, -0.005337238311767578, -0.004416227340698242, -0.0034952163696289062, -0.0025742053985595703, -0.0016531944274902344, -0.0007321834564208984, 0.0001888275146484375, 0.0011098384857177734, 0.0020308494567871094, 0.0029518604278564453, 0.0038728713989257812, 0.004793882369995117, 0.005714893341064453, 0.006635904312133789, 0.007556915283203125, 0.008477926254272461, 0.009398937225341797, 0.010319948196411133, 0.011240959167480469, 0.012161970138549805, 0.01308298110961914, 0.014003992080688477, 0.014925003051757812, 0.01584601402282715, 0.016767024993896484, 0.01768803596496582, 0.018609046936035156, 0.019530057907104492, 0.020451068878173828, 0.021372079849243164, 0.0222930908203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 12.0, 9.0, 19.0, 28.0, 33.0, 27.0, 54.0, 59.0, 69.0, 72.0, 95.0, 86.0, 78.0, 66.0, 70.0, 59.0, 42.0, 22.0, 21.0, 20.0, 13.0, 10.0, 11.0, 7.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.332993507385254e-06, -6.109476089477539e-06, -5.885958671569824e-06, -5.662441253662109e-06, -5.4389238357543945e-06, -5.21540641784668e-06, -4.991888999938965e-06, -4.76837158203125e-06, -4.544854164123535e-06, -4.32133674621582e-06, -4.0978193283081055e-06, -3.874301910400391e-06, -3.6507844924926758e-06, -3.427267074584961e-06, -3.203749656677246e-06, -2.9802322387695312e-06, -2.7567148208618164e-06, -2.5331974029541016e-06, -2.3096799850463867e-06, -2.086162567138672e-06, -1.862645149230957e-06, -1.6391277313232422e-06, -1.4156103134155273e-06, -1.1920928955078125e-06, -9.685754776000977e-07, -7.450580596923828e-07, -5.21540641784668e-07, -2.980232238769531e-07, -7.450580596923828e-08, 1.4901161193847656e-07, 3.725290298461914e-07, 5.960464477539062e-07, 8.195638656616211e-07, 1.043081283569336e-06, 1.2665987014770508e-06, 1.4901161193847656e-06, 1.7136335372924805e-06, 1.9371509552001953e-06, 2.16066837310791e-06, 2.384185791015625e-06, 2.60770320892334e-06, 2.8312206268310547e-06, 3.0547380447387695e-06, 3.2782554626464844e-06, 3.5017728805541992e-06, 3.725290298461914e-06, 3.948807716369629e-06, 4.172325134277344e-06, 4.395842552185059e-06, 4.6193599700927734e-06, 4.842877388000488e-06, 5.066394805908203e-06, 5.289912223815918e-06, 5.513429641723633e-06, 5.736947059631348e-06, 5.9604644775390625e-06, 6.183981895446777e-06, 6.407499313354492e-06, 6.631016731262207e-06, 6.854534149169922e-06, 7.078051567077637e-06, 7.3015689849853516e-06, 7.525086402893066e-06, 7.748603820800781e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 10.0, 7.0, 18.0, 23.0, 33.0, 43.0, 92.0, 129.0, 179.0, 355.0, 553.0, 1203.0, 2899.0, 9383.0, 55761.0, 536981.0, 389010.0, 39385.0, 7680.0, 2413.0, 1005.0, 565.0, 300.0, 177.0, 126.0, 66.0, 59.0, 20.0, 28.0, 10.0, 11.0, 6.0, 6.0, 2.0, 9.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0257568359375, -0.024866104125976562, -0.023975372314453125, -0.023084640502929688, -0.02219390869140625, -0.021303176879882812, -0.020412445068359375, -0.019521713256835938, -0.0186309814453125, -0.017740249633789062, -0.016849517822265625, -0.015958786010742188, -0.01506805419921875, -0.014177322387695312, -0.013286590576171875, -0.012395858764648438, -0.011505126953125, -0.010614395141601562, -0.009723663330078125, -0.008832931518554688, -0.00794219970703125, -0.0070514678955078125, -0.006160736083984375, -0.0052700042724609375, -0.0043792724609375, -0.0034885406494140625, -0.002597808837890625, -0.0017070770263671875, -0.00081634521484375, 7.43865966796875e-05, 0.000965118408203125, 0.0018558502197265625, 0.00274658203125, 0.0036373138427734375, 0.004528045654296875, 0.0054187774658203125, 0.00630950927734375, 0.0072002410888671875, 0.008090972900390625, 0.008981704711914062, 0.0098724365234375, 0.010763168334960938, 0.011653900146484375, 0.012544631958007812, 0.01343536376953125, 0.014326095581054688, 0.015216827392578125, 0.016107559204101562, 0.016998291015625, 0.017889022827148438, 0.018779754638671875, 0.019670486450195312, 0.02056121826171875, 0.021451950073242188, 0.022342681884765625, 0.023233413696289062, 0.0241241455078125, 0.025014877319335938, 0.025905609130859375, 0.026796340942382812, 0.02768707275390625, 0.028577804565429688, 0.029468536376953125, 0.030359268188476562, 0.03125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 17.0, 24.0, 31.0, 37.0, 64.0, 81.0, 115.0, 119.0, 131.0, 121.0, 77.0, 69.0, 34.0, 26.0, 17.0, 12.0, 8.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038299560546875, -0.03726387023925781, -0.036228179931640625, -0.03519248962402344, -0.03415679931640625, -0.03312110900878906, -0.032085418701171875, -0.031049728393554688, -0.0300140380859375, -0.028978347778320312, -0.027942657470703125, -0.026906967163085938, -0.02587127685546875, -0.024835586547851562, -0.023799896240234375, -0.022764205932617188, -0.021728515625, -0.020692825317382812, -0.019657135009765625, -0.018621444702148438, -0.01758575439453125, -0.016550064086914062, -0.015514373779296875, -0.014478683471679688, -0.0134429931640625, -0.012407302856445312, -0.011371612548828125, -0.010335922241210938, -0.00930023193359375, -0.008264541625976562, -0.007228851318359375, -0.0061931610107421875, -0.005157470703125, -0.0041217803955078125, -0.003086090087890625, -0.0020503997802734375, -0.00101470947265625, 2.09808349609375e-05, 0.001056671142578125, 0.0020923614501953125, 0.0031280517578125, 0.0041637420654296875, 0.005199432373046875, 0.0062351226806640625, 0.00727081298828125, 0.008306503295898438, 0.009342193603515625, 0.010377883911132812, 0.01141357421875, 0.012449264526367188, 0.013484954833984375, 0.014520645141601562, 0.01555633544921875, 0.016592025756835938, 0.017627716064453125, 0.018663406372070312, 0.0196990966796875, 0.020734786987304688, 0.021770477294921875, 0.022806167602539062, 0.02384185791015625, 0.024877548217773438, 0.025913238525390625, 0.026948928833007812, 0.027984619140625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 16.0, 15.0, 25.0, 45.0, 73.0, 108.0, 123.0, 158.0, 131.0, 96.0, 82.0, 58.0, 40.0, 17.0, 5.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5062981247901917, -0.491531640291214, -0.47676515579223633, -0.46199867129325867, -0.447232186794281, -0.43246573209762573, -0.41769924759864807, -0.4029327630996704, -0.38816627860069275, -0.3733997941017151, -0.3586333096027374, -0.34386682510375977, -0.3291003704071045, -0.31433385610580444, -0.29956740140914917, -0.2848009169101715, -0.27003443241119385, -0.2552679479122162, -0.24050146341323853, -0.22573499381542206, -0.2109685093164444, -0.19620202481746674, -0.18143555521965027, -0.1666690707206726, -0.15190258622169495, -0.13713610172271729, -0.12236962467432022, -0.10760314762592316, -0.0928366631269455, -0.07807017862796783, -0.06330370157957077, -0.048537224531173706, -0.033770740032196045, -0.019004259258508682, -0.00423777848482132, 0.010528702288866043, 0.025295183062553406, 0.04006166756153107, 0.05482814460992813, 0.0695946216583252, 0.08436110615730286, 0.09912759065628052, 0.11389406770467758, 0.12866054475307465, 0.1434270292520523, 0.15819351375102997, 0.17295998334884644, 0.1877264678478241, 0.20249295234680176, 0.21725943684577942, 0.23202592134475708, 0.24679239094257355, 0.2615588903427124, 0.2763253450393677, 0.29109182953834534, 0.305858314037323, 0.32062479853630066, 0.3353912830352783, 0.350157767534256, 0.36492425203323364, 0.3796907067298889, 0.39445722103118896, 0.40922367572784424, 0.4239901602268219, 0.43875664472579956]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 8.0, 12.0, 21.0, 14.0, 16.0, 19.0, 19.0, 31.0, 28.0, 33.0, 51.0, 43.0, 62.0, 51.0, 56.0, 46.0, 61.0, 48.0, 45.0, 39.0, 50.0, 40.0, 28.0, 32.0, 19.0, 20.0, 27.0, 14.0, 13.0, 10.0, 11.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.362491250038147, -0.3505464792251587, -0.3386017084121704, -0.32665690779685974, -0.31471213698387146, -0.3027673661708832, -0.2908225953578949, -0.27887779474258423, -0.26693302392959595, -0.25498825311660767, -0.2430434674024582, -0.2310986965894699, -0.21915391087532043, -0.20720914006233215, -0.19526436924934387, -0.1833195835351944, -0.17137481272220612, -0.15943004190921783, -0.14748525619506836, -0.13554048538208008, -0.1235956996679306, -0.11165092885494232, -0.09970615059137344, -0.08776137232780457, -0.07581659406423569, -0.06387181580066681, -0.05192703753709793, -0.03998226299881935, -0.028037484735250473, -0.016092706471681595, -0.004147931933403015, 0.007796846330165863, 0.01974162459373474, 0.03168640285730362, 0.0436311811208725, 0.05557595565915108, 0.06752073764801025, 0.07946550846099854, 0.09141028672456741, 0.10335506498813629, 0.11529984325170517, 0.12724462151527405, 0.13918939232826233, 0.1511341780424118, 0.16307894885540009, 0.17502373456954956, 0.18696850538253784, 0.19891327619552612, 0.2108580619096756, 0.22280283272266388, 0.23474761843681335, 0.24669238924980164, 0.2586371600627899, 0.2705819606781006, 0.28252673149108887, 0.29447150230407715, 0.30641627311706543, 0.3183610439300537, 0.330305814743042, 0.34225061535835266, 0.35419538617134094, 0.3661401569843292, 0.3780849277973175, 0.3900297284126282, 0.40197449922561646]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 11.0, 5.0, 9.0, 13.0, 20.0, 15.0, 32.0, 53.0, 46.0, 67.0, 133.0, 369.0, 2415.0, 4143212.0, 45958.0, 1331.0, 259.0, 102.0, 54.0, 50.0, 33.0, 30.0, 19.0, 16.0, 8.0, 8.0, 8.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24286651611328125, -0.2352447509765625, -0.22762298583984375, -0.220001220703125, -0.21237945556640625, -0.2047576904296875, -0.19713592529296875, -0.18951416015625, -0.18189239501953125, -0.1742706298828125, -0.16664886474609375, -0.159027099609375, -0.15140533447265625, -0.1437835693359375, -0.13616180419921875, -0.1285400390625, -0.12091827392578125, -0.1132965087890625, -0.10567474365234375, -0.098052978515625, -0.09043121337890625, -0.0828094482421875, -0.07518768310546875, -0.06756591796875, -0.05994415283203125, -0.0523223876953125, -0.04470062255859375, -0.037078857421875, -0.02945709228515625, -0.0218353271484375, -0.01421356201171875, -0.006591796875, 0.00102996826171875, 0.0086517333984375, 0.01627349853515625, 0.023895263671875, 0.03151702880859375, 0.0391387939453125, 0.04676055908203125, 0.05438232421875, 0.06200408935546875, 0.0696258544921875, 0.07724761962890625, 0.084869384765625, 0.09249114990234375, 0.1001129150390625, 0.10773468017578125, 0.1153564453125, 0.12297821044921875, 0.1305999755859375, 0.13822174072265625, 0.145843505859375, 0.15346527099609375, 0.1610870361328125, 0.16870880126953125, 0.17633056640625, 0.18395233154296875, 0.1915740966796875, 0.19919586181640625, 0.206817626953125, 0.21443939208984375, 0.2220611572265625, 0.22968292236328125, 0.2373046875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 6.0, 14.0, 17.0, 18.0, 26.0, 38.0, 20.0, 34.0, 45.0, 59.0, 36.0, 53.0, 53.0, 41.0, 52.0, 46.0, 44.0, 41.0, 34.0, 40.0, 32.0, 36.0, 33.0, 23.0, 24.0, 17.0, 14.0, 10.0, 7.0, 8.0, 8.0, 11.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0183868408203125, -0.01778554916381836, -0.01718425750732422, -0.016582965850830078, -0.015981674194335938, -0.015380382537841797, -0.014779090881347656, -0.014177799224853516, -0.013576507568359375, -0.012975215911865234, -0.012373924255371094, -0.011772632598876953, -0.011171340942382812, -0.010570049285888672, -0.009968757629394531, -0.00936746597290039, -0.00876617431640625, -0.00816488265991211, -0.007563591003417969, -0.006962299346923828, -0.0063610076904296875, -0.005759716033935547, -0.005158424377441406, -0.004557132720947266, -0.003955841064453125, -0.0033545494079589844, -0.0027532577514648438, -0.002151966094970703, -0.0015506744384765625, -0.0009493827819824219, -0.00034809112548828125, 0.0002532005310058594, 0.0008544921875, 0.0014557838439941406, 0.0020570755004882812, 0.002658367156982422, 0.0032596588134765625, 0.003860950469970703, 0.004462242126464844, 0.005063533782958984, 0.005664825439453125, 0.006266117095947266, 0.006867408752441406, 0.007468700408935547, 0.008069992065429688, 0.008671283721923828, 0.009272575378417969, 0.00987386703491211, 0.01047515869140625, 0.01107645034790039, 0.011677742004394531, 0.012279033660888672, 0.012880325317382812, 0.013481616973876953, 0.014082908630371094, 0.014684200286865234, 0.015285491943359375, 0.015886783599853516, 0.016488075256347656, 0.017089366912841797, 0.017690658569335938, 0.018291950225830078, 0.01889324188232422, 0.01949453353881836, 0.0200958251953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 11.0, 5.0, 7.0, 16.0, 30.0, 33.0, 56.0, 64.0, 102.0, 147.0, 179.0, 286.0, 375.0, 582.0, 874.0, 1487.0, 2814.0, 6902.0, 25667.0, 3830295.0, 289215.0, 21960.0, 6232.0, 2687.0, 1438.0, 919.0, 577.0, 391.0, 278.0, 176.0, 140.0, 88.0, 73.0, 56.0, 29.0, 33.0, 12.0, 11.0, 10.0, 5.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046783447265625, -0.04544496536254883, -0.044106483459472656, -0.042768001556396484, -0.04142951965332031, -0.04009103775024414, -0.03875255584716797, -0.0374140739440918, -0.036075592041015625, -0.03473711013793945, -0.03339862823486328, -0.03206014633178711, -0.030721664428710938, -0.029383182525634766, -0.028044700622558594, -0.026706218719482422, -0.02536773681640625, -0.024029254913330078, -0.022690773010253906, -0.021352291107177734, -0.020013809204101562, -0.01867532730102539, -0.01733684539794922, -0.015998363494873047, -0.014659881591796875, -0.013321399688720703, -0.011982917785644531, -0.01064443588256836, -0.009305953979492188, -0.007967472076416016, -0.006628990173339844, -0.005290508270263672, -0.0039520263671875, -0.002613544464111328, -0.0012750625610351562, 6.341934204101562e-05, 0.0014019012451171875, 0.0027403831481933594, 0.004078865051269531, 0.005417346954345703, 0.006755828857421875, 0.008094310760498047, 0.009432792663574219, 0.01077127456665039, 0.012109756469726562, 0.013448238372802734, 0.014786720275878906, 0.016125202178955078, 0.01746368408203125, 0.018802165985107422, 0.020140647888183594, 0.021479129791259766, 0.022817611694335938, 0.02415609359741211, 0.02549457550048828, 0.026833057403564453, 0.028171539306640625, 0.029510021209716797, 0.03084850311279297, 0.03218698501586914, 0.03352546691894531, 0.034863948822021484, 0.036202430725097656, 0.03754091262817383, 0.03887939453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 13.0, 16.0, 34.0, 66.0, 326.0, 3384.0, 93.0, 47.0, 28.0, 12.0, 10.0, 9.0, 7.0, 4.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01153564453125, -0.011215686798095703, -0.010895729064941406, -0.01057577133178711, -0.010255813598632812, -0.009935855865478516, -0.009615898132324219, -0.009295940399169922, -0.008975982666015625, -0.008656024932861328, -0.008336067199707031, -0.008016109466552734, -0.0076961517333984375, -0.007376194000244141, -0.007056236267089844, -0.006736278533935547, -0.00641632080078125, -0.006096363067626953, -0.005776405334472656, -0.005456447601318359, -0.0051364898681640625, -0.004816532135009766, -0.004496574401855469, -0.004176616668701172, -0.003856658935546875, -0.003536701202392578, -0.0032167434692382812, -0.0028967857360839844, -0.0025768280029296875, -0.0022568702697753906, -0.0019369125366210938, -0.0016169548034667969, -0.0012969970703125, -0.0009770393371582031, -0.0006570816040039062, -0.0003371238708496094, -1.71661376953125e-05, 0.0003027915954589844, 0.0006227493286132812, 0.0009427070617675781, 0.001262664794921875, 0.0015826225280761719, 0.0019025802612304688, 0.0022225379943847656, 0.0025424957275390625, 0.0028624534606933594, 0.0031824111938476562, 0.003502368927001953, 0.00382232666015625, 0.004142284393310547, 0.004462242126464844, 0.004782199859619141, 0.0051021575927734375, 0.005422115325927734, 0.005742073059082031, 0.006062030792236328, 0.006381988525390625, 0.006701946258544922, 0.007021903991699219, 0.007341861724853516, 0.0076618194580078125, 0.00798177719116211, 0.008301734924316406, 0.008621692657470703, 0.008941650390625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 13.0, 15.0, 16.0, 28.0, 49.0, 78.0, 106.0, 165.0, 139.0, 134.0, 101.0, 64.0, 46.0, 16.0, 17.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06406395137310028, -0.06256478279829025, -0.06106560677289963, -0.0595664344727993, -0.058067262172698975, -0.05656809359788895, -0.05506891757249832, -0.05356974899768829, -0.05207057669758797, -0.05057140439748764, -0.049072232097387314, -0.04757305979728699, -0.04607388749718666, -0.044574715197086334, -0.043075546622276306, -0.04157637432217598, -0.04007720202207565, -0.03857802972197533, -0.037078857421875, -0.03557968512177467, -0.03408051282167435, -0.03258134424686432, -0.031082170084118843, -0.029582999646663666, -0.02808382362127304, -0.026584651321172714, -0.025085479021072388, -0.02358630672097206, -0.022087136283516884, -0.020587963983416557, -0.01908879168331623, -0.017589621245861053, -0.016090448945760727, -0.0145912766456604, -0.013092105276882648, -0.011592932976782322, -0.01009376160800457, -0.008594589307904243, -0.007095417007803917, -0.005596245639026165, -0.0040970733389258385, -0.0025979015044867992, -0.0010987294372171164, 0.00040044263005256653, 0.0018996144644916058, 0.003398786298930645, 0.0048979585990309715, 0.0063971299678087234, 0.00789630226790905, 0.009395474568009377, 0.010894645936787128, 0.012393818236887455, 0.013892989605665207, 0.015392161905765533, 0.01689133420586586, 0.018390506505966187, 0.019889678806066513, 0.02138885110616684, 0.022888023406267166, 0.024387195706367493, 0.02588636614382267, 0.027385538443922997, 0.028884710744023323, 0.0303838811814785, 0.03188305348157883]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 6.0, 12.0, 7.0, 16.0, 13.0, 29.0, 23.0, 14.0, 27.0, 28.0, 23.0, 33.0, 34.0, 49.0, 25.0, 42.0, 44.0, 39.0, 31.0, 42.0, 38.0, 39.0, 35.0, 34.0, 43.0, 22.0, 22.0, 35.0, 27.0, 22.0, 26.0, 19.0, 13.0, 12.0, 10.0, 11.0, 9.0, 4.0, 8.0, 1.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.018437504768371582, -0.017930898815393448, -0.017424290999770164, -0.01691768318414688, -0.016411077231168747, -0.015904471278190613, -0.01539786346256733, -0.01489125657826662, -0.014384649693965912, -0.013878042809665203, -0.013371435925364494, -0.012864829041063786, -0.012358222156763077, -0.011851615272462368, -0.01134500838816166, -0.01083840150386095, -0.010331794619560242, -0.009825187735259533, -0.009318580850958824, -0.008811973966658115, -0.008305367082357407, -0.007798760198056698, -0.007292153313755989, -0.00678554642945528, -0.0062789395451545715, -0.005772332660853863, -0.005265725776553154, -0.004759118892252445, -0.0042525120079517365, -0.0037459051236510277, -0.003239298239350319, -0.00273269135504961, -0.0022260844707489014, -0.0017194775864481926, -0.0012128707021474838, -0.0007062638178467751, -0.00019965693354606628, 0.0003069499507546425, 0.0008135568350553513, 0.00132016371935606, 0.0018267706036567688, 0.0023333774879574776, 0.0028399843722581863, 0.003346591256558895, 0.003853198140859604, 0.004359805025160313, 0.004866411909461021, 0.00537301879376173, 0.005879625678062439, 0.006386232562363148, 0.0068928394466638565, 0.007399446330964565, 0.007906053215265274, 0.008412660099565983, 0.008919266983866692, 0.0094258738681674, 0.009932480752468109, 0.010439087636768818, 0.010945694521069527, 0.011452301405370235, 0.011958908289670944, 0.012465515173971653, 0.012972122058272362, 0.01347872894257307, 0.01398533582687378]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 5.0, 7.0, 5.0, 5.0, 10.0, 8.0, 14.0, 23.0, 18.0, 30.0, 59.0, 80.0, 95.0, 150.0, 226.0, 328.0, 578.0, 954.0, 1741.0, 4255.0, 13908.0, 65642.0, 374367.0, 466252.0, 91588.0, 17872.0, 5356.0, 2108.0, 1091.0, 659.0, 382.0, 222.0, 160.0, 108.0, 77.0, 56.0, 34.0, 18.0, 22.0, 13.0, 5.0, 8.0, 7.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05828857421875, -0.056351661682128906, -0.05441474914550781, -0.05247783660888672, -0.050540924072265625, -0.04860401153564453, -0.04666709899902344, -0.044730186462402344, -0.04279327392578125, -0.040856361389160156, -0.03891944885253906, -0.03698253631591797, -0.035045623779296875, -0.03310871124267578, -0.031171798706054688, -0.029234886169433594, -0.0272979736328125, -0.025361061096191406, -0.023424148559570312, -0.02148723602294922, -0.019550323486328125, -0.01761341094970703, -0.015676498413085938, -0.013739585876464844, -0.01180267333984375, -0.009865760803222656, -0.007928848266601562, -0.005991935729980469, -0.004055023193359375, -0.0021181106567382812, -0.0001811981201171875, 0.0017557144165039062, 0.003692626953125, 0.005629539489746094, 0.0075664520263671875, 0.009503364562988281, 0.011440277099609375, 0.013377189636230469, 0.015314102172851562, 0.017251014709472656, 0.01918792724609375, 0.021124839782714844, 0.023061752319335938, 0.02499866485595703, 0.026935577392578125, 0.02887248992919922, 0.030809402465820312, 0.032746315002441406, 0.0346832275390625, 0.036620140075683594, 0.03855705261230469, 0.04049396514892578, 0.042430877685546875, 0.04436779022216797, 0.04630470275878906, 0.048241615295410156, 0.05017852783203125, 0.052115440368652344, 0.05405235290527344, 0.05598926544189453, 0.057926177978515625, 0.05986309051513672, 0.06180000305175781, 0.0637369155883789, 0.065673828125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 9.0, 8.0, 6.0, 13.0, 12.0, 16.0, 29.0, 31.0, 22.0, 27.0, 40.0, 49.0, 46.0, 39.0, 46.0, 54.0, 45.0, 51.0, 45.0, 35.0, 37.0, 37.0, 49.0, 34.0, 35.0, 37.0, 17.0, 16.0, 17.0, 12.0, 12.0, 11.0, 10.0, 6.0, 10.0, 3.0, 4.0, 3.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.017822265625, -0.017215967178344727, -0.016609668731689453, -0.01600337028503418, -0.015397071838378906, -0.014790773391723633, -0.01418447494506836, -0.013578176498413086, -0.012971878051757812, -0.012365579605102539, -0.011759281158447266, -0.011152982711791992, -0.010546684265136719, -0.009940385818481445, -0.009334087371826172, -0.008727788925170898, -0.008121490478515625, -0.0075151920318603516, -0.006908893585205078, -0.006302595138549805, -0.005696296691894531, -0.005089998245239258, -0.004483699798583984, -0.003877401351928711, -0.0032711029052734375, -0.002664804458618164, -0.0020585060119628906, -0.0014522075653076172, -0.0008459091186523438, -0.0002396106719970703, 0.0003666877746582031, 0.0009729862213134766, 0.00157928466796875, 0.0021855831146240234, 0.002791881561279297, 0.0033981800079345703, 0.004004478454589844, 0.004610776901245117, 0.005217075347900391, 0.005823373794555664, 0.0064296722412109375, 0.007035970687866211, 0.007642269134521484, 0.008248567581176758, 0.008854866027832031, 0.009461164474487305, 0.010067462921142578, 0.010673761367797852, 0.011280059814453125, 0.011886358261108398, 0.012492656707763672, 0.013098955154418945, 0.013705253601074219, 0.014311552047729492, 0.014917850494384766, 0.015524148941040039, 0.016130447387695312, 0.016736745834350586, 0.01734304428100586, 0.017949342727661133, 0.018555641174316406, 0.01916193962097168, 0.019768238067626953, 0.020374536514282227, 0.0209808349609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 8.0, 11.0, 4.0, 11.0, 11.0, 17.0, 15.0, 26.0, 33.0, 51.0, 56.0, 82.0, 133.0, 224.0, 462.0, 969.0, 2484.0, 8856.0, 49360.0, 441958.0, 476996.0, 52696.0, 9374.0, 2603.0, 912.0, 477.0, 247.0, 133.0, 86.0, 60.0, 40.0, 36.0, 26.0, 23.0, 16.0, 11.0, 12.0, 9.0, 4.0, 7.0, 3.0, 4.0, 6.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0567626953125, -0.054932594299316406, -0.05310249328613281, -0.05127239227294922, -0.049442291259765625, -0.04761219024658203, -0.04578208923339844, -0.043951988220214844, -0.04212188720703125, -0.040291786193847656, -0.03846168518066406, -0.03663158416748047, -0.034801483154296875, -0.03297138214111328, -0.031141281127929688, -0.029311180114746094, -0.0274810791015625, -0.025650978088378906, -0.023820877075195312, -0.02199077606201172, -0.020160675048828125, -0.01833057403564453, -0.016500473022460938, -0.014670372009277344, -0.01284027099609375, -0.011010169982910156, -0.009180068969726562, -0.007349967956542969, -0.005519866943359375, -0.0036897659301757812, -0.0018596649169921875, -2.956390380859375e-05, 0.001800537109375, 0.0036306381225585938, 0.0054607391357421875, 0.007290840148925781, 0.009120941162109375, 0.010951042175292969, 0.012781143188476562, 0.014611244201660156, 0.01644134521484375, 0.018271446228027344, 0.020101547241210938, 0.02193164825439453, 0.023761749267578125, 0.02559185028076172, 0.027421951293945312, 0.029252052307128906, 0.0310821533203125, 0.032912254333496094, 0.03474235534667969, 0.03657245635986328, 0.038402557373046875, 0.04023265838623047, 0.04206275939941406, 0.043892860412597656, 0.04572296142578125, 0.047553062438964844, 0.04938316345214844, 0.05121326446533203, 0.053043365478515625, 0.05487346649169922, 0.05670356750488281, 0.058533668518066406, 0.06036376953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 9.0, 14.0, 12.0, 12.0, 15.0, 8.0, 13.0, 16.0, 27.0, 22.0, 36.0, 34.0, 35.0, 33.0, 26.0, 44.0, 29.0, 41.0, 34.0, 31.0, 39.0, 30.0, 33.0, 28.0, 44.0, 36.0, 35.0, 33.0, 33.0, 28.0, 25.0, 27.0, 14.0, 11.0, 18.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 4.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.063232421875, -0.06129121780395508, -0.059350013732910156, -0.057408809661865234, -0.05546760559082031, -0.05352640151977539, -0.05158519744873047, -0.04964399337768555, -0.047702789306640625, -0.0457615852355957, -0.04382038116455078, -0.04187917709350586, -0.03993797302246094, -0.037996768951416016, -0.036055564880371094, -0.03411436080932617, -0.03217315673828125, -0.030231952667236328, -0.028290748596191406, -0.026349544525146484, -0.024408340454101562, -0.02246713638305664, -0.02052593231201172, -0.018584728240966797, -0.016643524169921875, -0.014702320098876953, -0.012761116027832031, -0.01081991195678711, -0.008878707885742188, -0.006937503814697266, -0.004996299743652344, -0.003055095672607422, -0.0011138916015625, 0.0008273124694824219, 0.0027685165405273438, 0.004709720611572266, 0.0066509246826171875, 0.00859212875366211, 0.010533332824707031, 0.012474536895751953, 0.014415740966796875, 0.016356945037841797, 0.01829814910888672, 0.02023935317993164, 0.022180557250976562, 0.024121761322021484, 0.026062965393066406, 0.028004169464111328, 0.02994537353515625, 0.03188657760620117, 0.033827781677246094, 0.035768985748291016, 0.03771018981933594, 0.03965139389038086, 0.04159259796142578, 0.0435338020324707, 0.045475006103515625, 0.04741621017456055, 0.04935741424560547, 0.05129861831665039, 0.05323982238769531, 0.055181026458740234, 0.057122230529785156, 0.05906343460083008, 0.061004638671875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 26.0, 22.0, 42.0, 110.0, 153.0, 338.0, 678.0, 1682.0, 4623.0, 17977.0, 124415.0, 733372.0, 137928.0, 19099.0, 4888.0, 1738.0, 706.0, 320.0, 160.0, 74.0, 56.0, 29.0, 25.0, 17.0, 13.0, 11.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022857666015625, -0.022154808044433594, -0.021451950073242188, -0.02074909210205078, -0.020046234130859375, -0.01934337615966797, -0.018640518188476562, -0.017937660217285156, -0.01723480224609375, -0.016531944274902344, -0.015829086303710938, -0.015126228332519531, -0.014423370361328125, -0.013720512390136719, -0.013017654418945312, -0.012314796447753906, -0.0116119384765625, -0.010909080505371094, -0.010206222534179688, -0.009503364562988281, -0.008800506591796875, -0.008097648620605469, -0.0073947906494140625, -0.006691932678222656, -0.00598907470703125, -0.005286216735839844, -0.0045833587646484375, -0.0038805007934570312, -0.003177642822265625, -0.0024747848510742188, -0.0017719268798828125, -0.0010690689086914062, -0.0003662109375, 0.00033664703369140625, 0.0010395050048828125, 0.0017423629760742188, 0.002445220947265625, 0.0031480789184570312, 0.0038509368896484375, 0.004553794860839844, 0.00525665283203125, 0.005959510803222656, 0.0066623687744140625, 0.007365226745605469, 0.008068084716796875, 0.008770942687988281, 0.009473800659179688, 0.010176658630371094, 0.0108795166015625, 0.011582374572753906, 0.012285232543945312, 0.012988090515136719, 0.013690948486328125, 0.014393806457519531, 0.015096664428710938, 0.015799522399902344, 0.01650238037109375, 0.017205238342285156, 0.017908096313476562, 0.01861095428466797, 0.019313812255859375, 0.02001667022705078, 0.020719528198242188, 0.021422386169433594, 0.022125244140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 11.0, 3.0, 8.0, 10.0, 16.0, 17.0, 26.0, 33.0, 39.0, 59.0, 53.0, 62.0, 67.0, 101.0, 68.0, 56.0, 76.0, 63.0, 47.0, 48.0, 29.0, 25.0, 21.0, 13.0, 8.0, 11.0, 5.0, 5.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.359070539474487e-06, -6.161630153656006e-06, -5.964189767837524e-06, -5.766749382019043e-06, -5.5693089962005615e-06, -5.37186861038208e-06, -5.174428224563599e-06, -4.976987838745117e-06, -4.779547452926636e-06, -4.582107067108154e-06, -4.384666681289673e-06, -4.187226295471191e-06, -3.98978590965271e-06, -3.7923455238342285e-06, -3.594905138015747e-06, -3.3974647521972656e-06, -3.200024366378784e-06, -3.0025839805603027e-06, -2.8051435947418213e-06, -2.60770320892334e-06, -2.4102628231048584e-06, -2.212822437286377e-06, -2.0153820514678955e-06, -1.817941665649414e-06, -1.6205012798309326e-06, -1.4230608940124512e-06, -1.2256205081939697e-06, -1.0281801223754883e-06, -8.307397365570068e-07, -6.332993507385254e-07, -4.3585896492004395e-07, -2.384185791015625e-07, -4.0978193283081055e-08, 1.564621925354004e-07, 3.5390257835388184e-07, 5.513429641723633e-07, 7.487833499908447e-07, 9.462237358093262e-07, 1.1436641216278076e-06, 1.341104507446289e-06, 1.5385448932647705e-06, 1.735985279083252e-06, 1.9334256649017334e-06, 2.130866050720215e-06, 2.3283064365386963e-06, 2.5257468223571777e-06, 2.723187208175659e-06, 2.9206275939941406e-06, 3.118067979812622e-06, 3.3155083656311035e-06, 3.512948751449585e-06, 3.7103891372680664e-06, 3.907829523086548e-06, 4.105269908905029e-06, 4.302710294723511e-06, 4.500150680541992e-06, 4.697591066360474e-06, 4.895031452178955e-06, 5.0924718379974365e-06, 5.289912223815918e-06, 5.487352609634399e-06, 5.684792995452881e-06, 5.882233381271362e-06, 6.079673767089844e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 19.0, 13.0, 33.0, 51.0, 83.0, 151.0, 341.0, 863.0, 2531.0, 10553.0, 90668.0, 813674.0, 113496.0, 11739.0, 2645.0, 890.0, 375.0, 163.0, 85.0, 63.0, 32.0, 17.0, 13.0, 13.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03997802734375, -0.03891301155090332, -0.03784799575805664, -0.03678297996520996, -0.03571796417236328, -0.0346529483795166, -0.03358793258666992, -0.03252291679382324, -0.03145790100097656, -0.030392885208129883, -0.029327869415283203, -0.028262853622436523, -0.027197837829589844, -0.026132822036743164, -0.025067806243896484, -0.024002790451049805, -0.022937774658203125, -0.021872758865356445, -0.020807743072509766, -0.019742727279663086, -0.018677711486816406, -0.017612695693969727, -0.016547679901123047, -0.015482664108276367, -0.014417648315429688, -0.013352632522583008, -0.012287616729736328, -0.011222600936889648, -0.010157585144042969, -0.009092569351196289, -0.00802755355834961, -0.00696253776550293, -0.00589752197265625, -0.00483250617980957, -0.0037674903869628906, -0.002702474594116211, -0.0016374588012695312, -0.0005724430084228516, 0.0004925727844238281, 0.0015575885772705078, 0.0026226043701171875, 0.003687620162963867, 0.004752635955810547, 0.0058176517486572266, 0.006882667541503906, 0.007947683334350586, 0.009012699127197266, 0.010077714920043945, 0.011142730712890625, 0.012207746505737305, 0.013272762298583984, 0.014337778091430664, 0.015402793884277344, 0.016467809677124023, 0.017532825469970703, 0.018597841262817383, 0.019662857055664062, 0.020727872848510742, 0.021792888641357422, 0.0228579044342041, 0.02392292022705078, 0.02498793601989746, 0.02605295181274414, 0.02711796760559082, 0.0281829833984375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 4.0, 9.0, 17.0, 28.0, 38.0, 59.0, 73.0, 76.0, 114.0, 130.0, 101.0, 95.0, 72.0, 55.0, 46.0, 27.0, 9.0, 16.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02691650390625, -0.026062965393066406, -0.025209426879882812, -0.02435588836669922, -0.023502349853515625, -0.02264881134033203, -0.021795272827148438, -0.020941734313964844, -0.02008819580078125, -0.019234657287597656, -0.018381118774414062, -0.01752758026123047, -0.016674041748046875, -0.01582050323486328, -0.014966964721679688, -0.014113426208496094, -0.0132598876953125, -0.012406349182128906, -0.011552810668945312, -0.010699272155761719, -0.009845733642578125, -0.008992195129394531, -0.008138656616210938, -0.007285118103027344, -0.00643157958984375, -0.005578041076660156, -0.0047245025634765625, -0.0038709640502929688, -0.003017425537109375, -0.0021638870239257812, -0.0013103485107421875, -0.00045680999755859375, 0.000396728515625, 0.0012502670288085938, 0.0021038055419921875, 0.0029573440551757812, 0.003810882568359375, 0.004664421081542969, 0.0055179595947265625, 0.006371498107910156, 0.00722503662109375, 0.008078575134277344, 0.008932113647460938, 0.009785652160644531, 0.010639190673828125, 0.011492729187011719, 0.012346267700195312, 0.013199806213378906, 0.0140533447265625, 0.014906883239746094, 0.015760421752929688, 0.01661396026611328, 0.017467498779296875, 0.01832103729248047, 0.019174575805664062, 0.020028114318847656, 0.02088165283203125, 0.021735191345214844, 0.022588729858398438, 0.02344226837158203, 0.024295806884765625, 0.02514934539794922, 0.026002883911132812, 0.026856422424316406, 0.0277099609375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [3.0, 8.0, 7.0, 25.0, 76.0, 219.0, 334.0, 215.0, 86.0, 31.0, 8.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18634408712387085, -0.157488614320755, -0.12863312661647797, -0.09977764636278152, -0.07092216610908508, -0.04206669330596924, -0.0132112056016922, 0.01564428210258484, 0.044499754905700684, 0.07335523515939713, 0.10221071541309357, 0.1310662031173706, 0.15992167592048645, 0.1887771487236023, 0.21763263642787933, 0.24648812413215637, 0.2753435969352722, 0.30419906973838806, 0.3330545425415039, 0.36191004514694214, 0.390765517950058, 0.41962099075317383, 0.44847649335861206, 0.4773319661617279, 0.5061874389648438, 0.535042941570282, 0.5638983845710754, 0.5927538871765137, 0.6216093301773071, 0.6504648327827454, 0.6793203353881836, 0.708175778388977, 0.7370312213897705, 0.7658867239952087, 0.7947421669960022, 0.8235976696014404, 0.8524531126022339, 0.8813086152076721, 0.9101641178131104, 0.9390195608139038, 0.967875063419342, 0.9967305660247803, 1.0255860090255737, 1.0544414520263672, 1.0832970142364502, 1.1121524572372437, 1.141007900238037, 1.1698634624481201, 1.1987189054489136, 1.227574348449707, 1.25642991065979, 1.2852853536605835, 1.314140796661377, 1.34299635887146, 1.3718518018722534, 1.4007072448730469, 1.4295628070831299, 1.4584182500839233, 1.4872738122940063, 1.5161292552947998, 1.5449846982955933, 1.5738401412963867, 1.6026957035064697, 1.6315511465072632, 1.6604065895080566]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 9.0, 12.0, 8.0, 5.0, 10.0, 4.0, 17.0, 16.0, 21.0, 17.0, 21.0, 26.0, 42.0, 41.0, 43.0, 51.0, 57.0, 57.0, 42.0, 47.0, 54.0, 51.0, 48.0, 44.0, 34.0, 29.0, 31.0, 27.0, 26.0, 20.0, 16.0, 11.0, 11.0, 17.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3653542995452881, -0.3539857864379883, -0.3426172733306885, -0.33124876022338867, -0.31988024711608887, -0.30851173400878906, -0.29714322090148926, -0.28577470779418945, -0.27440619468688965, -0.26303768157958984, -0.25166916847229004, -0.24030065536499023, -0.22893214225769043, -0.21756362915039062, -0.20619510114192963, -0.19482658803462982, -0.18345806002616882, -0.17208954691886902, -0.1607210338115692, -0.1493525207042694, -0.1379840075969696, -0.1266154944896698, -0.1152469664812088, -0.103878453373909, -0.09250994026660919, -0.08114142715930939, -0.06977291405200958, -0.05840439349412918, -0.047035880386829376, -0.03566736727952957, -0.02429884672164917, -0.012930333614349365, -0.0015618205070495605, 0.009806694462895393, 0.021175209432840347, 0.03254372626543045, 0.043912239372730255, 0.05528075248003006, 0.06664927303791046, 0.07801778614521027, 0.08938629925251007, 0.10075481235980988, 0.11212332546710968, 0.12349184602499008, 0.13486036658287048, 0.1462288796901703, 0.1575973927974701, 0.1689659059047699, 0.1803344190120697, 0.1917029321193695, 0.2030714452266693, 0.21443995833396912, 0.22580847144126892, 0.23717698454856873, 0.24854551255702972, 0.2599140405654907, 0.2712825536727905, 0.28265106678009033, 0.29401957988739014, 0.30538809299468994, 0.31675660610198975, 0.32812511920928955, 0.33949363231658936, 0.35086214542388916, 0.36223065853118896]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 8.0, 24.0, 33.0, 68.0, 90.0, 171.0, 434.0, 1901.0, 4061998.0, 127414.0, 1412.0, 373.0, 142.0, 91.0, 54.0, 25.0, 15.0, 13.0, 11.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30322265625, -0.295989990234375, -0.28875732421875, -0.281524658203125, -0.2742919921875, -0.267059326171875, -0.25982666015625, -0.252593994140625, -0.245361328125, -0.238128662109375, -0.23089599609375, -0.223663330078125, -0.2164306640625, -0.209197998046875, -0.20196533203125, -0.194732666015625, -0.1875, -0.180267333984375, -0.17303466796875, -0.165802001953125, -0.1585693359375, -0.151336669921875, -0.14410400390625, -0.136871337890625, -0.129638671875, -0.122406005859375, -0.11517333984375, -0.107940673828125, -0.1007080078125, -0.093475341796875, -0.08624267578125, -0.079010009765625, -0.07177734375, -0.064544677734375, -0.05731201171875, -0.050079345703125, -0.0428466796875, -0.035614013671875, -0.02838134765625, -0.021148681640625, -0.013916015625, -0.006683349609375, 0.00054931640625, 0.007781982421875, 0.0150146484375, 0.022247314453125, 0.02947998046875, 0.036712646484375, 0.0439453125, 0.051177978515625, 0.05841064453125, 0.065643310546875, 0.0728759765625, 0.080108642578125, 0.08734130859375, 0.094573974609375, 0.101806640625, 0.109039306640625, 0.11627197265625, 0.123504638671875, 0.1307373046875, 0.137969970703125, 0.14520263671875, 0.152435302734375, 0.15966796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 13.0, 13.0, 25.0, 22.0, 12.0, 30.0, 31.0, 32.0, 52.0, 48.0, 38.0, 38.0, 54.0, 62.0, 65.0, 40.0, 45.0, 43.0, 42.0, 46.0, 34.0, 28.0, 42.0, 29.0, 18.0, 15.0, 13.0, 11.0, 6.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01953125, -0.01890277862548828, -0.018274307250976562, -0.017645835876464844, -0.017017364501953125, -0.016388893127441406, -0.015760421752929688, -0.015131950378417969, -0.01450347900390625, -0.013875007629394531, -0.013246536254882812, -0.012618064880371094, -0.011989593505859375, -0.011361122131347656, -0.010732650756835938, -0.010104179382324219, -0.0094757080078125, -0.008847236633300781, -0.008218765258789062, -0.007590293884277344, -0.006961822509765625, -0.006333351135253906, -0.0057048797607421875, -0.005076408386230469, -0.00444793701171875, -0.0038194656372070312, -0.0031909942626953125, -0.0025625228881835938, -0.001934051513671875, -0.0013055801391601562, -0.0006771087646484375, -4.863739013671875e-05, 0.000579833984375, 0.0012083053588867188, 0.0018367767333984375, 0.0024652481079101562, 0.003093719482421875, 0.0037221908569335938, 0.0043506622314453125, 0.004979133605957031, 0.00560760498046875, 0.006236076354980469, 0.0068645477294921875, 0.007493019104003906, 0.008121490478515625, 0.008749961853027344, 0.009378433227539062, 0.010006904602050781, 0.0106353759765625, 0.011263847351074219, 0.011892318725585938, 0.012520790100097656, 0.013149261474609375, 0.013777732849121094, 0.014406204223632812, 0.015034675598144531, 0.01566314697265625, 0.01629161834716797, 0.016920089721679688, 0.017548561096191406, 0.018177032470703125, 0.018805503845214844, 0.019433975219726562, 0.02006244659423828, 0.02069091796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 10.0, 10.0, 19.0, 24.0, 39.0, 58.0, 84.0, 127.0, 213.0, 294.0, 536.0, 932.0, 2118.0, 6409.0, 37392.0, 4036908.0, 93550.0, 9878.0, 2851.0, 1153.0, 647.0, 338.0, 203.0, 162.0, 85.0, 57.0, 48.0, 31.0, 22.0, 19.0, 14.0, 8.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05963134765625, -0.05747509002685547, -0.05531883239746094, -0.053162574768066406, -0.051006317138671875, -0.048850059509277344, -0.04669380187988281, -0.04453754425048828, -0.04238128662109375, -0.04022502899169922, -0.03806877136230469, -0.035912513732910156, -0.033756256103515625, -0.031599998474121094, -0.029443740844726562, -0.02728748321533203, -0.0251312255859375, -0.02297496795654297, -0.020818710327148438, -0.018662452697753906, -0.016506195068359375, -0.014349937438964844, -0.012193679809570312, -0.010037422180175781, -0.00788116455078125, -0.005724906921386719, -0.0035686492919921875, -0.0014123916625976562, 0.000743865966796875, 0.0029001235961914062, 0.0050563812255859375, 0.007212638854980469, 0.009368896484375, 0.011525154113769531, 0.013681411743164062, 0.015837669372558594, 0.017993927001953125, 0.020150184631347656, 0.022306442260742188, 0.02446269989013672, 0.02661895751953125, 0.02877521514892578, 0.030931472778320312, 0.033087730407714844, 0.035243988037109375, 0.037400245666503906, 0.03955650329589844, 0.04171276092529297, 0.0438690185546875, 0.04602527618408203, 0.04818153381347656, 0.050337791442871094, 0.052494049072265625, 0.054650306701660156, 0.05680656433105469, 0.05896282196044922, 0.06111907958984375, 0.06327533721923828, 0.06543159484863281, 0.06758785247802734, 0.06974411010742188, 0.0719003677368164, 0.07405662536621094, 0.07621288299560547, 0.078369140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 4.0, 6.0, 7.0, 15.0, 23.0, 56.0, 127.0, 3007.0, 640.0, 93.0, 46.0, 21.0, 12.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0236053466796875, -0.02269434928894043, -0.02178335189819336, -0.02087235450744629, -0.01996135711669922, -0.01905035972595215, -0.018139362335205078, -0.017228364944458008, -0.016317367553710938, -0.015406370162963867, -0.014495372772216797, -0.013584375381469727, -0.012673377990722656, -0.011762380599975586, -0.010851383209228516, -0.009940385818481445, -0.009029388427734375, -0.008118391036987305, -0.007207393646240234, -0.006296396255493164, -0.005385398864746094, -0.0044744014739990234, -0.003563404083251953, -0.002652406692504883, -0.0017414093017578125, -0.0008304119110107422, 8.058547973632812e-05, 0.0009915828704833984, 0.0019025802612304688, 0.002813577651977539, 0.0037245750427246094, 0.00463557243347168, 0.00554656982421875, 0.00645756721496582, 0.007368564605712891, 0.008279561996459961, 0.009190559387207031, 0.010101556777954102, 0.011012554168701172, 0.011923551559448242, 0.012834548950195312, 0.013745546340942383, 0.014656543731689453, 0.015567541122436523, 0.016478538513183594, 0.017389535903930664, 0.018300533294677734, 0.019211530685424805, 0.020122528076171875, 0.021033525466918945, 0.021944522857666016, 0.022855520248413086, 0.023766517639160156, 0.024677515029907227, 0.025588512420654297, 0.026499509811401367, 0.027410507202148438, 0.028321504592895508, 0.029232501983642578, 0.03014349937438965, 0.03105449676513672, 0.03196549415588379, 0.03287649154663086, 0.03378748893737793, 0.034698486328125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 9.0, 27.0, 50.0, 106.0, 204.0, 255.0, 191.0, 89.0, 34.0, 19.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25620049238204956, -0.25081244111061096, -0.24542438983917236, -0.24003635346889496, -0.23464830219745636, -0.22926025092601776, -0.22387221455574036, -0.21848416328430176, -0.21309611201286316, -0.20770806074142456, -0.20232000946998596, -0.19693197309970856, -0.19154392182826996, -0.18615587055683136, -0.18076783418655396, -0.17537978291511536, -0.16999173164367676, -0.16460368037223816, -0.15921562910079956, -0.15382759273052216, -0.14843954145908356, -0.14305149018764496, -0.13766345381736755, -0.13227540254592896, -0.12688735127449036, -0.12149930000305176, -0.11611125618219376, -0.11072321236133575, -0.10533516108989716, -0.09994710981845856, -0.09455906599760056, -0.08917102217674255, -0.08378295600414276, -0.07839490473270416, -0.07300686091184616, -0.06761881709098816, -0.06223076581954956, -0.05684271827340126, -0.05145467072725296, -0.04606662318110466, -0.04067857563495636, -0.03529052808880806, -0.02990248054265976, -0.02451443299651146, -0.01912638545036316, -0.013738337904214859, -0.008350290358066559, -0.0029622428119182587, 0.0024258047342300415, 0.007813852280378342, 0.013201899826526642, 0.018589947372674942, 0.023977994918823242, 0.029366042464971542, 0.03475409001111984, 0.04014213755726814, 0.04553018510341644, 0.05091823264956474, 0.05630628019571304, 0.06169432774186134, 0.06708237528800964, 0.07247042655944824, 0.07785847038030624, 0.08324651420116425, 0.08863456547260284]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 1.0, 9.0, 7.0, 11.0, 17.0, 23.0, 13.0, 26.0, 22.0, 33.0, 43.0, 49.0, 53.0, 40.0, 51.0, 54.0, 70.0, 54.0, 59.0, 34.0, 57.0, 47.0, 36.0, 31.0, 29.0, 23.0, 26.0, 18.0, 12.0, 14.0, 9.0, 10.0, 4.0, 7.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.057099342346191406, -0.055458031594753265, -0.053816720843315125, -0.052175406366586685, -0.050534095615148544, -0.0488927848637104, -0.047251470386981964, -0.04561015963554382, -0.04396884888410568, -0.04232753813266754, -0.0406862273812294, -0.03904491290450096, -0.03740360215306282, -0.03576229140162468, -0.03412097692489624, -0.0324796661734581, -0.03083835542201996, -0.029197044670581818, -0.027555732056498528, -0.025914419442415237, -0.024273108690977097, -0.022631797939538956, -0.020990485325455666, -0.019349172711372375, -0.017707861959934235, -0.016066551208496094, -0.014425238594412804, -0.012783926911652088, -0.011142615228891373, -0.009501303546130657, -0.007859991863369942, -0.006218680180609226, -0.004577368497848511, -0.0029360568150877953, -0.0012947451323270798, 0.0003465665504336357, 0.001987878233194351, 0.0036291899159550667, 0.005270501598715782, 0.006911813281476498, 0.008553124964237213, 0.010194436646997929, 0.011835748329758644, 0.01347706001251936, 0.015118371695280075, 0.016759682446718216, 0.018400995060801506, 0.020042307674884796, 0.021683618426322937, 0.023324929177761078, 0.024966241791844368, 0.026607554405927658, 0.0282488651573658, 0.02989017590880394, 0.03153149038553238, 0.03317280113697052, 0.03481411188840866, 0.0364554226398468, 0.03809673339128494, 0.03973804786801338, 0.04137935861945152, 0.043020669370889664, 0.0446619838476181, 0.046303294599056244, 0.047944605350494385]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 17.0, 20.0, 43.0, 53.0, 92.0, 124.0, 236.0, 436.0, 756.0, 1528.0, 3179.0, 7297.0, 19659.0, 64408.0, 246237.0, 447948.0, 182363.0, 47260.0, 15238.0, 5960.0, 2727.0, 1333.0, 710.0, 375.0, 206.0, 130.0, 73.0, 49.0, 20.0, 20.0, 13.0, 11.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03228759765625, -0.030963420867919922, -0.029639244079589844, -0.028315067291259766, -0.026990890502929688, -0.02566671371459961, -0.02434253692626953, -0.023018360137939453, -0.021694183349609375, -0.020370006561279297, -0.01904582977294922, -0.01772165298461914, -0.016397476196289062, -0.015073299407958984, -0.013749122619628906, -0.012424945831298828, -0.01110076904296875, -0.009776592254638672, -0.008452415466308594, -0.007128238677978516, -0.0058040618896484375, -0.004479885101318359, -0.0031557083129882812, -0.0018315315246582031, -0.000507354736328125, 0.0008168220520019531, 0.0021409988403320312, 0.0034651756286621094, 0.0047893524169921875, 0.006113529205322266, 0.007437705993652344, 0.008761882781982422, 0.0100860595703125, 0.011410236358642578, 0.012734413146972656, 0.014058589935302734, 0.015382766723632812, 0.01670694351196289, 0.01803112030029297, 0.019355297088623047, 0.020679473876953125, 0.022003650665283203, 0.02332782745361328, 0.02465200424194336, 0.025976181030273438, 0.027300357818603516, 0.028624534606933594, 0.029948711395263672, 0.03127288818359375, 0.03259706497192383, 0.033921241760253906, 0.035245418548583984, 0.03656959533691406, 0.03789377212524414, 0.03921794891357422, 0.0405421257019043, 0.041866302490234375, 0.04319047927856445, 0.04451465606689453, 0.04583883285522461, 0.04716300964355469, 0.048487186431884766, 0.049811363220214844, 0.05113554000854492, 0.052459716796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 10.0, 7.0, 7.0, 14.0, 10.0, 19.0, 22.0, 37.0, 23.0, 30.0, 39.0, 52.0, 42.0, 48.0, 60.0, 61.0, 57.0, 68.0, 44.0, 50.0, 40.0, 51.0, 36.0, 30.0, 29.0, 24.0, 22.0, 16.0, 13.0, 9.0, 5.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.023834228515625, -0.023119688034057617, -0.022405147552490234, -0.02169060707092285, -0.02097606658935547, -0.020261526107788086, -0.019546985626220703, -0.01883244514465332, -0.018117904663085938, -0.017403364181518555, -0.016688823699951172, -0.01597428321838379, -0.015259742736816406, -0.014545202255249023, -0.01383066177368164, -0.013116121292114258, -0.012401580810546875, -0.011687040328979492, -0.01097249984741211, -0.010257959365844727, -0.009543418884277344, -0.008828878402709961, -0.008114337921142578, -0.007399797439575195, -0.0066852569580078125, -0.00597071647644043, -0.005256175994873047, -0.004541635513305664, -0.0038270950317382812, -0.0031125545501708984, -0.0023980140686035156, -0.0016834735870361328, -0.00096893310546875, -0.0002543926239013672, 0.0004601478576660156, 0.0011746883392333984, 0.0018892288208007812, 0.002603769302368164, 0.003318309783935547, 0.00403285026550293, 0.0047473907470703125, 0.005461931228637695, 0.006176471710205078, 0.006891012191772461, 0.007605552673339844, 0.008320093154907227, 0.00903463363647461, 0.009749174118041992, 0.010463714599609375, 0.011178255081176758, 0.01189279556274414, 0.012607336044311523, 0.013321876525878906, 0.014036417007446289, 0.014750957489013672, 0.015465497970581055, 0.016180038452148438, 0.01689457893371582, 0.017609119415283203, 0.018323659896850586, 0.01903820037841797, 0.01975274085998535, 0.020467281341552734, 0.021181821823120117, 0.0218963623046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 12.0, 13.0, 26.0, 27.0, 37.0, 49.0, 75.0, 81.0, 162.0, 320.0, 536.0, 1201.0, 3127.0, 10186.0, 48173.0, 455525.0, 463825.0, 49127.0, 10198.0, 3195.0, 1280.0, 547.0, 280.0, 170.0, 99.0, 66.0, 45.0, 38.0, 32.0, 18.0, 19.0, 9.0, 7.0, 13.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.05047607421875, -0.04867362976074219, -0.046871185302734375, -0.04506874084472656, -0.04326629638671875, -0.04146385192871094, -0.039661407470703125, -0.03785896301269531, -0.0360565185546875, -0.03425407409667969, -0.032451629638671875, -0.030649185180664062, -0.02884674072265625, -0.027044296264648438, -0.025241851806640625, -0.023439407348632812, -0.021636962890625, -0.019834518432617188, -0.018032073974609375, -0.016229629516601562, -0.01442718505859375, -0.012624740600585938, -0.010822296142578125, -0.009019851684570312, -0.0072174072265625, -0.0054149627685546875, -0.003612518310546875, -0.0018100738525390625, -7.62939453125e-06, 0.0017948150634765625, 0.003597259521484375, 0.0053997039794921875, 0.0072021484375, 0.009004592895507812, 0.010807037353515625, 0.012609481811523438, 0.01441192626953125, 0.016214370727539062, 0.018016815185546875, 0.019819259643554688, 0.0216217041015625, 0.023424148559570312, 0.025226593017578125, 0.027029037475585938, 0.02883148193359375, 0.030633926391601562, 0.032436370849609375, 0.03423881530761719, 0.036041259765625, 0.03784370422363281, 0.039646148681640625, 0.04144859313964844, 0.04325103759765625, 0.04505348205566406, 0.046855926513671875, 0.04865837097167969, 0.0504608154296875, 0.05226325988769531, 0.054065704345703125, 0.05586814880371094, 0.05767059326171875, 0.05947303771972656, 0.061275482177734375, 0.06307792663574219, 0.06488037109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 4.0, 7.0, 7.0, 10.0, 13.0, 12.0, 15.0, 16.0, 15.0, 19.0, 23.0, 24.0, 29.0, 32.0, 38.0, 30.0, 37.0, 38.0, 37.0, 53.0, 31.0, 51.0, 44.0, 38.0, 31.0, 31.0, 41.0, 33.0, 39.0, 31.0, 33.0, 33.0, 12.0, 18.0, 18.0, 9.0, 9.0, 5.0, 5.0, 2.0, 2.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.06866455078125, -0.06661033630371094, -0.06455612182617188, -0.06250190734863281, -0.06044769287109375, -0.05839347839355469, -0.056339263916015625, -0.05428504943847656, -0.0522308349609375, -0.05017662048339844, -0.048122406005859375, -0.04606819152832031, -0.04401397705078125, -0.04195976257324219, -0.039905548095703125, -0.03785133361816406, -0.035797119140625, -0.03374290466308594, -0.031688690185546875, -0.029634475708007812, -0.02758026123046875, -0.025526046752929688, -0.023471832275390625, -0.021417617797851562, -0.0193634033203125, -0.017309188842773438, -0.015254974365234375, -0.013200759887695312, -0.01114654541015625, -0.009092330932617188, -0.007038116455078125, -0.0049839019775390625, -0.0029296875, -0.0008754730224609375, 0.001178741455078125, 0.0032329559326171875, 0.00528717041015625, 0.0073413848876953125, 0.009395599365234375, 0.011449813842773438, 0.0135040283203125, 0.015558242797851562, 0.017612457275390625, 0.019666671752929688, 0.02172088623046875, 0.023775100708007812, 0.025829315185546875, 0.027883529663085938, 0.029937744140625, 0.03199195861816406, 0.034046173095703125, 0.03610038757324219, 0.03815460205078125, 0.04020881652832031, 0.042263031005859375, 0.04431724548339844, 0.0463714599609375, 0.04842567443847656, 0.050479888916015625, 0.05253410339355469, 0.05458831787109375, 0.05664253234863281, 0.058696746826171875, 0.06075096130371094, 0.06280517578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 3.0, 8.0, 7.0, 22.0, 29.0, 24.0, 38.0, 47.0, 61.0, 134.0, 202.0, 355.0, 672.0, 1365.0, 3278.0, 11031.0, 52064.0, 416520.0, 484794.0, 59090.0, 12080.0, 3605.0, 1379.0, 709.0, 360.0, 237.0, 129.0, 87.0, 55.0, 40.0, 24.0, 19.0, 26.0, 12.0, 8.0, 12.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.016021728515625, -0.015550971031188965, -0.01508021354675293, -0.014609456062316895, -0.01413869857788086, -0.013667941093444824, -0.013197183609008789, -0.012726426124572754, -0.012255668640136719, -0.011784911155700684, -0.011314153671264648, -0.010843396186828613, -0.010372638702392578, -0.009901881217956543, -0.009431123733520508, -0.008960366249084473, -0.008489608764648438, -0.008018851280212402, -0.007548093795776367, -0.007077336311340332, -0.006606578826904297, -0.006135821342468262, -0.0056650638580322266, -0.005194306373596191, -0.004723548889160156, -0.004252791404724121, -0.003782033920288086, -0.0033112764358520508, -0.0028405189514160156, -0.0023697614669799805, -0.0018990039825439453, -0.0014282464981079102, -0.000957489013671875, -0.00048673152923583984, -1.5974044799804688e-05, 0.00045478343963623047, 0.0009255409240722656, 0.0013962984085083008, 0.001867055892944336, 0.002337813377380371, 0.0028085708618164062, 0.0032793283462524414, 0.0037500858306884766, 0.004220843315124512, 0.004691600799560547, 0.005162358283996582, 0.005633115768432617, 0.006103873252868652, 0.0065746307373046875, 0.007045388221740723, 0.007516145706176758, 0.007986903190612793, 0.008457660675048828, 0.008928418159484863, 0.009399175643920898, 0.009869933128356934, 0.010340690612792969, 0.010811448097229004, 0.011282205581665039, 0.011752963066101074, 0.01222372055053711, 0.012694478034973145, 0.01316523551940918, 0.013635993003845215, 0.01410675048828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 10.0, 2.0, 18.0, 12.0, 33.0, 34.0, 38.0, 41.0, 68.0, 76.0, 60.0, 98.0, 61.0, 90.0, 59.0, 70.0, 64.0, 42.0, 35.0, 29.0, 21.0, 11.0, 6.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.291534423828125e-06, -4.079192876815796e-06, -3.866851329803467e-06, -3.6545097827911377e-06, -3.4421682357788086e-06, -3.2298266887664795e-06, -3.0174851417541504e-06, -2.8051435947418213e-06, -2.592802047729492e-06, -2.380460500717163e-06, -2.168118953704834e-06, -1.955777406692505e-06, -1.7434358596801758e-06, -1.5310943126678467e-06, -1.3187527656555176e-06, -1.1064112186431885e-06, -8.940696716308594e-07, -6.817281246185303e-07, -4.6938657760620117e-07, -2.5704503059387207e-07, -4.470348358154297e-08, 1.6763806343078613e-07, 3.7997961044311523e-07, 5.923211574554443e-07, 8.046627044677734e-07, 1.0170042514801025e-06, 1.2293457984924316e-06, 1.4416873455047607e-06, 1.6540288925170898e-06, 1.866370439529419e-06, 2.078711986541748e-06, 2.291053533554077e-06, 2.5033950805664062e-06, 2.7157366275787354e-06, 2.9280781745910645e-06, 3.1404197216033936e-06, 3.3527612686157227e-06, 3.5651028156280518e-06, 3.777444362640381e-06, 3.98978590965271e-06, 4.202127456665039e-06, 4.414469003677368e-06, 4.626810550689697e-06, 4.839152097702026e-06, 5.0514936447143555e-06, 5.2638351917266846e-06, 5.476176738739014e-06, 5.688518285751343e-06, 5.900859832763672e-06, 6.113201379776001e-06, 6.32554292678833e-06, 6.537884473800659e-06, 6.750226020812988e-06, 6.962567567825317e-06, 7.1749091148376465e-06, 7.387250661849976e-06, 7.599592208862305e-06, 7.811933755874634e-06, 8.024275302886963e-06, 8.236616849899292e-06, 8.448958396911621e-06, 8.66129994392395e-06, 8.87364149093628e-06, 9.085983037948608e-06, 9.298324584960938e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 16.0, 23.0, 36.0, 47.0, 69.0, 130.0, 224.0, 499.0, 1390.0, 4668.0, 23318.0, 234597.0, 700776.0, 68251.0, 10278.0, 2554.0, 856.0, 372.0, 170.0, 86.0, 67.0, 38.0, 26.0, 16.0, 12.0, 8.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269927978515625, -0.026287317276000977, -0.025581836700439453, -0.02487635612487793, -0.024170875549316406, -0.023465394973754883, -0.02275991439819336, -0.022054433822631836, -0.021348953247070312, -0.02064347267150879, -0.019937992095947266, -0.019232511520385742, -0.01852703094482422, -0.017821550369262695, -0.017116069793701172, -0.01641058921813965, -0.015705108642578125, -0.014999628067016602, -0.014294147491455078, -0.013588666915893555, -0.012883186340332031, -0.012177705764770508, -0.011472225189208984, -0.010766744613647461, -0.010061264038085938, -0.009355783462524414, -0.00865030288696289, -0.007944822311401367, -0.007239341735839844, -0.00653386116027832, -0.005828380584716797, -0.0051229000091552734, -0.00441741943359375, -0.0037119388580322266, -0.003006458282470703, -0.0023009777069091797, -0.0015954971313476562, -0.0008900165557861328, -0.00018453598022460938, 0.0005209445953369141, 0.0012264251708984375, 0.001931905746459961, 0.0026373863220214844, 0.003342866897583008, 0.004048347473144531, 0.004753828048706055, 0.005459308624267578, 0.0061647891998291016, 0.006870269775390625, 0.0075757503509521484, 0.008281230926513672, 0.008986711502075195, 0.009692192077636719, 0.010397672653198242, 0.011103153228759766, 0.011808633804321289, 0.012514114379882812, 0.013219594955444336, 0.01392507553100586, 0.014630556106567383, 0.015336036682128906, 0.01604151725769043, 0.016746997833251953, 0.017452478408813477, 0.018157958984375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 11.0, 10.0, 15.0, 20.0, 34.0, 32.0, 48.0, 61.0, 67.0, 105.0, 131.0, 104.0, 93.0, 70.0, 48.0, 39.0, 25.0, 22.0, 18.0, 9.0, 14.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026123046875, -0.025407791137695312, -0.024692535400390625, -0.023977279663085938, -0.02326202392578125, -0.022546768188476562, -0.021831512451171875, -0.021116256713867188, -0.0204010009765625, -0.019685745239257812, -0.018970489501953125, -0.018255233764648438, -0.01753997802734375, -0.016824722290039062, -0.016109466552734375, -0.015394210815429688, -0.014678955078125, -0.013963699340820312, -0.013248443603515625, -0.012533187866210938, -0.01181793212890625, -0.011102676391601562, -0.010387420654296875, -0.009672164916992188, -0.0089569091796875, -0.008241653442382812, -0.007526397705078125, -0.0068111419677734375, -0.00609588623046875, -0.0053806304931640625, -0.004665374755859375, -0.0039501190185546875, -0.00323486328125, -0.0025196075439453125, -0.001804351806640625, -0.0010890960693359375, -0.00037384033203125, 0.0003414154052734375, 0.001056671142578125, 0.0017719268798828125, 0.0024871826171875, 0.0032024383544921875, 0.003917694091796875, 0.0046329498291015625, 0.00534820556640625, 0.0060634613037109375, 0.006778717041015625, 0.0074939727783203125, 0.008209228515625, 0.008924484252929688, 0.009639739990234375, 0.010354995727539062, 0.01107025146484375, 0.011785507202148438, 0.012500762939453125, 0.013216018676757812, 0.0139312744140625, 0.014646530151367188, 0.015361785888671875, 0.016077041625976562, 0.01679229736328125, 0.017507553100585938, 0.018222808837890625, 0.018938064575195312, 0.0196533203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 13.0, 29.0, 47.0, 89.0, 128.0, 169.0, 169.0, 152.0, 93.0, 54.0, 24.0, 19.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2519371509552002, -0.2371351718902588, -0.22233319282531738, -0.20753121376037598, -0.19272923469543457, -0.17792725563049316, -0.16312527656555176, -0.14832329750061035, -0.13352131843566895, -0.11871933937072754, -0.10391736030578613, -0.08911538124084473, -0.07431340217590332, -0.05951143056154251, -0.044709451496601105, -0.0299074724316597, -0.01510550081729889, -0.0003035226836800575, 0.014498455449938774, 0.02930043265223503, 0.04410241171717644, 0.058904387056827545, 0.07370636612176895, 0.08850834518671036, 0.10331032425165176, 0.11811230331659317, 0.13291427493095398, 0.14771625399589539, 0.1625182330608368, 0.1773202121257782, 0.1921221911907196, 0.206924170255661, 0.22172614932060242, 0.23652812838554382, 0.25133010745048523, 0.26613208651542664, 0.28093406558036804, 0.29573604464530945, 0.31053802371025085, 0.32534000277519226, 0.34014198184013367, 0.3549439609050751, 0.3697459399700165, 0.3845479190349579, 0.3993498980998993, 0.4141518771648407, 0.4289538562297821, 0.4437558352947235, 0.45855778455734253, 0.47335976362228394, 0.48816174268722534, 0.5029637217521667, 0.5177657008171082, 0.5325676798820496, 0.547369658946991, 0.5621716380119324, 0.5769736170768738, 0.5917755961418152, 0.6065775752067566, 0.621379554271698, 0.6361815333366394, 0.6509835124015808, 0.6657854914665222, 0.6805874705314636, 0.695389449596405]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 13.0, 11.0, 22.0, 23.0, 28.0, 34.0, 28.0, 36.0, 50.0, 41.0, 61.0, 53.0, 72.0, 70.0, 66.0, 58.0, 53.0, 54.0, 48.0, 25.0, 48.0, 22.0, 17.0, 16.0, 10.0, 10.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34588414430618286, -0.33211013674736023, -0.31833615899086, -0.30456215143203735, -0.2907881736755371, -0.2770141661167145, -0.26324015855789185, -0.2494661659002304, -0.23569217324256897, -0.22191818058490753, -0.2081441879272461, -0.19437018036842346, -0.18059618771076202, -0.16682219505310059, -0.15304818749427795, -0.13927419483661652, -0.12550020217895508, -0.11172620952129364, -0.0979522094130516, -0.08417820930480957, -0.07040421664714813, -0.056630223989486694, -0.04285622388124466, -0.029082223773002625, -0.015308231115341187, -0.00153423473238945, 0.012239761650562286, 0.026013758033514023, 0.03978775441646576, 0.0535617470741272, 0.06733574718236923, 0.08110974729061127, 0.0948837399482727, 0.10865773260593414, 0.12243173271417618, 0.1362057328224182, 0.14997972548007965, 0.1637537181377411, 0.17752772569656372, 0.19130171835422516, 0.2050757110118866, 0.21884970366954803, 0.23262369632720947, 0.2463977038860321, 0.26017171144485474, 0.273945689201355, 0.2877196967601776, 0.30149370431900024, 0.3152676820755005, 0.3290416896343231, 0.34281566739082336, 0.356589674949646, 0.37036365270614624, 0.38413766026496887, 0.3979116678237915, 0.41168564558029175, 0.4254596531391144, 0.439233660697937, 0.45300763845443726, 0.4667816460132599, 0.4805556535720825, 0.49432963132858276, 0.508103609085083, 0.521877646446228, 0.5356516242027283]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 15.0, 40.0, 101.0, 263.0, 953.0, 4722.0, 46288.0, 4013498.0, 118595.0, 7817.0, 1385.0, 378.0, 129.0, 50.0, 23.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06097412109375, -0.057702064514160156, -0.05443000793457031, -0.05115795135498047, -0.047885894775390625, -0.04461383819580078, -0.04134178161621094, -0.038069725036621094, -0.03479766845703125, -0.031525611877441406, -0.028253555297851562, -0.02498149871826172, -0.021709442138671875, -0.01843738555908203, -0.015165328979492188, -0.011893272399902344, -0.0086212158203125, -0.005349159240722656, -0.0020771026611328125, 0.0011949539184570312, 0.004467010498046875, 0.007739067077636719, 0.011011123657226562, 0.014283180236816406, 0.01755523681640625, 0.020827293395996094, 0.024099349975585938, 0.02737140655517578, 0.030643463134765625, 0.03391551971435547, 0.03718757629394531, 0.040459632873535156, 0.043731689453125, 0.047003746032714844, 0.05027580261230469, 0.05354785919189453, 0.056819915771484375, 0.06009197235107422, 0.06336402893066406, 0.0666360855102539, 0.06990814208984375, 0.0731801986694336, 0.07645225524902344, 0.07972431182861328, 0.08299636840820312, 0.08626842498779297, 0.08954048156738281, 0.09281253814697266, 0.0960845947265625, 0.09935665130615234, 0.10262870788574219, 0.10590076446533203, 0.10917282104492188, 0.11244487762451172, 0.11571693420410156, 0.1189889907836914, 0.12226104736328125, 0.1255331039428711, 0.12880516052246094, 0.13207721710205078, 0.13534927368164062, 0.13862133026123047, 0.1418933868408203, 0.14516544342041016, 0.1484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 13.0, 6.0, 9.0, 15.0, 28.0, 25.0, 20.0, 36.0, 34.0, 49.0, 44.0, 52.0, 51.0, 52.0, 54.0, 59.0, 62.0, 55.0, 58.0, 48.0, 37.0, 25.0, 34.0, 30.0, 22.0, 16.0, 13.0, 10.0, 9.0, 10.0, 9.0, 1.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0227813720703125, -0.02211475372314453, -0.021448135375976562, -0.020781517028808594, -0.020114898681640625, -0.019448280334472656, -0.018781661987304688, -0.01811504364013672, -0.01744842529296875, -0.01678180694580078, -0.016115188598632812, -0.015448570251464844, -0.014781951904296875, -0.014115333557128906, -0.013448715209960938, -0.012782096862792969, -0.012115478515625, -0.011448860168457031, -0.010782241821289062, -0.010115623474121094, -0.009449005126953125, -0.008782386779785156, -0.008115768432617188, -0.007449150085449219, -0.00678253173828125, -0.006115913391113281, -0.0054492950439453125, -0.004782676696777344, -0.004116058349609375, -0.0034494400024414062, -0.0027828216552734375, -0.0021162033081054688, -0.0014495849609375, -0.0007829666137695312, -0.0001163482666015625, 0.0005502700805664062, 0.001216888427734375, 0.0018835067749023438, 0.0025501251220703125, 0.0032167434692382812, 0.00388336181640625, 0.004549980163574219, 0.0052165985107421875, 0.005883216857910156, 0.006549835205078125, 0.007216453552246094, 0.007883071899414062, 0.008549690246582031, 0.00921630859375, 0.009882926940917969, 0.010549545288085938, 0.011216163635253906, 0.011882781982421875, 0.012549400329589844, 0.013216018676757812, 0.013882637023925781, 0.01454925537109375, 0.015215873718261719, 0.015882492065429688, 0.016549110412597656, 0.017215728759765625, 0.017882347106933594, 0.018548965454101562, 0.01921558380126953, 0.0198822021484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 4.0, 5.0, 4.0, 12.0, 13.0, 17.0, 26.0, 43.0, 64.0, 142.0, 281.0, 810.0, 2818.0, 15706.0, 228263.0, 3885749.0, 51374.0, 6495.0, 1503.0, 502.0, 194.0, 74.0, 57.0, 37.0, 29.0, 12.0, 10.0, 9.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.0901031494140625, -0.087310791015625, -0.0845184326171875, -0.08172607421875, -0.0789337158203125, -0.076141357421875, -0.0733489990234375, -0.070556640625, -0.0677642822265625, -0.064971923828125, -0.0621795654296875, -0.05938720703125, -0.0565948486328125, -0.053802490234375, -0.0510101318359375, -0.0482177734375, -0.0454254150390625, -0.042633056640625, -0.0398406982421875, -0.03704833984375, -0.0342559814453125, -0.031463623046875, -0.0286712646484375, -0.02587890625, -0.0230865478515625, -0.020294189453125, -0.0175018310546875, -0.01470947265625, -0.0119171142578125, -0.009124755859375, -0.0063323974609375, -0.0035400390625, -0.0007476806640625, 0.002044677734375, 0.0048370361328125, 0.00762939453125, 0.0104217529296875, 0.013214111328125, 0.0160064697265625, 0.018798828125, 0.0215911865234375, 0.024383544921875, 0.0271759033203125, 0.02996826171875, 0.0327606201171875, 0.035552978515625, 0.0383453369140625, 0.0411376953125, 0.0439300537109375, 0.046722412109375, 0.0495147705078125, 0.05230712890625, 0.0550994873046875, 0.057891845703125, 0.0606842041015625, 0.0634765625, 0.0662689208984375, 0.069061279296875, 0.0718536376953125, 0.07464599609375, 0.0774383544921875, 0.080230712890625, 0.0830230712890625, 0.0858154296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 6.0, 5.0, 6.0, 4.0, 9.0, 6.0, 14.0, 14.0, 17.0, 50.0, 76.0, 211.0, 804.0, 1778.0, 656.0, 178.0, 90.0, 38.0, 49.0, 26.0, 13.0, 8.0, 4.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07513427734375, -0.0730733871459961, -0.07101249694824219, -0.06895160675048828, -0.06689071655273438, -0.06482982635498047, -0.06276893615722656, -0.060708045959472656, -0.05864715576171875, -0.056586265563964844, -0.05452537536621094, -0.05246448516845703, -0.050403594970703125, -0.04834270477294922, -0.04628181457519531, -0.044220924377441406, -0.0421600341796875, -0.040099143981933594, -0.03803825378417969, -0.03597736358642578, -0.033916473388671875, -0.03185558319091797, -0.029794692993164062, -0.027733802795410156, -0.02567291259765625, -0.023612022399902344, -0.021551132202148438, -0.01949024200439453, -0.017429351806640625, -0.015368461608886719, -0.013307571411132812, -0.011246681213378906, -0.009185791015625, -0.007124900817871094, -0.0050640106201171875, -0.0030031204223632812, -0.000942230224609375, 0.0011186599731445312, 0.0031795501708984375, 0.005240440368652344, 0.00730133056640625, 0.009362220764160156, 0.011423110961914062, 0.013484001159667969, 0.015544891357421875, 0.01760578155517578, 0.019666671752929688, 0.021727561950683594, 0.0237884521484375, 0.025849342346191406, 0.027910232543945312, 0.02997112274169922, 0.032032012939453125, 0.03409290313720703, 0.03615379333496094, 0.038214683532714844, 0.04027557373046875, 0.042336463928222656, 0.04439735412597656, 0.04645824432373047, 0.048519134521484375, 0.05058002471923828, 0.05264091491699219, 0.054701805114746094, 0.0567626953125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 8.0, 22.0, 60.0, 166.0, 283.0, 270.0, 114.0, 37.0, 20.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.070047378540039, -1.0472526550292969, -1.0244579315185547, -1.0016632080078125, -0.9788684844970703, -0.9560737013816833, -0.9332789778709412, -0.910484254360199, -0.8876895308494568, -0.8648948073387146, -0.8421000838279724, -0.8193053603172302, -0.7965105772018433, -0.7737158536911011, -0.7509211301803589, -0.7281264066696167, -0.7053316831588745, -0.6825369596481323, -0.6597422361373901, -0.636947512626648, -0.6141527891159058, -0.5913580060005188, -0.5685632824897766, -0.5457685589790344, -0.5229738354682922, -0.50017911195755, -0.47738438844680786, -0.4545896351337433, -0.4317949116230011, -0.4090001881122589, -0.38620543479919434, -0.36341071128845215, -0.34061601758003235, -0.31782129406929016, -0.2950265407562256, -0.2722318172454834, -0.2494370937347412, -0.22664237022399902, -0.20384763181209564, -0.18105289340019226, -0.15825816988945007, -0.13546344637870789, -0.1126687079668045, -0.08987397700548172, -0.06707924604415894, -0.04428451508283615, -0.021489784121513367, 0.0013049542903900146, 0.024099677801132202, 0.04689440876245499, 0.06968913972377777, 0.09248387068510056, 0.11527860164642334, 0.13807332515716553, 0.1608680635690689, 0.1836628019809723, 0.20645752549171448, 0.22925224900245667, 0.25204700231552124, 0.2748417258262634, 0.2976364493370056, 0.3204311728477478, 0.34322589635849, 0.36602064967155457, 0.38881537318229675]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 10.0, 9.0, 17.0, 25.0, 19.0, 14.0, 21.0, 24.0, 29.0, 38.0, 34.0, 58.0, 52.0, 53.0, 55.0, 49.0, 57.0, 49.0, 44.0, 43.0, 42.0, 34.0, 26.0, 28.0, 33.0, 22.0, 15.0, 18.0, 15.0, 15.0, 7.0, 9.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.21915125846862793, -0.21306724846363068, -0.20698323845863342, -0.20089921355247498, -0.19481520354747772, -0.18873119354248047, -0.18264718353748322, -0.17656317353248596, -0.17047914862632751, -0.16439513862133026, -0.158311128616333, -0.15222710371017456, -0.1461430937051773, -0.14005908370018005, -0.1339750736951828, -0.12789106369018555, -0.1218070536851883, -0.11572304368019104, -0.10963902622461319, -0.10355501621961594, -0.09747099876403809, -0.09138698875904083, -0.08530297875404358, -0.07921896874904633, -0.07313495129346848, -0.06705094128847122, -0.06096692383289337, -0.05488291382789612, -0.048798900097608566, -0.042714886367321014, -0.03663087636232376, -0.03054686263203621, -0.024462848901748657, -0.018378835171461105, -0.012294823303818703, -0.0062108114361763, -0.00012679770588874817, 0.005957216024398804, 0.012041226029396057, 0.01812523975968361, 0.02420925348997116, 0.030293267220258713, 0.036377280950546265, 0.04246129095554352, 0.04854530468583107, 0.05462931841611862, 0.060713328421115875, 0.06679734587669373, 0.07288135588169098, 0.07896536588668823, 0.08504938334226608, 0.09113339334726334, 0.09721741080284119, 0.10330142080783844, 0.1093854308128357, 0.11546944081783295, 0.1215534582734108, 0.12763747572898865, 0.1337214857339859, 0.13980549573898315, 0.1458895057439804, 0.15197351574897766, 0.1580575406551361, 0.16414155066013336, 0.17022556066513062]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 11.0, 18.0, 40.0, 53.0, 109.0, 259.0, 587.0, 1533.0, 4142.0, 13246.0, 49022.0, 183917.0, 428872.0, 263740.0, 73949.0, 19727.0, 5960.0, 1957.0, 751.0, 301.0, 149.0, 74.0, 39.0, 22.0, 8.0, 9.0, 11.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.052154541015625, -0.050731658935546875, -0.04930877685546875, -0.047885894775390625, -0.0464630126953125, -0.045040130615234375, -0.04361724853515625, -0.042194366455078125, -0.040771484375, -0.039348602294921875, -0.03792572021484375, -0.036502838134765625, -0.0350799560546875, -0.033657073974609375, -0.03223419189453125, -0.030811309814453125, -0.029388427734375, -0.027965545654296875, -0.02654266357421875, -0.025119781494140625, -0.0236968994140625, -0.022274017333984375, -0.02085113525390625, -0.019428253173828125, -0.01800537109375, -0.016582489013671875, -0.01515960693359375, -0.013736724853515625, -0.0123138427734375, -0.010890960693359375, -0.00946807861328125, -0.008045196533203125, -0.006622314453125, -0.005199432373046875, -0.00377655029296875, -0.002353668212890625, -0.0009307861328125, 0.000492095947265625, 0.00191497802734375, 0.003337860107421875, 0.0047607421875, 0.006183624267578125, 0.00760650634765625, 0.009029388427734375, 0.0104522705078125, 0.011875152587890625, 0.01329803466796875, 0.014720916748046875, 0.016143798828125, 0.017566680908203125, 0.01898956298828125, 0.020412445068359375, 0.0218353271484375, 0.023258209228515625, 0.02468109130859375, 0.026103973388671875, 0.02752685546875, 0.028949737548828125, 0.03037261962890625, 0.031795501708984375, 0.0332183837890625, 0.034641265869140625, 0.03606414794921875, 0.037487030029296875, 0.038909912109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 3.0, 6.0, 2.0, 16.0, 16.0, 16.0, 20.0, 23.0, 30.0, 34.0, 43.0, 40.0, 42.0, 41.0, 51.0, 40.0, 64.0, 50.0, 46.0, 50.0, 62.0, 56.0, 36.0, 34.0, 27.0, 26.0, 23.0, 18.0, 10.0, 16.0, 11.0, 11.0, 10.0, 5.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185089111328125, -0.017876386642456055, -0.01724386215209961, -0.016611337661743164, -0.01597881317138672, -0.015346288681030273, -0.014713764190673828, -0.014081239700317383, -0.013448715209960938, -0.012816190719604492, -0.012183666229248047, -0.011551141738891602, -0.010918617248535156, -0.010286092758178711, -0.009653568267822266, -0.00902104377746582, -0.008388519287109375, -0.00775599479675293, -0.007123470306396484, -0.006490945816040039, -0.005858421325683594, -0.0052258968353271484, -0.004593372344970703, -0.003960847854614258, -0.0033283233642578125, -0.002695798873901367, -0.002063274383544922, -0.0014307498931884766, -0.0007982254028320312, -0.00016570091247558594, 0.0004668235778808594, 0.0010993480682373047, 0.00173187255859375, 0.0023643970489501953, 0.0029969215393066406, 0.003629446029663086, 0.004261970520019531, 0.0048944950103759766, 0.005527019500732422, 0.006159543991088867, 0.0067920684814453125, 0.007424592971801758, 0.008057117462158203, 0.008689641952514648, 0.009322166442871094, 0.009954690933227539, 0.010587215423583984, 0.01121973991394043, 0.011852264404296875, 0.01248478889465332, 0.013117313385009766, 0.013749837875366211, 0.014382362365722656, 0.015014886856079102, 0.015647411346435547, 0.016279935836791992, 0.016912460327148438, 0.017544984817504883, 0.018177509307861328, 0.018810033798217773, 0.01944255828857422, 0.020075082778930664, 0.02070760726928711, 0.021340131759643555, 0.02197265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 17.0, 8.0, 19.0, 25.0, 33.0, 57.0, 78.0, 136.0, 244.0, 465.0, 911.0, 2218.0, 8502.0, 79960.0, 795018.0, 144053.0, 11845.0, 2648.0, 1061.0, 507.0, 266.0, 165.0, 87.0, 66.0, 52.0, 27.0, 17.0, 20.0, 7.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.06261730194091797, -0.06017112731933594, -0.057724952697753906, -0.055278778076171875, -0.052832603454589844, -0.05038642883300781, -0.04794025421142578, -0.04549407958984375, -0.04304790496826172, -0.04060173034667969, -0.038155555725097656, -0.035709381103515625, -0.033263206481933594, -0.030817031860351562, -0.02837085723876953, -0.0259246826171875, -0.02347850799560547, -0.021032333374023438, -0.018586158752441406, -0.016139984130859375, -0.013693809509277344, -0.011247634887695312, -0.008801460266113281, -0.00635528564453125, -0.003909111022949219, -0.0014629364013671875, 0.0009832382202148438, 0.003429412841796875, 0.005875587463378906, 0.008321762084960938, 0.010767936706542969, 0.013214111328125, 0.01566028594970703, 0.018106460571289062, 0.020552635192871094, 0.022998809814453125, 0.025444984436035156, 0.027891159057617188, 0.03033733367919922, 0.03278350830078125, 0.03522968292236328, 0.03767585754394531, 0.040122032165527344, 0.042568206787109375, 0.045014381408691406, 0.04746055603027344, 0.04990673065185547, 0.0523529052734375, 0.05479907989501953, 0.05724525451660156, 0.059691429138183594, 0.062137603759765625, 0.06458377838134766, 0.06702995300292969, 0.06947612762451172, 0.07192230224609375, 0.07436847686767578, 0.07681465148925781, 0.07926082611083984, 0.08170700073242188, 0.0841531753540039, 0.08659934997558594, 0.08904552459716797, 0.09149169921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 12.0, 10.0, 8.0, 11.0, 21.0, 25.0, 22.0, 30.0, 32.0, 45.0, 47.0, 54.0, 52.0, 61.0, 50.0, 47.0, 61.0, 58.0, 49.0, 43.0, 50.0, 26.0, 26.0, 35.0, 26.0, 23.0, 15.0, 15.0, 14.0, 10.0, 9.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086181640625, -0.08368587493896484, -0.08119010925292969, -0.07869434356689453, -0.07619857788085938, -0.07370281219482422, -0.07120704650878906, -0.0687112808227539, -0.06621551513671875, -0.0637197494506836, -0.06122398376464844, -0.05872821807861328, -0.056232452392578125, -0.05373668670654297, -0.05124092102050781, -0.048745155334472656, -0.0462493896484375, -0.043753623962402344, -0.04125785827636719, -0.03876209259033203, -0.036266326904296875, -0.03377056121826172, -0.03127479553222656, -0.028779029846191406, -0.02628326416015625, -0.023787498474121094, -0.021291732788085938, -0.01879596710205078, -0.016300201416015625, -0.013804435729980469, -0.011308670043945312, -0.008812904357910156, -0.006317138671875, -0.0038213729858398438, -0.0013256072998046875, 0.0011701583862304688, 0.003665924072265625, 0.006161689758300781, 0.008657455444335938, 0.011153221130371094, 0.01364898681640625, 0.016144752502441406, 0.018640518188476562, 0.02113628387451172, 0.023632049560546875, 0.02612781524658203, 0.028623580932617188, 0.031119346618652344, 0.0336151123046875, 0.036110877990722656, 0.03860664367675781, 0.04110240936279297, 0.043598175048828125, 0.04609394073486328, 0.04858970642089844, 0.051085472106933594, 0.05358123779296875, 0.056077003479003906, 0.05857276916503906, 0.06106853485107422, 0.06356430053710938, 0.06606006622314453, 0.06855583190917969, 0.07105159759521484, 0.07354736328125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 16.0, 51.0, 168.0, 900.0, 18363.0, 1018103.0, 10058.0, 682.0, 137.0, 38.0, 21.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11865234375, -0.11571788787841797, -0.11278343200683594, -0.1098489761352539, -0.10691452026367188, -0.10398006439208984, -0.10104560852050781, -0.09811115264892578, -0.09517669677734375, -0.09224224090576172, -0.08930778503417969, -0.08637332916259766, -0.08343887329101562, -0.0805044174194336, -0.07756996154785156, -0.07463550567626953, -0.0717010498046875, -0.06876659393310547, -0.06583213806152344, -0.0628976821899414, -0.059963226318359375, -0.057028770446777344, -0.05409431457519531, -0.05115985870361328, -0.04822540283203125, -0.04529094696044922, -0.04235649108886719, -0.039422035217285156, -0.036487579345703125, -0.033553123474121094, -0.030618667602539062, -0.02768421173095703, -0.024749755859375, -0.02181529998779297, -0.018880844116210938, -0.015946388244628906, -0.013011932373046875, -0.010077476501464844, -0.0071430206298828125, -0.004208564758300781, -0.00127410888671875, 0.0016603469848632812, 0.0045948028564453125, 0.007529258728027344, 0.010463714599609375, 0.013398170471191406, 0.016332626342773438, 0.01926708221435547, 0.0222015380859375, 0.02513599395751953, 0.028070449829101562, 0.031004905700683594, 0.033939361572265625, 0.036873817443847656, 0.03980827331542969, 0.04274272918701172, 0.04567718505859375, 0.04861164093017578, 0.05154609680175781, 0.054480552673339844, 0.057415008544921875, 0.060349464416503906, 0.06328392028808594, 0.06621837615966797, 0.06915283203125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 10.0, 7.0, 9.0, 12.0, 23.0, 25.0, 46.0, 58.0, 97.0, 93.0, 78.0, 116.0, 86.0, 85.0, 90.0, 36.0, 41.0, 29.0, 18.0, 14.0, 7.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2874603271484375e-05, -1.2556090950965881e-05, -1.2237578630447388e-05, -1.1919066309928894e-05, -1.16005539894104e-05, -1.1282041668891907e-05, -1.0963529348373413e-05, -1.064501702785492e-05, -1.0326504707336426e-05, -1.0007992386817932e-05, -9.689480066299438e-06, -9.370967745780945e-06, -9.052455425262451e-06, -8.733943104743958e-06, -8.415430784225464e-06, -8.09691846370697e-06, -7.778406143188477e-06, -7.459893822669983e-06, -7.141381502151489e-06, -6.822869181632996e-06, -6.504356861114502e-06, -6.185844540596008e-06, -5.867332220077515e-06, -5.548819899559021e-06, -5.230307579040527e-06, -4.911795258522034e-06, -4.59328293800354e-06, -4.274770617485046e-06, -3.956258296966553e-06, -3.637745976448059e-06, -3.3192336559295654e-06, -3.0007213354110718e-06, -2.682209014892578e-06, -2.3636966943740845e-06, -2.045184373855591e-06, -1.7266720533370972e-06, -1.4081597328186035e-06, -1.0896474123001099e-06, -7.711350917816162e-07, -4.5262277126312256e-07, -1.341104507446289e-07, 1.8440186977386475e-07, 5.029141902923584e-07, 8.21426510810852e-07, 1.1399388313293457e-06, 1.4584511518478394e-06, 1.776963472366333e-06, 2.0954757928848267e-06, 2.4139881134033203e-06, 2.732500433921814e-06, 3.0510127544403076e-06, 3.3695250749588013e-06, 3.688037395477295e-06, 4.0065497159957886e-06, 4.325062036514282e-06, 4.643574357032776e-06, 4.9620866775512695e-06, 5.280598998069763e-06, 5.599111318588257e-06, 5.9176236391067505e-06, 6.236135959625244e-06, 6.554648280143738e-06, 6.8731606006622314e-06, 7.191672921180725e-06, 7.510185241699219e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 13.0, 18.0, 13.0, 18.0, 34.0, 56.0, 107.0, 175.0, 346.0, 926.0, 3066.0, 17094.0, 250600.0, 723952.0, 43835.0, 5703.0, 1516.0, 515.0, 225.0, 114.0, 85.0, 50.0, 26.0, 14.0, 17.0, 13.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033050537109375, -0.03205513954162598, -0.031059741973876953, -0.03006434440612793, -0.029068946838378906, -0.028073549270629883, -0.02707815170288086, -0.026082754135131836, -0.025087356567382812, -0.02409195899963379, -0.023096561431884766, -0.022101163864135742, -0.02110576629638672, -0.020110368728637695, -0.019114971160888672, -0.01811957359313965, -0.017124176025390625, -0.0161287784576416, -0.015133380889892578, -0.014137983322143555, -0.013142585754394531, -0.012147188186645508, -0.011151790618896484, -0.010156393051147461, -0.009160995483398438, -0.008165597915649414, -0.007170200347900391, -0.006174802780151367, -0.005179405212402344, -0.00418400764465332, -0.003188610076904297, -0.0021932125091552734, -0.00119781494140625, -0.00020241737365722656, 0.0007929801940917969, 0.0017883777618408203, 0.0027837753295898438, 0.003779172897338867, 0.004774570465087891, 0.005769968032836914, 0.0067653656005859375, 0.007760763168334961, 0.008756160736083984, 0.009751558303833008, 0.010746955871582031, 0.011742353439331055, 0.012737751007080078, 0.013733148574829102, 0.014728546142578125, 0.01572394371032715, 0.016719341278076172, 0.017714738845825195, 0.01871013641357422, 0.019705533981323242, 0.020700931549072266, 0.02169632911682129, 0.022691726684570312, 0.023687124252319336, 0.02468252182006836, 0.025677919387817383, 0.026673316955566406, 0.02766871452331543, 0.028664112091064453, 0.029659509658813477, 0.0306549072265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 10.0, 9.0, 8.0, 10.0, 18.0, 21.0, 23.0, 32.0, 24.0, 44.0, 45.0, 60.0, 69.0, 63.0, 71.0, 63.0, 72.0, 62.0, 47.0, 41.0, 31.0, 35.0, 31.0, 24.0, 17.0, 18.0, 14.0, 11.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0154571533203125, -0.014914751052856445, -0.01437234878540039, -0.013829946517944336, -0.013287544250488281, -0.012745141983032227, -0.012202739715576172, -0.011660337448120117, -0.011117935180664062, -0.010575532913208008, -0.010033130645751953, -0.009490728378295898, -0.008948326110839844, -0.008405923843383789, -0.007863521575927734, -0.00732111930847168, -0.006778717041015625, -0.00623631477355957, -0.005693912506103516, -0.005151510238647461, -0.004609107971191406, -0.0040667057037353516, -0.003524303436279297, -0.002981901168823242, -0.0024394989013671875, -0.0018970966339111328, -0.0013546943664550781, -0.0008122920989990234, -0.00026988983154296875, 0.00027251243591308594, 0.0008149147033691406, 0.0013573169708251953, 0.00189971923828125, 0.0024421215057373047, 0.0029845237731933594, 0.003526926040649414, 0.004069328308105469, 0.0046117305755615234, 0.005154132843017578, 0.005696535110473633, 0.0062389373779296875, 0.006781339645385742, 0.007323741912841797, 0.007866144180297852, 0.008408546447753906, 0.008950948715209961, 0.009493350982666016, 0.01003575325012207, 0.010578155517578125, 0.01112055778503418, 0.011662960052490234, 0.012205362319946289, 0.012747764587402344, 0.013290166854858398, 0.013832569122314453, 0.014374971389770508, 0.014917373657226562, 0.015459775924682617, 0.016002178192138672, 0.016544580459594727, 0.01708698272705078, 0.017629384994506836, 0.01817178726196289, 0.018714189529418945, 0.019256591796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 25.0, 129.0, 504.0, 268.0, 61.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4143719673156738, -1.3725115060806274, -1.330651044845581, -1.2887905836105347, -1.2469301223754883, -1.205069661140442, -1.1632091999053955, -1.1213487386703491, -1.0794882774353027, -1.0376278162002563, -0.99576735496521, -0.9539068937301636, -0.9120464324951172, -0.8701859712600708, -0.8283255100250244, -0.786465048789978, -0.7446046471595764, -0.70274418592453, -0.6608837246894836, -0.6190232634544373, -0.5771628022193909, -0.5353023409843445, -0.4934419095516205, -0.4515814483165741, -0.4097209870815277, -0.3678605258464813, -0.32600006461143494, -0.28413963317871094, -0.24227915704250336, -0.20041869580745697, -0.15855824947357178, -0.11669778823852539, -0.074837327003479, -0.032976869493722916, 0.008883588016033173, 0.05074404180049896, 0.09260450303554535, 0.13446496427059174, 0.17632541060447693, 0.21818587183952332, 0.2600463330745697, 0.3019067943096161, 0.3437672555446625, 0.3856276869773865, 0.42748814821243286, 0.46934860944747925, 0.5112090706825256, 0.553069531917572, 0.5949299931526184, 0.6367904543876648, 0.6786509156227112, 0.7205113768577576, 0.762371838092804, 0.8042322993278503, 0.846092700958252, 0.8879531621932983, 0.9298136234283447, 0.9716740846633911, 1.0135345458984375, 1.0553950071334839, 1.0972554683685303, 1.1391159296035767, 1.180976390838623, 1.2228368520736694, 1.2646973133087158]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 3.0, 11.0, 8.0, 8.0, 11.0, 16.0, 16.0, 26.0, 23.0, 24.0, 21.0, 35.0, 47.0, 44.0, 45.0, 55.0, 56.0, 63.0, 54.0, 56.0, 52.0, 48.0, 40.0, 37.0, 28.0, 35.0, 27.0, 15.0, 15.0, 21.0, 14.0, 9.0, 11.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26651525497436523, -0.25771552324295044, -0.24891576170921326, -0.24011602997779846, -0.23131628334522247, -0.22251653671264648, -0.2137168049812317, -0.2049170583486557, -0.1961173117160797, -0.18731756508350372, -0.17851781845092773, -0.16971808671951294, -0.16091834008693695, -0.15211859345436096, -0.14331886172294617, -0.13451911509037018, -0.1257193684577942, -0.1169196218252182, -0.10811988264322281, -0.09932014346122742, -0.09052039682865143, -0.08172065019607544, -0.07292091101408005, -0.06412117183208466, -0.05532142519950867, -0.04652168229222298, -0.037721939384937286, -0.028922196477651596, -0.020122453570365906, -0.011322710663080215, -0.002522967755794525, 0.006276775151491165, 0.015076518058776855, 0.023876260966062546, 0.032676003873348236, 0.041475746780633926, 0.05027548968791962, 0.05907523259520531, 0.067874975502491, 0.07667471468448639, 0.08547446131706238, 0.09427420794963837, 0.10307394713163376, 0.11187368631362915, 0.12067343294620514, 0.12947317957878113, 0.13827291131019592, 0.1470726579427719, 0.1558724045753479, 0.1646721512079239, 0.17347189784049988, 0.18227162957191467, 0.19107137620449066, 0.19987112283706665, 0.20867085456848145, 0.21747060120105743, 0.22627034783363342, 0.2350700944662094, 0.2438698410987854, 0.2526695728302002, 0.261469304561615, 0.2702690660953522, 0.27906879782676697, 0.28786855936050415, 0.29666829109191895]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 9.0, 15.0, 63.0, 187.0, 734.0, 4192573.0, 512.0, 143.0, 37.0, 11.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.375, -0.324462890625, -0.27392578125, -0.223388671875, -0.1728515625, -0.122314453125, -0.07177734375, -0.021240234375, 0.029296875, 0.079833984375, 0.13037109375, 0.180908203125, 0.2314453125, 0.281982421875, 0.33251953125, 0.383056640625, 0.43359375, 0.484130859375, 0.53466796875, 0.585205078125, 0.6357421875, 0.686279296875, 0.73681640625, 0.787353515625, 0.837890625, 0.888427734375, 0.93896484375, 0.989501953125, 1.0400390625, 1.090576171875, 1.14111328125, 1.191650390625, 1.2421875, 1.292724609375, 1.34326171875, 1.393798828125, 1.4443359375, 1.494873046875, 1.54541015625, 1.595947265625, 1.646484375, 1.697021484375, 1.74755859375, 1.798095703125, 1.8486328125, 1.899169921875, 1.94970703125, 2.000244140625, 2.05078125, 2.101318359375, 2.15185546875, 2.202392578125, 2.2529296875, 2.303466796875, 2.35400390625, 2.404541015625, 2.455078125, 2.505615234375, 2.55615234375, 2.606689453125, 2.6572265625, 2.707763671875, 2.75830078125, 2.808837890625, 2.859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 16.0, 17.0, 19.0, 29.0, 30.0, 38.0, 37.0, 59.0, 58.0, 65.0, 55.0, 63.0, 60.0, 69.0, 62.0, 60.0, 56.0, 37.0, 30.0, 22.0, 27.0, 15.0, 16.0, 14.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018218994140625, -0.017462491989135742, -0.016705989837646484, -0.015949487686157227, -0.015192985534667969, -0.014436483383178711, -0.013679981231689453, -0.012923479080200195, -0.012166976928710938, -0.01141047477722168, -0.010653972625732422, -0.009897470474243164, -0.009140968322753906, -0.008384466171264648, -0.007627964019775391, -0.006871461868286133, -0.006114959716796875, -0.005358457565307617, -0.004601955413818359, -0.0038454532623291016, -0.0030889511108398438, -0.002332448959350586, -0.0015759468078613281, -0.0008194446563720703, -6.29425048828125e-05, 0.0006935596466064453, 0.0014500617980957031, 0.002206563949584961, 0.0029630661010742188, 0.0037195682525634766, 0.004476070404052734, 0.005232572555541992, 0.00598907470703125, 0.006745576858520508, 0.007502079010009766, 0.008258581161499023, 0.009015083312988281, 0.009771585464477539, 0.010528087615966797, 0.011284589767456055, 0.012041091918945312, 0.01279759407043457, 0.013554096221923828, 0.014310598373413086, 0.015067100524902344, 0.0158236026763916, 0.01658010482788086, 0.017336606979370117, 0.018093109130859375, 0.018849611282348633, 0.01960611343383789, 0.02036261558532715, 0.021119117736816406, 0.021875619888305664, 0.022632122039794922, 0.02338862419128418, 0.024145126342773438, 0.024901628494262695, 0.025658130645751953, 0.02641463279724121, 0.02717113494873047, 0.027927637100219727, 0.028684139251708984, 0.029440641403198242, 0.0301971435546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 10.0, 11.0, 17.0, 29.0, 68.0, 121.0, 214.0, 522.0, 1648.0, 8447.0, 66180.0, 3788660.0, 304220.0, 19394.0, 3294.0, 841.0, 311.0, 132.0, 73.0, 35.0, 18.0, 13.0, 8.0, 6.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.0668344497680664, -0.06433296203613281, -0.06183147430419922, -0.059329986572265625, -0.05682849884033203, -0.05432701110839844, -0.051825523376464844, -0.04932403564453125, -0.046822547912597656, -0.04432106018066406, -0.04181957244873047, -0.039318084716796875, -0.03681659698486328, -0.03431510925292969, -0.031813621520996094, -0.0293121337890625, -0.026810646057128906, -0.024309158325195312, -0.02180767059326172, -0.019306182861328125, -0.01680469512939453, -0.014303207397460938, -0.011801719665527344, -0.00930023193359375, -0.006798744201660156, -0.0042972564697265625, -0.0017957687377929688, 0.000705718994140625, 0.0032072067260742188, 0.0057086944580078125, 0.008210182189941406, 0.010711669921875, 0.013213157653808594, 0.015714645385742188, 0.01821613311767578, 0.020717620849609375, 0.02321910858154297, 0.025720596313476562, 0.028222084045410156, 0.03072357177734375, 0.033225059509277344, 0.03572654724121094, 0.03822803497314453, 0.040729522705078125, 0.04323101043701172, 0.04573249816894531, 0.048233985900878906, 0.0507354736328125, 0.053236961364746094, 0.05573844909667969, 0.05823993682861328, 0.060741424560546875, 0.06324291229248047, 0.06574440002441406, 0.06824588775634766, 0.07074737548828125, 0.07324886322021484, 0.07575035095214844, 0.07825183868408203, 0.08075332641601562, 0.08325481414794922, 0.08575630187988281, 0.0882577896118164, 0.09075927734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 12.0, 44.0, 37.0, 122.0, 243.0, 755.0, 1699.0, 730.0, 205.0, 77.0, 50.0, 19.0, 19.0, 19.0, 14.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0775146484375, -0.07532835006713867, -0.07314205169677734, -0.07095575332641602, -0.06876945495605469, -0.06658315658569336, -0.06439685821533203, -0.0622105598449707, -0.060024261474609375, -0.05783796310424805, -0.05565166473388672, -0.05346536636352539, -0.05127906799316406, -0.049092769622802734, -0.046906471252441406, -0.04472017288208008, -0.04253387451171875, -0.04034757614135742, -0.038161277770996094, -0.035974979400634766, -0.03378868103027344, -0.03160238265991211, -0.02941608428955078, -0.027229785919189453, -0.025043487548828125, -0.022857189178466797, -0.02067089080810547, -0.01848459243774414, -0.016298294067382812, -0.014111995697021484, -0.011925697326660156, -0.009739398956298828, -0.0075531005859375, -0.005366802215576172, -0.0031805038452148438, -0.0009942054748535156, 0.0011920928955078125, 0.0033783912658691406, 0.005564689636230469, 0.007750988006591797, 0.009937286376953125, 0.012123584747314453, 0.014309883117675781, 0.01649618148803711, 0.018682479858398438, 0.020868778228759766, 0.023055076599121094, 0.025241374969482422, 0.02742767333984375, 0.029613971710205078, 0.031800270080566406, 0.033986568450927734, 0.03617286682128906, 0.03835916519165039, 0.04054546356201172, 0.04273176193237305, 0.044918060302734375, 0.0471043586730957, 0.04929065704345703, 0.05147695541381836, 0.05366325378417969, 0.055849552154541016, 0.058035850524902344, 0.06022214889526367, 0.062408447265625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 18.0, 36.0, 92.0, 322.0, 403.0, 109.0, 14.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7876958847045898, -1.7506794929504395, -1.7136629819869995, -1.6766464710235596, -1.6396300792694092, -1.6026136875152588, -1.5655971765518188, -1.528580665588379, -1.4915642738342285, -1.4545478820800781, -1.4175313711166382, -1.3805148601531982, -1.3434984683990479, -1.3064820766448975, -1.2694655656814575, -1.2324490547180176, -1.1954326629638672, -1.1584162712097168, -1.1213997602462769, -1.084383249282837, -1.0473668575286865, -1.0103504657745361, -0.9733339548110962, -0.936317503452301, -0.8993010520935059, -0.8622846007347107, -0.8252681493759155, -0.7882516980171204, -0.7512352466583252, -0.71421879529953, -0.6772023439407349, -0.6401858925819397, -0.6031695604324341, -0.5661531090736389, -0.5291366577148438, -0.4921202063560486, -0.4551037549972534, -0.41808730363845825, -0.3810708522796631, -0.3440544009208679, -0.30703794956207275, -0.2700214982032776, -0.23300504684448242, -0.19598859548568726, -0.1589721441268921, -0.12195569276809692, -0.08493924140930176, -0.04792279005050659, -0.010906338691711426, 0.02611011266708374, 0.0631265640258789, 0.10014301538467407, 0.13715946674346924, 0.1741759181022644, 0.21119236946105957, 0.24820882081985474, 0.2852252721786499, 0.32224172353744507, 0.35925817489624023, 0.3962746262550354, 0.43329107761383057, 0.47030752897262573, 0.5073239803314209, 0.5443404316902161, 0.5813568830490112]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 19.0, 12.0, 23.0, 33.0, 33.0, 40.0, 38.0, 61.0, 68.0, 82.0, 66.0, 69.0, 69.0, 58.0, 47.0, 53.0, 35.0, 28.0, 33.0, 32.0, 28.0, 15.0, 10.0, 5.0, 5.0, 11.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3091663718223572, -0.29894956946372986, -0.28873276710510254, -0.2785159945487976, -0.2682991921901703, -0.25808238983154297, -0.24786558747291565, -0.23764878511428833, -0.227431982755661, -0.2172151803970337, -0.20699839293956757, -0.19678159058094025, -0.18656478822231293, -0.1763480007648468, -0.16613119840621948, -0.15591439604759216, -0.14569760859012604, -0.13548080623149872, -0.1252640187740326, -0.11504721641540527, -0.10483041405677795, -0.09461361914873123, -0.08439682424068451, -0.07418002188205719, -0.06396322697401047, -0.05374642834067345, -0.043529629707336426, -0.0333128347992897, -0.023096036165952682, -0.012879237532615662, -0.002662442624568939, 0.00755435973405838, 0.017771154642105103, 0.027987953275442123, 0.038204751908779144, 0.04842154681682587, 0.05863834545016289, 0.06885514408349991, 0.07907193899154663, 0.08928874135017395, 0.09950553625822067, 0.1097223311662674, 0.11993913352489471, 0.13015592098236084, 0.14037272334098816, 0.15058952569961548, 0.1608063280582428, 0.17102313041687012, 0.18123991787433624, 0.19145672023296356, 0.2016735076904297, 0.211890310049057, 0.22210711240768433, 0.23232391476631165, 0.24254070222377777, 0.2527574896812439, 0.2629742920398712, 0.27319109439849854, 0.28340789675712585, 0.2936246991157532, 0.3038414716720581, 0.3140582740306854, 0.32427507638931274, 0.33449187874794006, 0.3447086811065674]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 7.0, 3.0, 4.0, 3.0, 10.0, 18.0, 31.0, 67.0, 175.0, 423.0, 1387.0, 8071.0, 188932.0, 807506.0, 37264.0, 3344.0, 772.0, 287.0, 114.0, 57.0, 37.0, 19.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12017250061035156, -0.11522293090820312, -0.11027336120605469, -0.10532379150390625, -0.10037422180175781, -0.09542465209960938, -0.09047508239746094, -0.0855255126953125, -0.08057594299316406, -0.07562637329101562, -0.07067680358886719, -0.06572723388671875, -0.06077766418457031, -0.055828094482421875, -0.05087852478027344, -0.045928955078125, -0.04097938537597656, -0.036029815673828125, -0.031080245971679688, -0.02613067626953125, -0.021181106567382812, -0.016231536865234375, -0.011281967163085938, -0.0063323974609375, -0.0013828277587890625, 0.003566741943359375, 0.008516311645507812, 0.01346588134765625, 0.018415451049804688, 0.023365020751953125, 0.028314590454101562, 0.03326416015625, 0.03821372985839844, 0.043163299560546875, 0.04811286926269531, 0.05306243896484375, 0.05801200866699219, 0.06296157836914062, 0.06791114807128906, 0.0728607177734375, 0.07781028747558594, 0.08275985717773438, 0.08770942687988281, 0.09265899658203125, 0.09760856628417969, 0.10255813598632812, 0.10750770568847656, 0.112457275390625, 0.11740684509277344, 0.12235641479492188, 0.1273059844970703, 0.13225555419921875, 0.1372051239013672, 0.14215469360351562, 0.14710426330566406, 0.1520538330078125, 0.15700340270996094, 0.16195297241210938, 0.1669025421142578, 0.17185211181640625, 0.1768016815185547, 0.18175125122070312, 0.18670082092285156, 0.191650390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 16.0, 16.0, 18.0, 13.0, 22.0, 27.0, 31.0, 31.0, 31.0, 44.0, 45.0, 47.0, 55.0, 45.0, 62.0, 51.0, 50.0, 46.0, 42.0, 46.0, 32.0, 44.0, 30.0, 28.0, 22.0, 21.0, 14.0, 14.0, 14.0, 5.0, 4.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02093505859375, -0.020259857177734375, -0.01958465576171875, -0.018909454345703125, -0.0182342529296875, -0.017559051513671875, -0.01688385009765625, -0.016208648681640625, -0.015533447265625, -0.014858245849609375, -0.01418304443359375, -0.013507843017578125, -0.0128326416015625, -0.012157440185546875, -0.01148223876953125, -0.010807037353515625, -0.0101318359375, -0.009456634521484375, -0.00878143310546875, -0.008106231689453125, -0.0074310302734375, -0.006755828857421875, -0.00608062744140625, -0.005405426025390625, -0.004730224609375, -0.004055023193359375, -0.00337982177734375, -0.002704620361328125, -0.0020294189453125, -0.001354217529296875, -0.00067901611328125, -3.814697265625e-06, 0.00067138671875, 0.001346588134765625, 0.00202178955078125, 0.002696990966796875, 0.0033721923828125, 0.004047393798828125, 0.00472259521484375, 0.005397796630859375, 0.006072998046875, 0.006748199462890625, 0.00742340087890625, 0.008098602294921875, 0.0087738037109375, 0.009449005126953125, 0.01012420654296875, 0.010799407958984375, 0.011474609375, 0.012149810791015625, 0.01282501220703125, 0.013500213623046875, 0.0141754150390625, 0.014850616455078125, 0.01552581787109375, 0.016201019287109375, 0.016876220703125, 0.017551422119140625, 0.01822662353515625, 0.018901824951171875, 0.0195770263671875, 0.020252227783203125, 0.02092742919921875, 0.021602630615234375, 0.02227783203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 8.0, 11.0, 20.0, 29.0, 52.0, 108.0, 275.0, 759.0, 3246.0, 33888.0, 917189.0, 86252.0, 4946.0, 1076.0, 359.0, 152.0, 60.0, 44.0, 25.0, 6.0, 6.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1873779296875, -0.18211746215820312, -0.17685699462890625, -0.17159652709960938, -0.1663360595703125, -0.16107559204101562, -0.15581512451171875, -0.15055465698242188, -0.145294189453125, -0.14003372192382812, -0.13477325439453125, -0.12951278686523438, -0.1242523193359375, -0.11899185180664062, -0.11373138427734375, -0.10847091674804688, -0.10321044921875, -0.09794998168945312, -0.09268951416015625, -0.08742904663085938, -0.0821685791015625, -0.07690811157226562, -0.07164764404296875, -0.06638717651367188, -0.061126708984375, -0.055866241455078125, -0.05060577392578125, -0.045345306396484375, -0.0400848388671875, -0.034824371337890625, -0.02956390380859375, -0.024303436279296875, -0.01904296875, -0.013782501220703125, -0.00852203369140625, -0.003261566162109375, 0.0019989013671875, 0.007259368896484375, 0.01251983642578125, 0.017780303955078125, 0.023040771484375, 0.028301239013671875, 0.03356170654296875, 0.038822174072265625, 0.0440826416015625, 0.049343109130859375, 0.05460357666015625, 0.059864044189453125, 0.06512451171875, 0.07038497924804688, 0.07564544677734375, 0.08090591430664062, 0.0861663818359375, 0.09142684936523438, 0.09668731689453125, 0.10194778442382812, 0.107208251953125, 0.11246871948242188, 0.11772918701171875, 0.12298965454101562, 0.1282501220703125, 0.13351058959960938, 0.13877105712890625, 0.14403152465820312, 0.1492919921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 4.0, 7.0, 11.0, 11.0, 18.0, 19.0, 16.0, 19.0, 31.0, 26.0, 33.0, 51.0, 50.0, 64.0, 61.0, 52.0, 53.0, 67.0, 54.0, 46.0, 42.0, 39.0, 42.0, 32.0, 29.0, 22.0, 17.0, 15.0, 13.0, 11.0, 9.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08050537109375, -0.07775306701660156, -0.07500076293945312, -0.07224845886230469, -0.06949615478515625, -0.06674385070800781, -0.06399154663085938, -0.06123924255371094, -0.0584869384765625, -0.05573463439941406, -0.052982330322265625, -0.05023002624511719, -0.04747772216796875, -0.04472541809082031, -0.041973114013671875, -0.03922080993652344, -0.036468505859375, -0.03371620178222656, -0.030963897705078125, -0.028211593627929688, -0.02545928955078125, -0.022706985473632812, -0.019954681396484375, -0.017202377319335938, -0.0144500732421875, -0.011697769165039062, -0.008945465087890625, -0.0061931610107421875, -0.00344085693359375, -0.0006885528564453125, 0.002063751220703125, 0.0048160552978515625, 0.007568359375, 0.010320663452148438, 0.013072967529296875, 0.015825271606445312, 0.01857757568359375, 0.021329879760742188, 0.024082183837890625, 0.026834487915039062, 0.0295867919921875, 0.03233909606933594, 0.035091400146484375, 0.03784370422363281, 0.04059600830078125, 0.04334831237792969, 0.046100616455078125, 0.04885292053222656, 0.051605224609375, 0.05435752868652344, 0.057109832763671875, 0.05986213684082031, 0.06261444091796875, 0.06536674499511719, 0.06811904907226562, 0.07087135314941406, 0.0736236572265625, 0.07637596130371094, 0.07912826538085938, 0.08188056945800781, 0.08463287353515625, 0.08738517761230469, 0.09013748168945312, 0.09288978576660156, 0.09564208984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 23.0, 32.0, 50.0, 80.0, 159.0, 255.0, 593.0, 1395.0, 5247.0, 42428.0, 974317.0, 18636.0, 3337.0, 1034.0, 386.0, 224.0, 113.0, 73.0, 34.0, 24.0, 26.0, 14.0, 11.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.162353515625, -0.1573352813720703, -0.15231704711914062, -0.14729881286621094, -0.14228057861328125, -0.13726234436035156, -0.13224411010742188, -0.1272258758544922, -0.1222076416015625, -0.11718940734863281, -0.11217117309570312, -0.10715293884277344, -0.10213470458984375, -0.09711647033691406, -0.09209823608398438, -0.08708000183105469, -0.082061767578125, -0.07704353332519531, -0.07202529907226562, -0.06700706481933594, -0.06198883056640625, -0.05697059631347656, -0.051952362060546875, -0.04693412780761719, -0.0419158935546875, -0.03689765930175781, -0.031879425048828125, -0.026861190795898438, -0.02184295654296875, -0.016824722290039062, -0.011806488037109375, -0.0067882537841796875, -0.00177001953125, 0.0032482147216796875, 0.008266448974609375, 0.013284683227539062, 0.01830291748046875, 0.023321151733398438, 0.028339385986328125, 0.03335762023925781, 0.0383758544921875, 0.04339408874511719, 0.048412322998046875, 0.05343055725097656, 0.05844879150390625, 0.06346702575683594, 0.06848526000976562, 0.07350349426269531, 0.078521728515625, 0.08353996276855469, 0.08855819702148438, 0.09357643127441406, 0.09859466552734375, 0.10361289978027344, 0.10863113403320312, 0.11364936828613281, 0.1186676025390625, 0.12368583679199219, 0.12870407104492188, 0.13372230529785156, 0.13874053955078125, 0.14375877380371094, 0.14877700805664062, 0.1537952423095703, 0.1588134765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 6.0, 7.0, 8.0, 17.0, 23.0, 46.0, 129.0, 299.0, 269.0, 102.0, 26.0, 9.0, 13.0, 6.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7670135498046875e-05, -3.644730895757675e-05, -3.522448241710663e-05, -3.4001655876636505e-05, -3.277882933616638e-05, -3.155600279569626e-05, -3.0333176255226135e-05, -2.9110349714756012e-05, -2.788752317428589e-05, -2.6664696633815765e-05, -2.5441870093345642e-05, -2.421904355287552e-05, -2.2996217012405396e-05, -2.1773390471935272e-05, -2.055056393146515e-05, -1.9327737390995026e-05, -1.8104910850524902e-05, -1.688208431005478e-05, -1.5659257769584656e-05, -1.4436431229114532e-05, -1.321360468864441e-05, -1.1990778148174286e-05, -1.0767951607704163e-05, -9.54512506723404e-06, -8.322298526763916e-06, -7.099471986293793e-06, -5.8766454458236694e-06, -4.653818905353546e-06, -3.430992364883423e-06, -2.2081658244132996e-06, -9.853392839431763e-07, 2.3748725652694702e-07, 1.4603137969970703e-06, 2.6831403374671936e-06, 3.905966877937317e-06, 5.12879341840744e-06, 6.3516199588775635e-06, 7.574446499347687e-06, 8.79727303981781e-06, 1.0020099580287933e-05, 1.1242926120758057e-05, 1.246575266122818e-05, 1.3688579201698303e-05, 1.4911405742168427e-05, 1.613423228263855e-05, 1.7357058823108673e-05, 1.8579885363578796e-05, 1.980271190404892e-05, 2.1025538444519043e-05, 2.2248364984989166e-05, 2.347119152545929e-05, 2.4694018065929413e-05, 2.5916844606399536e-05, 2.713967114686966e-05, 2.8362497687339783e-05, 2.9585324227809906e-05, 3.080815076828003e-05, 3.203097730875015e-05, 3.3253803849220276e-05, 3.44766303896904e-05, 3.569945693016052e-05, 3.6922283470630646e-05, 3.814511001110077e-05, 3.936793655157089e-05, 4.0590763092041016e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 2.0, 5.0, 16.0, 21.0, 20.0, 35.0, 35.0, 63.0, 126.0, 236.0, 469.0, 1110.0, 2912.0, 10439.0, 100430.0, 887472.0, 35025.0, 6408.0, 2045.0, 816.0, 357.0, 178.0, 119.0, 48.0, 39.0, 23.0, 21.0, 12.0, 12.0, 15.0, 3.0, 5.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08465576171875, -0.0818643569946289, -0.07907295227050781, -0.07628154754638672, -0.07349014282226562, -0.07069873809814453, -0.06790733337402344, -0.06511592864990234, -0.06232452392578125, -0.059533119201660156, -0.05674171447753906, -0.05395030975341797, -0.051158905029296875, -0.04836750030517578, -0.04557609558105469, -0.042784690856933594, -0.0399932861328125, -0.037201881408691406, -0.03441047668457031, -0.03161907196044922, -0.028827667236328125, -0.02603626251220703, -0.023244857788085938, -0.020453453063964844, -0.01766204833984375, -0.014870643615722656, -0.012079238891601562, -0.009287834167480469, -0.006496429443359375, -0.0037050247192382812, -0.0009136199951171875, 0.0018777847290039062, 0.004669189453125, 0.007460594177246094, 0.010251998901367188, 0.013043403625488281, 0.015834808349609375, 0.01862621307373047, 0.021417617797851562, 0.024209022521972656, 0.02700042724609375, 0.029791831970214844, 0.03258323669433594, 0.03537464141845703, 0.038166046142578125, 0.04095745086669922, 0.04374885559082031, 0.046540260314941406, 0.0493316650390625, 0.052123069763183594, 0.05491447448730469, 0.05770587921142578, 0.060497283935546875, 0.06328868865966797, 0.06608009338378906, 0.06887149810791016, 0.07166290283203125, 0.07445430755615234, 0.07724571228027344, 0.08003711700439453, 0.08282852172851562, 0.08561992645263672, 0.08841133117675781, 0.0912027359008789, 0.093994140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 8.0, 12.0, 12.0, 21.0, 42.0, 72.0, 84.0, 119.0, 147.0, 136.0, 99.0, 61.0, 54.0, 23.0, 23.0, 14.0, 11.0, 8.0, 7.0, 2.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.058013916015625, -0.05623626708984375, -0.0544586181640625, -0.05268096923828125, -0.0509033203125, -0.04912567138671875, -0.0473480224609375, -0.04557037353515625, -0.043792724609375, -0.04201507568359375, -0.0402374267578125, -0.03845977783203125, -0.03668212890625, -0.03490447998046875, -0.0331268310546875, -0.03134918212890625, -0.029571533203125, -0.02779388427734375, -0.0260162353515625, -0.02423858642578125, -0.0224609375, -0.02068328857421875, -0.0189056396484375, -0.01712799072265625, -0.015350341796875, -0.01357269287109375, -0.0117950439453125, -0.01001739501953125, -0.00823974609375, -0.00646209716796875, -0.0046844482421875, -0.00290679931640625, -0.001129150390625, 0.00064849853515625, 0.0024261474609375, 0.00420379638671875, 0.0059814453125, 0.00775909423828125, 0.0095367431640625, 0.01131439208984375, 0.013092041015625, 0.01486968994140625, 0.0166473388671875, 0.01842498779296875, 0.02020263671875, 0.02198028564453125, 0.0237579345703125, 0.02553558349609375, 0.027313232421875, 0.02909088134765625, 0.0308685302734375, 0.03264617919921875, 0.034423828125, 0.03620147705078125, 0.0379791259765625, 0.03975677490234375, 0.041534423828125, 0.04331207275390625, 0.0450897216796875, 0.04686737060546875, 0.04864501953125, 0.05042266845703125, 0.0522003173828125, 0.05397796630859375, 0.055755615234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 4.0, 4.0, 15.0, 36.0, 199.0, 447.0, 180.0, 65.0, 26.0, 16.0, 6.0, 7.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9484210014343262, -0.8828245997428894, -0.8172281980514526, -0.7516317963600159, -0.6860353946685791, -0.6204389929771423, -0.5548425912857056, -0.4892461895942688, -0.42364978790283203, -0.35805338621139526, -0.2924569845199585, -0.22686058282852173, -0.16126418113708496, -0.0956677794456482, -0.030071377754211426, 0.03552502393722534, 0.10112142562866211, 0.16671782732009888, 0.23231422901153564, 0.2979106307029724, 0.3635070323944092, 0.42910343408584595, 0.4946998357772827, 0.5602962374687195, 0.6258926391601562, 0.691489040851593, 0.7570854425430298, 0.8226818442344666, 0.8882782459259033, 0.9538746476173401, 1.0194710493087769, 1.0850675106048584, 1.1506636142730713, 1.2162599563598633, 1.2818564176559448, 1.3474528789520264, 1.4130492210388184, 1.4786455631256104, 1.544242024421692, 1.6098384857177734, 1.6754348278045654, 1.7410311698913574, 1.806627631187439, 1.8722240924835205, 1.9378204345703125, 2.0034167766571045, 2.0690131187438965, 2.1346096992492676, 2.2002060413360596, 2.2658023834228516, 2.3313989639282227, 2.3969953060150146, 2.4625916481018066, 2.5281879901885986, 2.5937843322753906, 2.6593809127807617, 2.7249772548675537, 2.7905735969543457, 2.856170177459717, 2.921766519546509, 2.987362861633301, 3.0529592037200928, 3.1185555458068848, 3.184152126312256, 3.249748468399048]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 4.0, 14.0, 11.0, 14.0, 7.0, 17.0, 12.0, 32.0, 35.0, 32.0, 31.0, 35.0, 34.0, 46.0, 40.0, 68.0, 63.0, 50.0, 56.0, 49.0, 45.0, 32.0, 25.0, 26.0, 33.0, 30.0, 22.0, 20.0, 15.0, 9.0, 14.0, 11.0, 17.0, 5.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3813024163246155, -0.36928194761276245, -0.3572615087032318, -0.3452410399913788, -0.33322060108184814, -0.3212001323699951, -0.3091796636581421, -0.29715919494628906, -0.2851387560367584, -0.2731182873249054, -0.26109784841537476, -0.24907737970352173, -0.2370569258928299, -0.22503647208213806, -0.21301600337028503, -0.2009955495595932, -0.18897509574890137, -0.17695464193820953, -0.1649341881275177, -0.15291371941566467, -0.14089326560497284, -0.128872811794281, -0.11685235053300858, -0.10483188927173615, -0.09281143546104431, -0.08079098165035248, -0.06877052038908005, -0.056750062853097916, -0.044729605317115784, -0.03270914778113365, -0.02068869024515152, -0.00866822898387909, 0.003352224826812744, 0.015372682362794876, 0.027393139898777008, 0.03941359743475914, 0.05143405497074127, 0.0634545087814331, 0.07547497004270554, 0.08749543130397797, 0.0995158851146698, 0.11153633892536163, 0.12355680018663406, 0.1355772614479065, 0.14759771525859833, 0.15961816906929016, 0.1716386377811432, 0.18365909159183502, 0.19567954540252686, 0.2076999992132187, 0.21972045302391052, 0.23174092173576355, 0.24376137554645538, 0.2557818293571472, 0.26780229806900024, 0.27982276678085327, 0.2918432056903839, 0.30386367440223694, 0.3158841133117676, 0.3279045820236206, 0.33992505073547363, 0.3519454896450043, 0.3639659583568573, 0.37598639726638794, 0.38800686597824097]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 9.0, 21.0, 42.0, 69.0, 133.0, 387.0, 3899.0, 4137705.0, 50829.0, 785.0, 180.0, 94.0, 49.0, 26.0, 21.0, 10.0, 9.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.10926532745361328, -0.10067176818847656, -0.09207820892333984, -0.08348464965820312, -0.0748910903930664, -0.06629753112792969, -0.05770397186279297, -0.04911041259765625, -0.04051685333251953, -0.03192329406738281, -0.023329734802246094, -0.014736175537109375, -0.006142616271972656, 0.0024509429931640625, 0.011044502258300781, 0.0196380615234375, 0.02823162078857422, 0.03682518005371094, 0.045418739318847656, 0.054012298583984375, 0.0626058578491211, 0.07119941711425781, 0.07979297637939453, 0.08838653564453125, 0.09698009490966797, 0.10557365417480469, 0.1141672134399414, 0.12276077270507812, 0.13135433197021484, 0.13994789123535156, 0.14854145050048828, 0.157135009765625, 0.16572856903076172, 0.17432212829589844, 0.18291568756103516, 0.19150924682617188, 0.2001028060913086, 0.2086963653564453, 0.21728992462158203, 0.22588348388671875, 0.23447704315185547, 0.2430706024169922, 0.2516641616821289, 0.2602577209472656, 0.26885128021240234, 0.27744483947753906, 0.2860383987426758, 0.2946319580078125, 0.3032255172729492, 0.31181907653808594, 0.32041263580322266, 0.3290061950683594, 0.3375997543334961, 0.3461933135986328, 0.35478687286376953, 0.36338043212890625, 0.37197399139404297, 0.3805675506591797, 0.3891611099243164, 0.3977546691894531, 0.40634822845458984, 0.41494178771972656, 0.4235353469848633, 0.43212890625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 2.0, 9.0, 10.0, 12.0, 24.0, 22.0, 24.0, 32.0, 41.0, 38.0, 44.0, 48.0, 38.0, 59.0, 56.0, 56.0, 50.0, 51.0, 53.0, 43.0, 44.0, 33.0, 39.0, 28.0, 29.0, 12.0, 19.0, 18.0, 10.0, 16.0, 5.0, 9.0, 6.0, 3.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179290771484375, -0.017261505126953125, -0.01659393310546875, -0.015926361083984375, -0.0152587890625, -0.014591217041015625, -0.01392364501953125, -0.013256072998046875, -0.0125885009765625, -0.011920928955078125, -0.01125335693359375, -0.010585784912109375, -0.009918212890625, -0.009250640869140625, -0.00858306884765625, -0.007915496826171875, -0.0072479248046875, -0.006580352783203125, -0.00591278076171875, -0.005245208740234375, -0.00457763671875, -0.003910064697265625, -0.00324249267578125, -0.002574920654296875, -0.0019073486328125, -0.001239776611328125, -0.00057220458984375, 9.5367431640625e-05, 0.000762939453125, 0.001430511474609375, 0.00209808349609375, 0.002765655517578125, 0.0034332275390625, 0.004100799560546875, 0.00476837158203125, 0.005435943603515625, 0.006103515625, 0.006771087646484375, 0.00743865966796875, 0.008106231689453125, 0.0087738037109375, 0.009441375732421875, 0.01010894775390625, 0.010776519775390625, 0.011444091796875, 0.012111663818359375, 0.01277923583984375, 0.013446807861328125, 0.0141143798828125, 0.014781951904296875, 0.01544952392578125, 0.016117095947265625, 0.01678466796875, 0.017452239990234375, 0.01811981201171875, 0.018787384033203125, 0.0194549560546875, 0.020122528076171875, 0.02079010009765625, 0.021457672119140625, 0.022125244140625, 0.022792816162109375, 0.02346038818359375, 0.024127960205078125, 0.0247955322265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 3.0, 6.0, 11.0, 8.0, 18.0, 14.0, 29.0, 30.0, 32.0, 45.0, 43.0, 81.0, 129.0, 276.0, 591.0, 2870.0, 115048.0, 4055913.0, 16979.0, 1278.0, 402.0, 166.0, 91.0, 53.0, 30.0, 27.0, 19.0, 20.0, 11.0, 9.0, 10.0, 7.0, 10.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1700439453125, -0.16332054138183594, -0.15659713745117188, -0.1498737335205078, -0.14315032958984375, -0.1364269256591797, -0.12970352172851562, -0.12298011779785156, -0.1162567138671875, -0.10953330993652344, -0.10280990600585938, -0.09608650207519531, -0.08936309814453125, -0.08263969421386719, -0.07591629028320312, -0.06919288635253906, -0.062469482421875, -0.05574607849121094, -0.049022674560546875, -0.04229927062988281, -0.03557586669921875, -0.028852462768554688, -0.022129058837890625, -0.015405654907226562, -0.0086822509765625, -0.0019588470458984375, 0.004764556884765625, 0.011487960815429688, 0.01821136474609375, 0.024934768676757812, 0.031658172607421875, 0.03838157653808594, 0.04510498046875, 0.05182838439941406, 0.058551788330078125, 0.06527519226074219, 0.07199859619140625, 0.07872200012207031, 0.08544540405273438, 0.09216880798339844, 0.0988922119140625, 0.10561561584472656, 0.11233901977539062, 0.11906242370605469, 0.12578582763671875, 0.1325092315673828, 0.13923263549804688, 0.14595603942871094, 0.152679443359375, 0.15940284729003906, 0.16612625122070312, 0.1728496551513672, 0.17957305908203125, 0.1862964630126953, 0.19301986694335938, 0.19974327087402344, 0.2064666748046875, 0.21319007873535156, 0.21991348266601562, 0.2266368865966797, 0.23336029052734375, 0.2400836944580078, 0.24680709838867188, 0.25353050231933594, 0.26025390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 12.0, 15.0, 33.0, 61.0, 91.0, 295.0, 994.0, 1593.0, 552.0, 207.0, 120.0, 40.0, 31.0, 19.0, 6.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.18310546875, -0.17939424514770508, -0.17568302154541016, -0.17197179794311523, -0.1682605743408203, -0.1645493507385254, -0.16083812713623047, -0.15712690353393555, -0.15341567993164062, -0.1497044563293457, -0.14599323272705078, -0.14228200912475586, -0.13857078552246094, -0.13485956192016602, -0.1311483383178711, -0.12743711471557617, -0.12372589111328125, -0.12001466751098633, -0.1163034439086914, -0.11259222030639648, -0.10888099670410156, -0.10516977310180664, -0.10145854949951172, -0.0977473258972168, -0.09403610229492188, -0.09032487869262695, -0.08661365509033203, -0.08290243148803711, -0.07919120788574219, -0.07547998428344727, -0.07176876068115234, -0.06805753707885742, -0.0643463134765625, -0.06063508987426758, -0.056923866271972656, -0.053212642669677734, -0.04950141906738281, -0.04579019546508789, -0.04207897186279297, -0.03836774826049805, -0.034656524658203125, -0.030945301055908203, -0.02723407745361328, -0.02352285385131836, -0.019811630249023438, -0.016100406646728516, -0.012389183044433594, -0.008677959442138672, -0.00496673583984375, -0.0012555122375488281, 0.0024557113647460938, 0.006166934967041016, 0.009878158569335938, 0.01358938217163086, 0.01730060577392578, 0.021011829376220703, 0.024723052978515625, 0.028434276580810547, 0.03214550018310547, 0.03585672378540039, 0.03956794738769531, 0.043279170989990234, 0.046990394592285156, 0.05070161819458008, 0.054412841796875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 5.0, 13.0, 15.0, 20.0, 27.0, 44.0, 40.0, 79.0, 94.0, 154.0, 165.0, 123.0, 78.0, 43.0, 28.0, 17.0, 10.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0225791931152344, -0.9936679601669312, -0.9647567868232727, -0.9358456134796143, -0.906934380531311, -0.8780231475830078, -0.8491119742393494, -0.8202008008956909, -0.7912895679473877, -0.7623783349990845, -0.733467161655426, -0.7045559883117676, -0.6756447553634644, -0.6467335224151611, -0.6178223490715027, -0.5889111757278442, -0.559999942779541, -0.5310887098312378, -0.5021775364875793, -0.4732663333415985, -0.4443551301956177, -0.41544392704963684, -0.386532723903656, -0.35762152075767517, -0.32871031761169434, -0.2997991144657135, -0.27088791131973267, -0.24197670817375183, -0.213065505027771, -0.18415430188179016, -0.15524309873580933, -0.1263318955898285, -0.09742075204849243, -0.0685095489025116, -0.03959834575653076, -0.010687142610549927, 0.018224060535430908, 0.04713526368141174, 0.07604646682739258, 0.10495766997337341, 0.13386887311935425, 0.16278007626533508, 0.19169127941131592, 0.22060248255729675, 0.2495136857032776, 0.2784248888492584, 0.30733609199523926, 0.3362472951412201, 0.3651584982872009, 0.39406970143318176, 0.4229809045791626, 0.45189210772514343, 0.48080331087112427, 0.5097144842147827, 0.5386257171630859, 0.5675369501113892, 0.5964481234550476, 0.625359296798706, 0.6542705297470093, 0.6831817626953125, 0.712092936038971, 0.7410041093826294, 0.7699153423309326, 0.7988265752792358, 0.8277377486228943]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 6.0, 6.0, 5.0, 9.0, 11.0, 9.0, 17.0, 19.0, 23.0, 32.0, 24.0, 34.0, 17.0, 35.0, 45.0, 40.0, 36.0, 45.0, 45.0, 36.0, 38.0, 56.0, 36.0, 42.0, 34.0, 28.0, 35.0, 35.0, 25.0, 22.0, 23.0, 22.0, 16.0, 9.0, 22.0, 12.0, 11.0, 9.0, 4.0, 5.0, 6.0, 3.0, 1.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2651612162590027, -0.2543907165527344, -0.24362020194530487, -0.23284968733787537, -0.22207918763160706, -0.21130867302417755, -0.20053815841674805, -0.18976765871047974, -0.17899714410305023, -0.16822662949562073, -0.15745612978935242, -0.1466856151819229, -0.1359151005744934, -0.1251446008682251, -0.1143740862607956, -0.10360357910394669, -0.09283307194709778, -0.08206256479024887, -0.07129205763339996, -0.06052154302597046, -0.04975103586912155, -0.038980528712272644, -0.02821001410484314, -0.017439506947994232, -0.006668999791145325, 0.004101509228348732, 0.014872018247842789, 0.025642529129981995, 0.0364130362868309, 0.04718354344367981, 0.057954058051109314, 0.06872456520795822, 0.07949507236480713, 0.09026557952165604, 0.10103608667850494, 0.11180660128593445, 0.12257710844278336, 0.13334761559963226, 0.14411813020706177, 0.15488862991333008, 0.16565914452075958, 0.1764296591281891, 0.1872001588344574, 0.1979706734418869, 0.2087411880493164, 0.21951168775558472, 0.23028220236301422, 0.24105271697044373, 0.25182321667671204, 0.26259371638298035, 0.27336424589157104, 0.28413474559783936, 0.29490524530410767, 0.305675745010376, 0.3164462745189667, 0.327216774225235, 0.3379873037338257, 0.348757803440094, 0.3595283329486847, 0.370298832654953, 0.3810693323612213, 0.391839861869812, 0.4026103615760803, 0.41338086128234863, 0.42415136098861694]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 12.0, 18.0, 15.0, 37.0, 59.0, 82.0, 107.0, 154.0, 252.0, 378.0, 617.0, 944.0, 1475.0, 2532.0, 4414.0, 8289.0, 17041.0, 37531.0, 89718.0, 211053.0, 317514.0, 200956.0, 84850.0, 35221.0, 16491.0, 8141.0, 4235.0, 2349.0, 1481.0, 850.0, 590.0, 387.0, 231.0, 165.0, 113.0, 94.0, 41.0, 24.0, 19.0, 13.0, 20.0, 9.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.053924560546875, -0.05244588851928711, -0.05096721649169922, -0.04948854446411133, -0.04800987243652344, -0.04653120040893555, -0.045052528381347656, -0.043573856353759766, -0.042095184326171875, -0.040616512298583984, -0.039137840270996094, -0.0376591682434082, -0.03618049621582031, -0.03470182418823242, -0.03322315216064453, -0.03174448013305664, -0.03026580810546875, -0.02878713607788086, -0.02730846405029297, -0.025829792022705078, -0.024351119995117188, -0.022872447967529297, -0.021393775939941406, -0.019915103912353516, -0.018436431884765625, -0.016957759857177734, -0.015479087829589844, -0.014000415802001953, -0.012521743774414062, -0.011043071746826172, -0.009564399719238281, -0.00808572769165039, -0.0066070556640625, -0.005128383636474609, -0.0036497116088867188, -0.002171039581298828, -0.0006923675537109375, 0.0007863044738769531, 0.0022649765014648438, 0.0037436485290527344, 0.005222320556640625, 0.006700992584228516, 0.008179664611816406, 0.009658336639404297, 0.011137008666992188, 0.012615680694580078, 0.014094352722167969, 0.01557302474975586, 0.01705169677734375, 0.01853036880493164, 0.02000904083251953, 0.021487712860107422, 0.022966384887695312, 0.024445056915283203, 0.025923728942871094, 0.027402400970458984, 0.028881072998046875, 0.030359745025634766, 0.031838417053222656, 0.03331708908081055, 0.03479576110839844, 0.03627443313598633, 0.03775310516357422, 0.03923177719116211, 0.04071044921875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 2.0, 4.0, 5.0, 5.0, 10.0, 6.0, 15.0, 18.0, 25.0, 25.0, 31.0, 37.0, 33.0, 40.0, 43.0, 36.0, 44.0, 45.0, 45.0, 50.0, 45.0, 45.0, 38.0, 36.0, 43.0, 35.0, 31.0, 28.0, 31.0, 23.0, 25.0, 21.0, 14.0, 15.0, 10.0, 10.0, 7.0, 10.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0190277099609375, -0.018321514129638672, -0.017615318298339844, -0.016909122467041016, -0.016202926635742188, -0.01549673080444336, -0.014790534973144531, -0.014084339141845703, -0.013378143310546875, -0.012671947479248047, -0.011965751647949219, -0.01125955581665039, -0.010553359985351562, -0.009847164154052734, -0.009140968322753906, -0.008434772491455078, -0.00772857666015625, -0.007022380828857422, -0.006316184997558594, -0.005609989166259766, -0.0049037933349609375, -0.004197597503662109, -0.0034914016723632812, -0.002785205841064453, -0.002079010009765625, -0.0013728141784667969, -0.0006666183471679688, 3.9577484130859375e-05, 0.0007457733154296875, 0.0014519691467285156, 0.0021581649780273438, 0.002864360809326172, 0.003570556640625, 0.004276752471923828, 0.004982948303222656, 0.005689144134521484, 0.0063953399658203125, 0.007101535797119141, 0.007807731628417969, 0.008513927459716797, 0.009220123291015625, 0.009926319122314453, 0.010632514953613281, 0.01133871078491211, 0.012044906616210938, 0.012751102447509766, 0.013457298278808594, 0.014163494110107422, 0.01486968994140625, 0.015575885772705078, 0.016282081604003906, 0.016988277435302734, 0.017694473266601562, 0.01840066909790039, 0.01910686492919922, 0.019813060760498047, 0.020519256591796875, 0.021225452423095703, 0.02193164825439453, 0.02263784408569336, 0.023344039916992188, 0.024050235748291016, 0.024756431579589844, 0.025462627410888672, 0.0261688232421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 10.0, 13.0, 26.0, 41.0, 55.0, 123.0, 218.0, 433.0, 848.0, 1807.0, 4500.0, 14436.0, 106615.0, 830681.0, 69368.0, 11991.0, 4008.0, 1659.0, 764.0, 412.0, 222.0, 120.0, 62.0, 33.0, 31.0, 17.0, 13.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.18212890625, -0.1766796112060547, -0.17123031616210938, -0.16578102111816406, -0.16033172607421875, -0.15488243103027344, -0.14943313598632812, -0.1439838409423828, -0.1385345458984375, -0.1330852508544922, -0.12763595581054688, -0.12218666076660156, -0.11673736572265625, -0.11128807067871094, -0.10583877563476562, -0.10038948059082031, -0.094940185546875, -0.08949089050292969, -0.08404159545898438, -0.07859230041503906, -0.07314300537109375, -0.06769371032714844, -0.062244415283203125, -0.05679512023925781, -0.0513458251953125, -0.04589653015136719, -0.040447235107421875, -0.03499794006347656, -0.02954864501953125, -0.024099349975585938, -0.018650054931640625, -0.013200759887695312, -0.00775146484375, -0.0023021697998046875, 0.003147125244140625, 0.008596420288085938, 0.01404571533203125, 0.019495010375976562, 0.024944305419921875, 0.030393600463867188, 0.0358428955078125, 0.04129219055175781, 0.046741485595703125, 0.05219078063964844, 0.05764007568359375, 0.06308937072753906, 0.06853866577148438, 0.07398796081542969, 0.079437255859375, 0.08488655090332031, 0.09033584594726562, 0.09578514099121094, 0.10123443603515625, 0.10668373107910156, 0.11213302612304688, 0.11758232116699219, 0.1230316162109375, 0.1284809112548828, 0.13393020629882812, 0.13937950134277344, 0.14482879638671875, 0.15027809143066406, 0.15572738647460938, 0.1611766815185547, 0.1666259765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 9.0, 6.0, 6.0, 10.0, 7.0, 13.0, 19.0, 16.0, 19.0, 22.0, 35.0, 32.0, 48.0, 46.0, 69.0, 57.0, 56.0, 50.0, 55.0, 73.0, 57.0, 52.0, 47.0, 36.0, 29.0, 30.0, 19.0, 19.0, 13.0, 11.0, 7.0, 9.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1279296875, -0.12394332885742188, -0.11995697021484375, -0.11597061157226562, -0.1119842529296875, -0.10799789428710938, -0.10401153564453125, -0.10002517700195312, -0.096038818359375, -0.09205245971679688, -0.08806610107421875, -0.08407974243164062, -0.0800933837890625, -0.07610702514648438, -0.07212066650390625, -0.06813430786132812, -0.06414794921875, -0.060161590576171875, -0.05617523193359375, -0.052188873291015625, -0.0482025146484375, -0.044216156005859375, -0.04022979736328125, -0.036243438720703125, -0.032257080078125, -0.028270721435546875, -0.02428436279296875, -0.020298004150390625, -0.0163116455078125, -0.012325286865234375, -0.00833892822265625, -0.004352569580078125, -0.0003662109375, 0.003620147705078125, 0.00760650634765625, 0.011592864990234375, 0.0155792236328125, 0.019565582275390625, 0.02355194091796875, 0.027538299560546875, 0.031524658203125, 0.035511016845703125, 0.03949737548828125, 0.043483734130859375, 0.0474700927734375, 0.051456451416015625, 0.05544281005859375, 0.059429168701171875, 0.06341552734375, 0.06740188598632812, 0.07138824462890625, 0.07537460327148438, 0.0793609619140625, 0.08334732055664062, 0.08733367919921875, 0.09132003784179688, 0.095306396484375, 0.09929275512695312, 0.10327911376953125, 0.10726547241210938, 0.1112518310546875, 0.11523818969726562, 0.11922454833984375, 0.12321090698242188, 0.127197265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 10.0, 16.0, 18.0, 23.0, 29.0, 54.0, 69.0, 71.0, 113.0, 199.0, 333.0, 417.0, 774.0, 1213.0, 1980.0, 3424.0, 6056.0, 12205.0, 28679.0, 625234.0, 315374.0, 26465.0, 11481.0, 5982.0, 3265.0, 1847.0, 1167.0, 677.0, 451.0, 300.0, 200.0, 125.0, 79.0, 61.0, 32.0, 24.0, 27.0, 13.0, 16.0, 12.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.11785888671875, -0.11392498016357422, -0.10999107360839844, -0.10605716705322266, -0.10212326049804688, -0.0981893539428711, -0.09425544738769531, -0.09032154083251953, -0.08638763427734375, -0.08245372772216797, -0.07851982116699219, -0.0745859146118164, -0.07065200805664062, -0.06671810150146484, -0.06278419494628906, -0.05885028839111328, -0.0549163818359375, -0.05098247528076172, -0.04704856872558594, -0.043114662170410156, -0.039180755615234375, -0.035246849060058594, -0.03131294250488281, -0.02737903594970703, -0.02344512939453125, -0.01951122283935547, -0.015577316284179688, -0.011643409729003906, -0.007709503173828125, -0.0037755966186523438, 0.0001583099365234375, 0.004092216491699219, 0.008026123046875, 0.011960029602050781, 0.015893936157226562, 0.019827842712402344, 0.023761749267578125, 0.027695655822753906, 0.03162956237792969, 0.03556346893310547, 0.03949737548828125, 0.04343128204345703, 0.04736518859863281, 0.051299095153808594, 0.055233001708984375, 0.059166908264160156, 0.06310081481933594, 0.06703472137451172, 0.0709686279296875, 0.07490253448486328, 0.07883644104003906, 0.08277034759521484, 0.08670425415039062, 0.0906381607055664, 0.09457206726074219, 0.09850597381591797, 0.10243988037109375, 0.10637378692626953, 0.11030769348144531, 0.1142416000366211, 0.11817550659179688, 0.12210941314697266, 0.12604331970214844, 0.12997722625732422, 0.1339111328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 4.0, 5.0, 11.0, 9.0, 13.0, 27.0, 53.0, 606.0, 172.0, 23.0, 9.0, 17.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.00022208690643310547, -0.00021722819656133652, -0.00021236948668956757, -0.00020751077681779861, -0.00020265206694602966, -0.0001977933570742607, -0.00019293464720249176, -0.0001880759373307228, -0.00018321722745895386, -0.0001783585175871849, -0.00017349980771541595, -0.000168641097843647, -0.00016378238797187805, -0.0001589236781001091, -0.00015406496822834015, -0.0001492062583565712, -0.00014434754848480225, -0.0001394888386130333, -0.00013463012874126434, -0.0001297714188694954, -0.00012491270899772644, -0.00012005399912595749, -0.00011519528925418854, -0.00011033657938241959, -0.00010547786951065063, -0.00010061915963888168, -9.576044976711273e-05, -9.090173989534378e-05, -8.604303002357483e-05, -8.118432015180588e-05, -7.632561028003693e-05, -7.146690040826797e-05, -6.660819053649902e-05, -6.174948066473007e-05, -5.689077079296112e-05, -5.203206092119217e-05, -4.717335104942322e-05, -4.2314641177654266e-05, -3.7455931305885315e-05, -3.2597221434116364e-05, -2.7738511562347412e-05, -2.287980169057846e-05, -1.802109181880951e-05, -1.3162381947040558e-05, -8.303672075271606e-06, -3.444962203502655e-06, 1.4137476682662964e-06, 6.272457540035248e-06, 1.11311674118042e-05, 1.598987728357315e-05, 2.0848587155342102e-05, 2.5707297027111053e-05, 3.0566006898880005e-05, 3.5424716770648956e-05, 4.028342664241791e-05, 4.514213651418686e-05, 5.000084638595581e-05, 5.485955625772476e-05, 5.971826612949371e-05, 6.457697600126266e-05, 6.943568587303162e-05, 7.429439574480057e-05, 7.915310561656952e-05, 8.401181548833847e-05, 8.887052536010742e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 22.0, 22.0, 37.0, 62.0, 97.0, 191.0, 356.0, 784.0, 1944.0, 5353.0, 17997.0, 267719.0, 723757.0, 20315.0, 6008.0, 2130.0, 870.0, 388.0, 200.0, 91.0, 71.0, 48.0, 20.0, 11.0, 13.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.235870361328125, -0.22894287109375, -0.222015380859375, -0.215087890625, -0.208160400390625, -0.20123291015625, -0.194305419921875, -0.1873779296875, -0.180450439453125, -0.17352294921875, -0.166595458984375, -0.15966796875, -0.152740478515625, -0.14581298828125, -0.138885498046875, -0.1319580078125, -0.125030517578125, -0.11810302734375, -0.111175537109375, -0.104248046875, -0.097320556640625, -0.09039306640625, -0.083465576171875, -0.0765380859375, -0.069610595703125, -0.06268310546875, -0.055755615234375, -0.048828125, -0.041900634765625, -0.03497314453125, -0.028045654296875, -0.0211181640625, -0.014190673828125, -0.00726318359375, -0.000335693359375, 0.006591796875, 0.013519287109375, 0.02044677734375, 0.027374267578125, 0.0343017578125, 0.041229248046875, 0.04815673828125, 0.055084228515625, 0.06201171875, 0.068939208984375, 0.07586669921875, 0.082794189453125, 0.0897216796875, 0.096649169921875, 0.10357666015625, 0.110504150390625, 0.117431640625, 0.124359130859375, 0.13128662109375, 0.138214111328125, 0.1451416015625, 0.152069091796875, 0.15899658203125, 0.165924072265625, 0.1728515625, 0.179779052734375, 0.18670654296875, 0.193634033203125, 0.2005615234375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 11.0, 6.0, 7.0, 6.0, 7.0, 16.0, 21.0, 35.0, 204.0, 410.0, 169.0, 33.0, 16.0, 8.0, 8.0, 18.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2030029296875, -0.19609832763671875, -0.1891937255859375, -0.18228912353515625, -0.175384521484375, -0.16847991943359375, -0.1615753173828125, -0.15467071533203125, -0.14776611328125, -0.14086151123046875, -0.1339569091796875, -0.12705230712890625, -0.120147705078125, -0.11324310302734375, -0.1063385009765625, -0.09943389892578125, -0.092529296875, -0.08562469482421875, -0.0787200927734375, -0.07181549072265625, -0.064910888671875, -0.05800628662109375, -0.0511016845703125, -0.04419708251953125, -0.03729248046875, -0.03038787841796875, -0.0234832763671875, -0.01657867431640625, -0.009674072265625, -0.00276947021484375, 0.0041351318359375, 0.01103973388671875, 0.0179443359375, 0.02484893798828125, 0.0317535400390625, 0.03865814208984375, 0.045562744140625, 0.05246734619140625, 0.0593719482421875, 0.06627655029296875, 0.07318115234375, 0.08008575439453125, 0.0869903564453125, 0.09389495849609375, 0.100799560546875, 0.10770416259765625, 0.1146087646484375, 0.12151336669921875, 0.12841796875, 0.13532257080078125, 0.1422271728515625, 0.14913177490234375, 0.156036376953125, 0.16294097900390625, 0.1698455810546875, 0.17675018310546875, 0.18365478515625, 0.19055938720703125, 0.1974639892578125, 0.20436859130859375, 0.211273193359375, 0.21817779541015625, 0.2250823974609375, 0.23198699951171875, 0.2388916015625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 10.0, 21.0, 54.0, 124.0, 197.0, 306.0, 150.0, 64.0, 34.0, 16.0, 8.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6584229469299316, -2.560546636581421, -2.46267032623291, -2.3647940158843994, -2.2669177055358887, -2.169041395187378, -2.071165084838867, -1.9732887744903564, -1.8754124641418457, -1.777536153793335, -1.6796598434448242, -1.5817835330963135, -1.4839072227478027, -1.386030912399292, -1.2881546020507812, -1.1902782917022705, -1.0924019813537598, -0.994525671005249, -0.8966493606567383, -0.7987730503082275, -0.7008967399597168, -0.603020429611206, -0.5051441192626953, -0.40726780891418457, -0.30939149856567383, -0.21151518821716309, -0.11363887786865234, -0.0157625675201416, 0.08211374282836914, 0.17999005317687988, 0.2778663635253906, 0.37574267387390137, 0.4736189842224121, 0.5714952945709229, 0.6693716049194336, 0.7672479152679443, 0.8651242256164551, 0.9630005359649658, 1.0608768463134766, 1.1587531566619873, 1.256629467010498, 1.3545057773590088, 1.4523820877075195, 1.5502583980560303, 1.648134708404541, 1.7460110187530518, 1.8438873291015625, 1.9417636394500732, 2.039639949798584, 2.1375162601470947, 2.2353925704956055, 2.333268880844116, 2.431145191192627, 2.5290215015411377, 2.6268978118896484, 2.724774122238159, 2.82265043258667, 2.9205267429351807, 3.0184030532836914, 3.116279363632202, 3.214155673980713, 3.3120319843292236, 3.4099082946777344, 3.507784605026245, 3.605660915374756]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 1.0, 5.0, 9.0, 10.0, 8.0, 10.0, 11.0, 16.0, 9.0, 20.0, 17.0, 26.0, 20.0, 30.0, 25.0, 33.0, 34.0, 42.0, 35.0, 49.0, 63.0, 70.0, 61.0, 46.0, 39.0, 31.0, 48.0, 29.0, 23.0, 24.0, 20.0, 18.0, 12.0, 14.0, 14.0, 10.0, 9.0, 8.0, 14.0, 6.0, 6.0, 2.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.7551835179328918, -0.7338804602622986, -0.7125774025917053, -0.6912743449211121, -0.6699712872505188, -0.6486682295799255, -0.6273651719093323, -0.606062114238739, -0.5847590565681458, -0.5634559988975525, -0.5421529412269592, -0.520849883556366, -0.4995468258857727, -0.47824376821517944, -0.4569407105445862, -0.4356376528739929, -0.41433459520339966, -0.3930315375328064, -0.37172847986221313, -0.3504254221916199, -0.3291223645210266, -0.30781930685043335, -0.2865162491798401, -0.2652131915092468, -0.24391013383865356, -0.2226070761680603, -0.20130401849746704, -0.18000096082687378, -0.15869790315628052, -0.13739484548568726, -0.116091787815094, -0.09478873014450073, -0.07348573207855225, -0.052182674407958984, -0.030879616737365723, -0.009576559066772461, 0.0117264986038208, 0.03302955627441406, 0.054332613945007324, 0.07563567161560059, 0.09693872928619385, 0.11824178695678711, 0.13954484462738037, 0.16084790229797363, 0.1821509599685669, 0.20345401763916016, 0.22475707530975342, 0.24606013298034668, 0.26736319065093994, 0.2886662483215332, 0.30996930599212646, 0.3312723636627197, 0.352575421333313, 0.37387847900390625, 0.3951815366744995, 0.4164845943450928, 0.43778765201568604, 0.4590907096862793, 0.48039376735687256, 0.5016968250274658, 0.5229998826980591, 0.5443029403686523, 0.5656059980392456, 0.5869090557098389, 0.6082121133804321]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 11.0, 10.0, 18.0, 29.0, 28.0, 38.0, 66.0, 119.0, 214.0, 447.0, 1041.0, 2922.0, 11442.0, 107036.0, 3717690.0, 326434.0, 19840.0, 4224.0, 1386.0, 600.0, 263.0, 162.0, 86.0, 57.0, 32.0, 15.0, 16.0, 4.0, 6.0, 11.0, 7.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12939453125, -0.1248779296875, -0.120361328125, -0.1158447265625, -0.111328125, -0.1068115234375, -0.102294921875, -0.0977783203125, -0.09326171875, -0.0887451171875, -0.084228515625, -0.0797119140625, -0.0751953125, -0.0706787109375, -0.066162109375, -0.0616455078125, -0.05712890625, -0.0526123046875, -0.048095703125, -0.0435791015625, -0.0390625, -0.0345458984375, -0.030029296875, -0.0255126953125, -0.02099609375, -0.0164794921875, -0.011962890625, -0.0074462890625, -0.0029296875, 0.0015869140625, 0.006103515625, 0.0106201171875, 0.01513671875, 0.0196533203125, 0.024169921875, 0.0286865234375, 0.033203125, 0.0377197265625, 0.042236328125, 0.0467529296875, 0.05126953125, 0.0557861328125, 0.060302734375, 0.0648193359375, 0.0693359375, 0.0738525390625, 0.078369140625, 0.0828857421875, 0.08740234375, 0.0919189453125, 0.096435546875, 0.1009521484375, 0.10546875, 0.1099853515625, 0.114501953125, 0.1190185546875, 0.12353515625, 0.1280517578125, 0.132568359375, 0.1370849609375, 0.1416015625, 0.1461181640625, 0.150634765625, 0.1551513671875, 0.15966796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 10.0, 18.0, 17.0, 25.0, 33.0, 34.0, 38.0, 37.0, 51.0, 62.0, 53.0, 51.0, 70.0, 60.0, 49.0, 49.0, 55.0, 39.0, 43.0, 33.0, 21.0, 19.0, 21.0, 20.0, 13.0, 14.0, 6.0, 7.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035888671875, -0.034821510314941406, -0.03375434875488281, -0.03268718719482422, -0.031620025634765625, -0.03055286407470703, -0.029485702514648438, -0.028418540954589844, -0.02735137939453125, -0.026284217834472656, -0.025217056274414062, -0.02414989471435547, -0.023082733154296875, -0.02201557159423828, -0.020948410034179688, -0.019881248474121094, -0.0188140869140625, -0.017746925354003906, -0.016679763793945312, -0.015612602233886719, -0.014545440673828125, -0.013478279113769531, -0.012411117553710938, -0.011343955993652344, -0.01027679443359375, -0.009209632873535156, -0.008142471313476562, -0.007075309753417969, -0.006008148193359375, -0.004940986633300781, -0.0038738250732421875, -0.0028066635131835938, -0.001739501953125, -0.0006723403930664062, 0.0003948211669921875, 0.0014619827270507812, 0.002529144287109375, 0.0035963058471679688, 0.0046634674072265625, 0.005730628967285156, 0.00679779052734375, 0.007864952087402344, 0.008932113647460938, 0.009999275207519531, 0.011066436767578125, 0.012133598327636719, 0.013200759887695312, 0.014267921447753906, 0.0153350830078125, 0.016402244567871094, 0.017469406127929688, 0.01853656768798828, 0.019603729248046875, 0.02067089080810547, 0.021738052368164062, 0.022805213928222656, 0.02387237548828125, 0.024939537048339844, 0.026006698608398438, 0.02707386016845703, 0.028141021728515625, 0.02920818328857422, 0.030275344848632812, 0.031342506408691406, 0.03240966796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 14.0, 14.0, 13.0, 23.0, 28.0, 36.0, 58.0, 76.0, 81.0, 85.0, 106.0, 171.0, 260.0, 495.0, 1512.0, 17199.0, 4098637.0, 71367.0, 2680.0, 609.0, 251.0, 157.0, 112.0, 97.0, 59.0, 28.0, 25.0, 22.0, 14.0, 13.0, 11.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.4902191162109375, -0.473114013671875, -0.4560089111328125, -0.43890380859375, -0.4217987060546875, -0.404693603515625, -0.3875885009765625, -0.3704833984375, -0.3533782958984375, -0.336273193359375, -0.3191680908203125, -0.30206298828125, -0.2849578857421875, -0.267852783203125, -0.2507476806640625, -0.233642578125, -0.2165374755859375, -0.199432373046875, -0.1823272705078125, -0.16522216796875, -0.1481170654296875, -0.131011962890625, -0.1139068603515625, -0.0968017578125, -0.0796966552734375, -0.062591552734375, -0.0454864501953125, -0.02838134765625, -0.0112762451171875, 0.005828857421875, 0.0229339599609375, 0.0400390625, 0.0571441650390625, 0.074249267578125, 0.0913543701171875, 0.10845947265625, 0.1255645751953125, 0.142669677734375, 0.1597747802734375, 0.1768798828125, 0.1939849853515625, 0.211090087890625, 0.2281951904296875, 0.24530029296875, 0.2624053955078125, 0.279510498046875, 0.2966156005859375, 0.313720703125, 0.3308258056640625, 0.347930908203125, 0.3650360107421875, 0.38214111328125, 0.3992462158203125, 0.416351318359375, 0.4334564208984375, 0.4505615234375, 0.4676666259765625, 0.484771728515625, 0.5018768310546875, 0.51898193359375, 0.5360870361328125, 0.553192138671875, 0.5702972412109375, 0.58740234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 14.0, 18.0, 44.0, 193.0, 1901.0, 1604.0, 188.0, 67.0, 27.0, 13.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6757278442382812, -0.6610260009765625, -0.6463241577148438, -0.631622314453125, -0.6169204711914062, -0.6022186279296875, -0.5875167846679688, -0.57281494140625, -0.5581130981445312, -0.5434112548828125, -0.5287094116210938, -0.514007568359375, -0.49930572509765625, -0.4846038818359375, -0.46990203857421875, -0.4552001953125, -0.44049835205078125, -0.4257965087890625, -0.41109466552734375, -0.396392822265625, -0.38169097900390625, -0.3669891357421875, -0.35228729248046875, -0.33758544921875, -0.32288360595703125, -0.3081817626953125, -0.29347991943359375, -0.278778076171875, -0.26407623291015625, -0.2493743896484375, -0.23467254638671875, -0.219970703125, -0.20526885986328125, -0.1905670166015625, -0.17586517333984375, -0.161163330078125, -0.14646148681640625, -0.1317596435546875, -0.11705780029296875, -0.10235595703125, -0.08765411376953125, -0.0729522705078125, -0.05825042724609375, -0.043548583984375, -0.02884674072265625, -0.0141448974609375, 0.00055694580078125, 0.0152587890625, 0.02996063232421875, 0.0446624755859375, 0.05936431884765625, 0.074066162109375, 0.08876800537109375, 0.1034698486328125, 0.11817169189453125, 0.13287353515625, 0.14757537841796875, 0.1622772216796875, 0.17697906494140625, 0.191680908203125, 0.20638275146484375, 0.2210845947265625, 0.23578643798828125, 0.25048828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 5.0, 5.0, 7.0, 22.0, 23.0, 33.0, 44.0, 70.0, 119.0, 146.0, 166.0, 112.0, 82.0, 50.0, 26.0, 25.0, 14.0, 5.0, 0.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9199395179748535, -1.8638726472854614, -1.8078057765960693, -1.7517387866973877, -1.6956719160079956, -1.6396050453186035, -1.5835380554199219, -1.5274711847305298, -1.4714043140411377, -1.4153374433517456, -1.3592705726623535, -1.3032035827636719, -1.2471367120742798, -1.1910698413848877, -1.135002851486206, -1.078935980796814, -1.0228691101074219, -0.9668022394180298, -0.9107353091239929, -0.854668378829956, -0.798601508140564, -0.7425346374511719, -0.686467707157135, -0.6304007768630981, -0.574333906173706, -0.518267035484314, -0.4622001051902771, -0.4061332046985626, -0.35006630420684814, -0.29399940371513367, -0.2379325032234192, -0.1818656027317047, -0.12579870223999023, -0.06973180174827576, -0.01366490125656128, 0.0424019992351532, 0.09846889972686768, 0.15453580021858215, 0.21060270071029663, 0.2666696012020111, 0.3227365016937256, 0.37880340218544006, 0.43487030267715454, 0.490937203168869, 0.5470041036605835, 0.6030709743499756, 0.6591379046440125, 0.7152048349380493, 0.7712717056274414, 0.8273385763168335, 0.8834055066108704, 0.9394724369049072, 0.9955393075942993, 1.0516061782836914, 1.107673168182373, 1.1637400388717651, 1.2198069095611572, 1.2758737802505493, 1.3319406509399414, 1.388007640838623, 1.4440745115280151, 1.5001413822174072, 1.5562083721160889, 1.612275242805481, 1.668342113494873]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 13.0, 10.0, 13.0, 24.0, 22.0, 24.0, 27.0, 33.0, 42.0, 39.0, 39.0, 68.0, 51.0, 52.0, 65.0, 47.0, 56.0, 44.0, 56.0, 42.0, 27.0, 34.0, 34.0, 24.0, 12.0, 14.0, 15.0, 9.0, 6.0, 10.0, 7.0, 8.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0254302024841309, -0.9901659488677979, -0.9549016356468201, -0.9196373820304871, -0.8843730688095093, -0.8491088151931763, -0.8138445615768433, -0.7785802483558655, -0.7433159351348877, -0.7080516815185547, -0.6727873682975769, -0.6375231146812439, -0.6022588014602661, -0.5669945478439331, -0.5317302942276001, -0.4964659810066223, -0.4612017273902893, -0.4259374439716339, -0.3906731605529785, -0.3554089069366455, -0.3201445937156677, -0.2848803400993347, -0.24961605668067932, -0.21435177326202393, -0.17908748984336853, -0.14382320642471313, -0.10855893045663834, -0.07329465448856354, -0.03803037106990814, -0.0027660876512527466, 0.032498180866241455, 0.06776246428489685, 0.10302674770355225, 0.13829103112220764, 0.17355531454086304, 0.20881958305835724, 0.24408386647701263, 0.27934813499450684, 0.31461241841316223, 0.3498767018318176, 0.385140985250473, 0.4204052686691284, 0.4556695520877838, 0.4909338355064392, 0.5261980891227722, 0.56146240234375, 0.596726655960083, 0.631990909576416, 0.6672552227973938, 0.7025194764137268, 0.7377837896347046, 0.7730480432510376, 0.8083123564720154, 0.8435766100883484, 0.8788409233093262, 0.9141051769256592, 0.9493694305419922, 0.9846336841583252, 1.0198979377746582, 1.0551623106002808, 1.0904265642166138, 1.1256908178329468, 1.1609550714492798, 1.1962194442749023, 1.2314836978912354]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 13.0, 24.0, 35.0, 57.0, 73.0, 98.0, 168.0, 209.0, 305.0, 484.0, 831.0, 1323.0, 2241.0, 4040.0, 7771.0, 15912.0, 37446.0, 100378.0, 301359.0, 362423.0, 128303.0, 45501.0, 19149.0, 9008.0, 4711.0, 2557.0, 1486.0, 942.0, 585.0, 358.0, 245.0, 166.0, 112.0, 68.0, 43.0, 30.0, 17.0, 18.0, 10.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 6.0, 1.0, 3.0], "bins": [-0.1346435546875, -0.13080883026123047, -0.12697410583496094, -0.1231393814086914, -0.11930465698242188, -0.11546993255615234, -0.11163520812988281, -0.10780048370361328, -0.10396575927734375, -0.10013103485107422, -0.09629631042480469, -0.09246158599853516, -0.08862686157226562, -0.0847921371459961, -0.08095741271972656, -0.07712268829345703, -0.0732879638671875, -0.06945323944091797, -0.06561851501464844, -0.061783790588378906, -0.057949066162109375, -0.054114341735839844, -0.05027961730957031, -0.04644489288330078, -0.04261016845703125, -0.03877544403076172, -0.03494071960449219, -0.031105995178222656, -0.027271270751953125, -0.023436546325683594, -0.019601821899414062, -0.01576709747314453, -0.011932373046875, -0.008097648620605469, -0.0042629241943359375, -0.00042819976806640625, 0.003406524658203125, 0.007241249084472656, 0.011075973510742188, 0.014910697937011719, 0.01874542236328125, 0.02258014678955078, 0.026414871215820312, 0.030249595642089844, 0.034084320068359375, 0.037919044494628906, 0.04175376892089844, 0.04558849334716797, 0.0494232177734375, 0.05325794219970703, 0.05709266662597656, 0.060927391052246094, 0.06476211547851562, 0.06859683990478516, 0.07243156433105469, 0.07626628875732422, 0.08010101318359375, 0.08393573760986328, 0.08777046203613281, 0.09160518646240234, 0.09543991088867188, 0.0992746353149414, 0.10310935974121094, 0.10694408416748047, 0.11077880859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 13.0, 9.0, 17.0, 14.0, 19.0, 27.0, 30.0, 38.0, 54.0, 40.0, 68.0, 65.0, 62.0, 69.0, 67.0, 72.0, 47.0, 42.0, 34.0, 37.0, 28.0, 28.0, 25.0, 18.0, 11.0, 14.0, 16.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06048583984375, -0.05835247039794922, -0.05621910095214844, -0.054085731506347656, -0.051952362060546875, -0.049818992614746094, -0.04768562316894531, -0.04555225372314453, -0.04341888427734375, -0.04128551483154297, -0.03915214538574219, -0.037018775939941406, -0.034885406494140625, -0.032752037048339844, -0.030618667602539062, -0.02848529815673828, -0.0263519287109375, -0.02421855926513672, -0.022085189819335938, -0.019951820373535156, -0.017818450927734375, -0.015685081481933594, -0.013551712036132812, -0.011418342590332031, -0.00928497314453125, -0.007151603698730469, -0.0050182342529296875, -0.0028848648071289062, -0.000751495361328125, 0.0013818740844726562, 0.0035152435302734375, 0.005648612976074219, 0.007781982421875, 0.009915351867675781, 0.012048721313476562, 0.014182090759277344, 0.016315460205078125, 0.018448829650878906, 0.020582199096679688, 0.02271556854248047, 0.02484893798828125, 0.02698230743408203, 0.029115676879882812, 0.031249046325683594, 0.033382415771484375, 0.035515785217285156, 0.03764915466308594, 0.03978252410888672, 0.0419158935546875, 0.04404926300048828, 0.04618263244628906, 0.048316001892089844, 0.050449371337890625, 0.052582740783691406, 0.05471611022949219, 0.05684947967529297, 0.05898284912109375, 0.06111621856689453, 0.06324958801269531, 0.0653829574584961, 0.06751632690429688, 0.06964969635009766, 0.07178306579589844, 0.07391643524169922, 0.0760498046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 1.0, 7.0, 1.0, 3.0, 10.0, 18.0, 15.0, 22.0, 41.0, 47.0, 93.0, 114.0, 144.0, 252.0, 482.0, 837.0, 1839.0, 4610.0, 14305.0, 73422.0, 765206.0, 153532.0, 22310.0, 6285.0, 2426.0, 1088.0, 576.0, 302.0, 192.0, 113.0, 80.0, 37.0, 37.0, 27.0, 27.0, 15.0, 10.0, 9.0, 3.0, 4.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.32403564453125, -0.3131103515625, -0.30218505859375, -0.291259765625, -0.28033447265625, -0.2694091796875, -0.25848388671875, -0.24755859375, -0.23663330078125, -0.2257080078125, -0.21478271484375, -0.203857421875, -0.19293212890625, -0.1820068359375, -0.17108154296875, -0.16015625, -0.14923095703125, -0.1383056640625, -0.12738037109375, -0.116455078125, -0.10552978515625, -0.0946044921875, -0.08367919921875, -0.07275390625, -0.06182861328125, -0.0509033203125, -0.03997802734375, -0.029052734375, -0.01812744140625, -0.0072021484375, 0.00372314453125, 0.0146484375, 0.02557373046875, 0.0364990234375, 0.04742431640625, 0.058349609375, 0.06927490234375, 0.0802001953125, 0.09112548828125, 0.10205078125, 0.11297607421875, 0.1239013671875, 0.13482666015625, 0.145751953125, 0.15667724609375, 0.1676025390625, 0.17852783203125, 0.189453125, 0.20037841796875, 0.2113037109375, 0.22222900390625, 0.233154296875, 0.24407958984375, 0.2550048828125, 0.26593017578125, 0.27685546875, 0.28778076171875, 0.2987060546875, 0.30963134765625, 0.320556640625, 0.33148193359375, 0.3424072265625, 0.35333251953125, 0.3642578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 8.0, 4.0, 11.0, 9.0, 12.0, 11.0, 18.0, 17.0, 18.0, 19.0, 38.0, 40.0, 51.0, 43.0, 50.0, 65.0, 74.0, 62.0, 63.0, 52.0, 53.0, 37.0, 31.0, 36.0, 44.0, 23.0, 31.0, 14.0, 13.0, 11.0, 12.0, 6.0, 7.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.367919921875, -0.3563995361328125, -0.344879150390625, -0.3333587646484375, -0.32183837890625, -0.3103179931640625, -0.298797607421875, -0.2872772216796875, -0.2757568359375, -0.2642364501953125, -0.252716064453125, -0.2411956787109375, -0.22967529296875, -0.2181549072265625, -0.206634521484375, -0.1951141357421875, -0.18359375, -0.1720733642578125, -0.160552978515625, -0.1490325927734375, -0.13751220703125, -0.1259918212890625, -0.114471435546875, -0.1029510498046875, -0.0914306640625, -0.0799102783203125, -0.068389892578125, -0.0568695068359375, -0.04534912109375, -0.0338287353515625, -0.022308349609375, -0.0107879638671875, 0.000732421875, 0.0122528076171875, 0.023773193359375, 0.0352935791015625, 0.04681396484375, 0.0583343505859375, 0.069854736328125, 0.0813751220703125, 0.0928955078125, 0.1044158935546875, 0.115936279296875, 0.1274566650390625, 0.13897705078125, 0.1504974365234375, 0.162017822265625, 0.1735382080078125, 0.18505859375, 0.1965789794921875, 0.208099365234375, 0.2196197509765625, 0.23114013671875, 0.2426605224609375, 0.254180908203125, 0.2657012939453125, 0.2772216796875, 0.2887420654296875, 0.300262451171875, 0.3117828369140625, 0.32330322265625, 0.3348236083984375, 0.346343994140625, 0.3578643798828125, 0.369384765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 3.0, 7.0, 18.0, 27.0, 62.0, 86.0, 164.0, 310.0, 532.0, 1172.0, 2313.0, 5193.0, 12751.0, 44770.0, 738157.0, 199383.0, 26801.0, 9167.0, 3788.0, 1878.0, 914.0, 455.0, 260.0, 137.0, 75.0, 44.0, 32.0, 31.0, 9.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.287841796875, -0.2809600830078125, -0.274078369140625, -0.2671966552734375, -0.26031494140625, -0.2534332275390625, -0.246551513671875, -0.2396697998046875, -0.2327880859375, -0.2259063720703125, -0.219024658203125, -0.2121429443359375, -0.20526123046875, -0.1983795166015625, -0.191497802734375, -0.1846160888671875, -0.177734375, -0.1708526611328125, -0.163970947265625, -0.1570892333984375, -0.15020751953125, -0.1433258056640625, -0.136444091796875, -0.1295623779296875, -0.1226806640625, -0.1157989501953125, -0.108917236328125, -0.1020355224609375, -0.09515380859375, -0.0882720947265625, -0.081390380859375, -0.0745086669921875, -0.067626953125, -0.0607452392578125, -0.053863525390625, -0.0469818115234375, -0.04010009765625, -0.0332183837890625, -0.026336669921875, -0.0194549560546875, -0.0125732421875, -0.0056915283203125, 0.001190185546875, 0.0080718994140625, 0.01495361328125, 0.0218353271484375, 0.028717041015625, 0.0355987548828125, 0.04248046875, 0.0493621826171875, 0.056243896484375, 0.0631256103515625, 0.07000732421875, 0.0768890380859375, 0.083770751953125, 0.0906524658203125, 0.0975341796875, 0.1044158935546875, 0.111297607421875, 0.1181793212890625, 0.12506103515625, 0.1319427490234375, 0.138824462890625, 0.1457061767578125, 0.152587890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 8.0, 7.0, 13.0, 13.0, 25.0, 37.0, 100.0, 341.0, 250.0, 72.0, 31.0, 16.0, 12.0, 14.0, 12.0, 7.0, 3.0, 5.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.721517562866211e-05, -9.255018085241318e-05, -8.788518607616425e-05, -8.322019129991531e-05, -7.855519652366638e-05, -7.389020174741745e-05, -6.922520697116852e-05, -6.456021219491959e-05, -5.9895217418670654e-05, -5.523022264242172e-05, -5.056522786617279e-05, -4.590023308992386e-05, -4.123523831367493e-05, -3.6570243537425995e-05, -3.190524876117706e-05, -2.724025398492813e-05, -2.25752592086792e-05, -1.7910264432430267e-05, -1.3245269656181335e-05, -8.580274879932404e-06, -3.915280103683472e-06, 7.497146725654602e-07, 5.414709448814392e-06, 1.0079704225063324e-05, 1.4744699001312256e-05, 1.9409693777561188e-05, 2.407468855381012e-05, 2.873968333005905e-05, 3.3404678106307983e-05, 3.8069672882556915e-05, 4.273466765880585e-05, 4.739966243505478e-05, 5.206465721130371e-05, 5.672965198755264e-05, 6.139464676380157e-05, 6.60596415400505e-05, 7.072463631629944e-05, 7.538963109254837e-05, 8.00546258687973e-05, 8.471962064504623e-05, 8.938461542129517e-05, 9.40496101975441e-05, 9.871460497379303e-05, 0.00010337959975004196, 0.0001080445945262909, 0.00011270958930253983, 0.00011737458407878876, 0.00012203957885503769, 0.00012670457363128662, 0.00013136956840753555, 0.00013603456318378448, 0.00014069955796003342, 0.00014536455273628235, 0.00015002954751253128, 0.0001546945422887802, 0.00015935953706502914, 0.00016402453184127808, 0.000168689526617527, 0.00017335452139377594, 0.00017801951617002487, 0.0001826845109462738, 0.00018734950572252274, 0.00019201450049877167, 0.0001966794952750206, 0.00020134449005126953]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 9.0, 20.0, 29.0, 51.0, 90.0, 118.0, 215.0, 399.0, 742.0, 1900.0, 5488.0, 19496.0, 199269.0, 775908.0, 32332.0, 7653.0, 2617.0, 1045.0, 454.0, 269.0, 150.0, 92.0, 62.0, 32.0, 26.0, 13.0, 8.0, 16.0, 7.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2403564453125, -0.2315044403076172, -0.22265243530273438, -0.21380043029785156, -0.20494842529296875, -0.19609642028808594, -0.18724441528320312, -0.1783924102783203, -0.1695404052734375, -0.1606884002685547, -0.15183639526367188, -0.14298439025878906, -0.13413238525390625, -0.12528038024902344, -0.11642837524414062, -0.10757637023925781, -0.098724365234375, -0.08987236022949219, -0.08102035522460938, -0.07216835021972656, -0.06331634521484375, -0.05446434020996094, -0.045612335205078125, -0.03676033020019531, -0.0279083251953125, -0.019056320190429688, -0.010204315185546875, -0.0013523101806640625, 0.00749969482421875, 0.016351699829101562, 0.025203704833984375, 0.03405570983886719, 0.04290771484375, 0.05175971984863281, 0.060611724853515625, 0.06946372985839844, 0.07831573486328125, 0.08716773986816406, 0.09601974487304688, 0.10487174987792969, 0.1137237548828125, 0.12257575988769531, 0.13142776489257812, 0.14027976989746094, 0.14913177490234375, 0.15798377990722656, 0.16683578491210938, 0.1756877899169922, 0.184539794921875, 0.1933917999267578, 0.20224380493164062, 0.21109580993652344, 0.21994781494140625, 0.22879981994628906, 0.23765182495117188, 0.2465038299560547, 0.2553558349609375, 0.2642078399658203, 0.2730598449707031, 0.28191184997558594, 0.29076385498046875, 0.29961585998535156, 0.3084678649902344, 0.3173198699951172, 0.326171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 12.0, 11.0, 8.0, 22.0, 29.0, 20.0, 52.0, 96.0, 141.0, 200.0, 166.0, 71.0, 46.0, 43.0, 22.0, 15.0, 8.0, 4.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.243896484375, -0.2370319366455078, -0.23016738891601562, -0.22330284118652344, -0.21643829345703125, -0.20957374572753906, -0.20270919799804688, -0.1958446502685547, -0.1889801025390625, -0.1821155548095703, -0.17525100708007812, -0.16838645935058594, -0.16152191162109375, -0.15465736389160156, -0.14779281616210938, -0.1409282684326172, -0.134063720703125, -0.1271991729736328, -0.12033462524414062, -0.11347007751464844, -0.10660552978515625, -0.09974098205566406, -0.09287643432617188, -0.08601188659667969, -0.0791473388671875, -0.07228279113769531, -0.06541824340820312, -0.05855369567871094, -0.05168914794921875, -0.04482460021972656, -0.037960052490234375, -0.031095504760742188, -0.02423095703125, -0.017366409301757812, -0.010501861572265625, -0.0036373138427734375, 0.00322723388671875, 0.010091781616210938, 0.016956329345703125, 0.023820877075195312, 0.0306854248046875, 0.03754997253417969, 0.044414520263671875, 0.05127906799316406, 0.05814361572265625, 0.06500816345214844, 0.07187271118164062, 0.07873725891113281, 0.085601806640625, 0.09246635437011719, 0.09933090209960938, 0.10619544982910156, 0.11305999755859375, 0.11992454528808594, 0.12678909301757812, 0.1336536407470703, 0.1405181884765625, 0.1473827362060547, 0.15424728393554688, 0.16111183166503906, 0.16797637939453125, 0.17484092712402344, 0.18170547485351562, 0.1885700225830078, 0.1954345703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 15.0, 19.0, 63.0, 132.0, 317.0, 228.0, 121.0, 52.0, 22.0, 8.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.817688465118408, -2.660344123840332, -2.5029995441436768, -2.3456552028656006, -2.1883106231689453, -2.030966281890869, -1.873621940612793, -1.7162774801254272, -1.5589330196380615, -1.4015885591506958, -1.24424409866333, -1.086899757385254, -0.9295552968978882, -0.7722108364105225, -0.6148664355278015, -0.45752203464508057, -0.30017757415771484, -0.1428331434726715, 0.014511287212371826, 0.17185571789741516, 0.3292001485824585, 0.4865446090698242, 0.6438890099525452, 0.8012334108352661, 0.9585778713226318, 1.1159223318099976, 1.2732667922973633, 1.4306111335754395, 1.5879555940628052, 1.745300054550171, 1.902644395828247, 2.0599889755249023, 2.2173328399658203, 2.3746771812438965, 2.5320217609405518, 2.689366102218628, 2.846710681915283, 3.0040550231933594, 3.1613993644714355, 3.3187437057495117, 3.476088285446167, 3.633432626724243, 3.7907772064208984, 3.9481215476989746, 4.105465888977051, 4.262810707092285, 4.420155048370361, 4.5774993896484375, 4.734843730926514, 4.89218807220459, 5.049532413482666, 5.2068772315979, 5.364221572875977, 5.521565914154053, 5.678910255432129, 5.836254596710205, 5.993598937988281, 6.150943279266357, 6.308287620544434, 6.465632438659668, 6.622976779937744, 6.78032112121582, 6.9376654624938965, 7.095009803771973, 7.252354621887207]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 6.0, 7.0, 17.0, 11.0, 19.0, 25.0, 26.0, 33.0, 36.0, 36.0, 47.0, 49.0, 67.0, 84.0, 102.0, 75.0, 46.0, 44.0, 49.0, 40.0, 24.0, 28.0, 21.0, 22.0, 18.0, 9.0, 14.0, 5.0, 10.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.019620418548584, -1.9527716636657715, -1.885922908782959, -1.8190741539001465, -1.752225399017334, -1.6853766441345215, -1.6185280084609985, -1.551679253578186, -1.4848304986953735, -1.417981743812561, -1.3511329889297485, -1.284284234046936, -1.217435598373413, -1.1505868434906006, -1.083738088607788, -1.0168893337249756, -0.9500405788421631, -0.8831918239593506, -0.8163430690765381, -0.7494943737983704, -0.6826456189155579, -0.6157968640327454, -0.5489481687545776, -0.48209941387176514, -0.41525065898895264, -0.34840190410614014, -0.28155317902565, -0.21470443904399872, -0.1478556990623474, -0.08100694417953491, -0.0141582190990448, 0.05269050598144531, 0.11953926086425781, 0.18638800084590912, 0.2532367408275604, 0.32008546590805054, 0.38693422079086304, 0.45378297567367554, 0.5206316709518433, 0.5874804258346558, 0.6543291807174683, 0.7211779356002808, 0.7880266904830933, 0.854875385761261, 0.9217241406440735, 0.988572895526886, 1.0554215908050537, 1.1222703456878662, 1.1891191005706787, 1.2559678554534912, 1.3228166103363037, 1.3896653652191162, 1.4565141201019287, 1.5233628749847412, 1.5902115106582642, 1.6570602655410767, 1.7239090204238892, 1.7907577753067017, 1.8576065301895142, 1.9244552850723267, 1.9913039207458496, 2.058152675628662, 2.1250014305114746, 2.191850185394287, 2.2586989402770996]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 14.0, 22.0, 27.0, 52.0, 93.0, 166.0, 353.0, 675.0, 1638.0, 3887.0, 11549.0, 61768.0, 2128981.0, 1911476.0, 55740.0, 10977.0, 3785.0, 1648.0, 721.0, 306.0, 174.0, 73.0, 54.0, 24.0, 20.0, 12.0, 9.0, 4.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1832275390625, -0.1766796112060547, -0.17013168334960938, -0.16358375549316406, -0.15703582763671875, -0.15048789978027344, -0.14393997192382812, -0.1373920440673828, -0.1308441162109375, -0.12429618835449219, -0.11774826049804688, -0.11120033264160156, -0.10465240478515625, -0.09810447692871094, -0.09155654907226562, -0.08500862121582031, -0.078460693359375, -0.07191276550292969, -0.06536483764648438, -0.05881690979003906, -0.05226898193359375, -0.04572105407714844, -0.039173126220703125, -0.03262519836425781, -0.0260772705078125, -0.019529342651367188, -0.012981414794921875, -0.0064334869384765625, 0.00011444091796875, 0.0066623687744140625, 0.013210296630859375, 0.019758224487304688, 0.02630615234375, 0.03285408020019531, 0.039402008056640625, 0.04594993591308594, 0.05249786376953125, 0.05904579162597656, 0.06559371948242188, 0.07214164733886719, 0.0786895751953125, 0.08523750305175781, 0.09178543090820312, 0.09833335876464844, 0.10488128662109375, 0.11142921447753906, 0.11797714233398438, 0.12452507019042969, 0.131072998046875, 0.1376209259033203, 0.14416885375976562, 0.15071678161621094, 0.15726470947265625, 0.16381263732910156, 0.17036056518554688, 0.1769084930419922, 0.1834564208984375, 0.1900043487548828, 0.19655227661132812, 0.20310020446777344, 0.20964813232421875, 0.21619606018066406, 0.22274398803710938, 0.2292919158935547, 0.23583984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 6.0, 4.0, 13.0, 6.0, 11.0, 14.0, 23.0, 26.0, 32.0, 37.0, 42.0, 63.0, 68.0, 77.0, 57.0, 67.0, 69.0, 63.0, 55.0, 47.0, 51.0, 30.0, 27.0, 25.0, 20.0, 15.0, 10.0, 13.0, 4.0, 6.0, 6.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.08404541015625, -0.08167076110839844, -0.07929611206054688, -0.07692146301269531, -0.07454681396484375, -0.07217216491699219, -0.06979751586914062, -0.06742286682128906, -0.0650482177734375, -0.06267356872558594, -0.060298919677734375, -0.05792427062988281, -0.05554962158203125, -0.05317497253417969, -0.050800323486328125, -0.04842567443847656, -0.046051025390625, -0.04367637634277344, -0.041301727294921875, -0.03892707824707031, -0.03655242919921875, -0.03417778015136719, -0.031803131103515625, -0.029428482055664062, -0.0270538330078125, -0.024679183959960938, -0.022304534912109375, -0.019929885864257812, -0.01755523681640625, -0.015180587768554688, -0.012805938720703125, -0.010431289672851562, -0.008056640625, -0.0056819915771484375, -0.003307342529296875, -0.0009326934814453125, 0.00144195556640625, 0.0038166046142578125, 0.006191253662109375, 0.008565902709960938, 0.0109405517578125, 0.013315200805664062, 0.015689849853515625, 0.018064498901367188, 0.02043914794921875, 0.022813796997070312, 0.025188446044921875, 0.027563095092773438, 0.029937744140625, 0.03231239318847656, 0.034687042236328125, 0.03706169128417969, 0.03943634033203125, 0.04181098937988281, 0.044185638427734375, 0.04656028747558594, 0.0489349365234375, 0.05130958557128906, 0.053684234619140625, 0.05605888366699219, 0.05843353271484375, 0.06080818176269531, 0.06318283081054688, 0.06555747985839844, 0.06793212890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 14.0, 19.0, 11.0, 23.0, 22.0, 27.0, 57.0, 69.0, 112.0, 144.0, 245.0, 457.0, 722.0, 1806.0, 12557.0, 3969345.0, 201108.0, 4931.0, 1141.0, 522.0, 328.0, 172.0, 127.0, 84.0, 66.0, 31.0, 27.0, 19.0, 13.0, 25.0, 15.0, 6.0, 9.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6443023681640625, -0.621124267578125, -0.5979461669921875, -0.57476806640625, -0.5515899658203125, -0.528411865234375, -0.5052337646484375, -0.4820556640625, -0.4588775634765625, -0.435699462890625, -0.4125213623046875, -0.38934326171875, -0.3661651611328125, -0.342987060546875, -0.3198089599609375, -0.296630859375, -0.2734527587890625, -0.250274658203125, -0.2270965576171875, -0.20391845703125, -0.1807403564453125, -0.157562255859375, -0.1343841552734375, -0.1112060546875, -0.0880279541015625, -0.064849853515625, -0.0416717529296875, -0.01849365234375, 0.0046844482421875, 0.027862548828125, 0.0510406494140625, 0.07421875, 0.0973968505859375, 0.120574951171875, 0.1437530517578125, 0.16693115234375, 0.1901092529296875, 0.213287353515625, 0.2364654541015625, 0.2596435546875, 0.2828216552734375, 0.305999755859375, 0.3291778564453125, 0.35235595703125, 0.3755340576171875, 0.398712158203125, 0.4218902587890625, 0.445068359375, 0.4682464599609375, 0.491424560546875, 0.5146026611328125, 0.53778076171875, 0.5609588623046875, 0.584136962890625, 0.6073150634765625, 0.6304931640625, 0.6536712646484375, 0.676849365234375, 0.7000274658203125, 0.72320556640625, 0.7463836669921875, 0.769561767578125, 0.7927398681640625, 0.81591796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 12.0, 27.0, 95.0, 390.0, 2317.0, 916.0, 187.0, 68.0, 35.0, 10.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6832122802734375, -0.662322998046875, -0.6414337158203125, -0.62054443359375, -0.5996551513671875, -0.578765869140625, -0.5578765869140625, -0.5369873046875, -0.5160980224609375, -0.495208740234375, -0.4743194580078125, -0.45343017578125, -0.4325408935546875, -0.411651611328125, -0.3907623291015625, -0.369873046875, -0.3489837646484375, -0.328094482421875, -0.3072052001953125, -0.28631591796875, -0.2654266357421875, -0.244537353515625, -0.2236480712890625, -0.2027587890625, -0.1818695068359375, -0.160980224609375, -0.1400909423828125, -0.11920166015625, -0.0983123779296875, -0.077423095703125, -0.0565338134765625, -0.03564453125, -0.0147552490234375, 0.006134033203125, 0.0270233154296875, 0.04791259765625, 0.0688018798828125, 0.089691162109375, 0.1105804443359375, 0.1314697265625, 0.1523590087890625, 0.173248291015625, 0.1941375732421875, 0.21502685546875, 0.2359161376953125, 0.256805419921875, 0.2776947021484375, 0.298583984375, 0.3194732666015625, 0.340362548828125, 0.3612518310546875, 0.38214111328125, 0.4030303955078125, 0.423919677734375, 0.4448089599609375, 0.4656982421875, 0.4865875244140625, 0.507476806640625, 0.5283660888671875, 0.54925537109375, 0.5701446533203125, 0.591033935546875, 0.6119232177734375, 0.6328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 13.0, 18.0, 37.0, 87.0, 250.0, 311.0, 175.0, 72.0, 20.0, 9.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1760382652282715, -2.0118887424468994, -1.8477389812469482, -1.6835894584655762, -1.5194398164749146, -1.355290174484253, -1.1911406517028809, -1.0269910097122192, -0.8628413677215576, -0.698691725730896, -0.5345421433448792, -0.3703925311565399, -0.20624291896820068, -0.04209327697753906, 0.12205630540847778, 0.28620588779449463, 0.45035552978515625, 0.6145051717758179, 0.7786547541618347, 0.9428043365478516, 1.1069539785385132, 1.2711036205291748, 1.4352531433105469, 1.5994027853012085, 1.7635524272918701, 1.9277020692825317, 2.0918517112731934, 2.2560012340545654, 2.4201507568359375, 2.5843005180358887, 2.7484500408172607, 2.912599563598633, 3.076748847961426, 3.240898370742798, 3.405048131942749, 3.569197654724121, 3.7333474159240723, 3.8974969387054443, 4.061646461486816, 4.225796222686768, 4.389945983886719, 4.55409574508667, 4.718245029449463, 4.882394790649414, 5.046544551849365, 5.210694313049316, 5.374843597412109, 5.5389933586120605, 5.7031426429748535, 5.867292404174805, 6.031441688537598, 6.195591449737549, 6.3597412109375, 6.523890495300293, 6.688040256500244, 6.852190017700195, 7.016339302062988, 7.1804890632629395, 7.344638347625732, 7.508788108825684, 7.672937870025635, 7.837087631225586, 8.001236915588379, 8.165386199951172, 8.329536437988281]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 8.0, 6.0, 6.0, 6.0, 14.0, 16.0, 14.0, 14.0, 19.0, 22.0, 28.0, 29.0, 31.0, 27.0, 49.0, 49.0, 59.0, 58.0, 46.0, 65.0, 50.0, 43.0, 49.0, 35.0, 36.0, 28.0, 25.0, 24.0, 18.0, 27.0, 21.0, 13.0, 12.0, 10.0, 5.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.3573970794677734, -1.31841242313385, -1.2794276475906372, -1.2404429912567139, -1.2014583349227905, -1.1624736785888672, -1.1234889030456543, -1.084504246711731, -1.0455195903778076, -1.0065349340438843, -0.9675502181053162, -0.928565502166748, -0.8895808458328247, -0.8505961298942566, -0.8116114139556885, -0.7726267576217651, -0.7336419820785522, -0.6946572661399841, -0.6556726098060608, -0.6166878938674927, -0.5777032375335693, -0.5387185215950012, -0.4997338056564331, -0.4607491195201874, -0.42176443338394165, -0.3827797472476959, -0.3437950611114502, -0.3048103451728821, -0.26582565903663635, -0.22684097290039062, -0.1878562718629837, -0.14887157082557678, -0.10988688468933105, -0.07090219110250473, -0.031917497515678406, 0.007067196071147919, 0.04605188965797424, 0.08503657579421997, 0.12402127683162689, 0.1630059778690338, 0.20199066400527954, 0.24097535014152527, 0.279960036277771, 0.3189447522163391, 0.35792943835258484, 0.39691412448883057, 0.4358988404273987, 0.4748835265636444, 0.5138682126998901, 0.5528529286384583, 0.5918375849723816, 0.6308223009109497, 0.669806957244873, 0.7087916731834412, 0.7477763891220093, 0.7867610454559326, 0.8257457613945007, 0.8647304773330688, 0.9037151336669922, 0.9426998496055603, 0.9816845655441284, 1.0206692218780518, 1.059653878211975, 1.098638653755188, 1.1376233100891113]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 11.0, 23.0, 28.0, 48.0, 50.0, 65.0, 97.0, 153.0, 212.0, 318.0, 450.0, 684.0, 1062.0, 1554.0, 2564.0, 4293.0, 7699.0, 14606.0, 28678.0, 60519.0, 136249.0, 269509.0, 266107.0, 132995.0, 59164.0, 28050.0, 14094.0, 7515.0, 4414.0, 2575.0, 1572.0, 1044.0, 688.0, 460.0, 295.0, 214.0, 152.0, 90.0, 66.0, 49.0, 38.0, 35.0, 14.0, 18.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1146240234375, -0.11092472076416016, -0.10722541809082031, -0.10352611541748047, -0.09982681274414062, -0.09612751007080078, -0.09242820739746094, -0.0887289047241211, -0.08502960205078125, -0.0813302993774414, -0.07763099670410156, -0.07393169403076172, -0.07023239135742188, -0.06653308868408203, -0.06283378601074219, -0.059134483337402344, -0.0554351806640625, -0.051735877990722656, -0.04803657531738281, -0.04433727264404297, -0.040637969970703125, -0.03693866729736328, -0.03323936462402344, -0.029540061950683594, -0.02584075927734375, -0.022141456604003906, -0.018442153930664062, -0.014742851257324219, -0.011043548583984375, -0.007344245910644531, -0.0036449432373046875, 5.435943603515625e-05, 0.003753662109375, 0.007452964782714844, 0.011152267456054688, 0.014851570129394531, 0.018550872802734375, 0.02225017547607422, 0.025949478149414062, 0.029648780822753906, 0.03334808349609375, 0.037047386169433594, 0.04074668884277344, 0.04444599151611328, 0.048145294189453125, 0.05184459686279297, 0.05554389953613281, 0.059243202209472656, 0.0629425048828125, 0.06664180755615234, 0.07034111022949219, 0.07404041290283203, 0.07773971557617188, 0.08143901824951172, 0.08513832092285156, 0.0888376235961914, 0.09253692626953125, 0.0962362289428711, 0.09993553161621094, 0.10363483428955078, 0.10733413696289062, 0.11103343963623047, 0.11473274230957031, 0.11843204498291016, 0.12213134765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 11.0, 11.0, 10.0, 20.0, 22.0, 30.0, 16.0, 22.0, 45.0, 40.0, 45.0, 41.0, 46.0, 45.0, 54.0, 59.0, 53.0, 49.0, 34.0, 38.0, 26.0, 39.0, 33.0, 32.0, 31.0, 27.0, 26.0, 14.0, 10.0, 10.0, 4.0, 9.0, 2.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07525634765625, -0.07300281524658203, -0.07074928283691406, -0.0684957504272461, -0.06624221801757812, -0.06398868560791016, -0.06173515319824219, -0.05948162078857422, -0.05722808837890625, -0.05497455596923828, -0.05272102355957031, -0.050467491149902344, -0.048213958740234375, -0.045960426330566406, -0.04370689392089844, -0.04145336151123047, -0.0391998291015625, -0.03694629669189453, -0.03469276428222656, -0.032439231872558594, -0.030185699462890625, -0.027932167053222656, -0.025678634643554688, -0.02342510223388672, -0.02117156982421875, -0.01891803741455078, -0.016664505004882812, -0.014410972595214844, -0.012157440185546875, -0.009903907775878906, -0.0076503753662109375, -0.005396842956542969, -0.003143310546875, -0.0008897781372070312, 0.0013637542724609375, 0.0036172866821289062, 0.005870819091796875, 0.008124351501464844, 0.010377883911132812, 0.012631416320800781, 0.01488494873046875, 0.01713848114013672, 0.019392013549804688, 0.021645545959472656, 0.023899078369140625, 0.026152610778808594, 0.028406143188476562, 0.03065967559814453, 0.0329132080078125, 0.03516674041748047, 0.03742027282714844, 0.039673805236816406, 0.041927337646484375, 0.044180870056152344, 0.04643440246582031, 0.04868793487548828, 0.05094146728515625, 0.05319499969482422, 0.05544853210449219, 0.057702064514160156, 0.059955596923828125, 0.062209129333496094, 0.06446266174316406, 0.06671619415283203, 0.0689697265625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 12.0, 14.0, 23.0, 44.0, 77.0, 133.0, 296.0, 741.0, 2381.0, 11201.0, 126971.0, 837981.0, 58695.0, 7186.0, 1685.0, 583.0, 241.0, 113.0, 59.0, 33.0, 17.0, 13.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5911712646484375, -0.573455810546875, -0.5557403564453125, -0.53802490234375, -0.5203094482421875, -0.502593994140625, -0.4848785400390625, -0.4671630859375, -0.4494476318359375, -0.431732177734375, -0.4140167236328125, -0.39630126953125, -0.3785858154296875, -0.360870361328125, -0.3431549072265625, -0.325439453125, -0.3077239990234375, -0.290008544921875, -0.2722930908203125, -0.25457763671875, -0.2368621826171875, -0.219146728515625, -0.2014312744140625, -0.1837158203125, -0.1660003662109375, -0.148284912109375, -0.1305694580078125, -0.11285400390625, -0.0951385498046875, -0.077423095703125, -0.0597076416015625, -0.0419921875, -0.0242767333984375, -0.006561279296875, 0.0111541748046875, 0.02886962890625, 0.0465850830078125, 0.064300537109375, 0.0820159912109375, 0.0997314453125, 0.1174468994140625, 0.135162353515625, 0.1528778076171875, 0.17059326171875, 0.1883087158203125, 0.206024169921875, 0.2237396240234375, 0.241455078125, 0.2591705322265625, 0.276885986328125, 0.2946014404296875, 0.31231689453125, 0.3300323486328125, 0.347747802734375, 0.3654632568359375, 0.3831787109375, 0.4008941650390625, 0.418609619140625, 0.4363250732421875, 0.45404052734375, 0.4717559814453125, 0.489471435546875, 0.5071868896484375, 0.52490234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 10.0, 13.0, 11.0, 13.0, 17.0, 26.0, 44.0, 33.0, 44.0, 53.0, 59.0, 62.0, 62.0, 76.0, 76.0, 58.0, 76.0, 48.0, 52.0, 34.0, 29.0, 28.0, 11.0, 19.0, 16.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.4932823181152344, -0.47924041748046875, -0.4651985168457031, -0.4511566162109375, -0.4371147155761719, -0.42307281494140625, -0.4090309143066406, -0.394989013671875, -0.3809471130371094, -0.36690521240234375, -0.3528633117675781, -0.3388214111328125, -0.3247795104980469, -0.31073760986328125, -0.2966957092285156, -0.28265380859375, -0.2686119079589844, -0.25457000732421875, -0.24052810668945312, -0.2264862060546875, -0.21244430541992188, -0.19840240478515625, -0.18436050415039062, -0.170318603515625, -0.15627670288085938, -0.14223480224609375, -0.12819290161132812, -0.1141510009765625, -0.10010910034179688, -0.08606719970703125, -0.07202529907226562, -0.0579833984375, -0.043941497802734375, -0.02989959716796875, -0.015857696533203125, -0.0018157958984375, 0.012226104736328125, 0.02626800537109375, 0.040309906005859375, 0.054351806640625, 0.06839370727539062, 0.08243560791015625, 0.09647750854492188, 0.1105194091796875, 0.12456130981445312, 0.13860321044921875, 0.15264511108398438, 0.16668701171875, 0.18072891235351562, 0.19477081298828125, 0.20881271362304688, 0.2228546142578125, 0.23689651489257812, 0.25093841552734375, 0.2649803161621094, 0.279022216796875, 0.2930641174316406, 0.30710601806640625, 0.3211479187011719, 0.3351898193359375, 0.3492317199707031, 0.36327362060546875, 0.3773155212402344, 0.391357421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 13.0, 15.0, 19.0, 18.0, 37.0, 51.0, 63.0, 111.0, 133.0, 224.0, 272.0, 413.0, 634.0, 983.0, 1572.0, 2641.0, 5099.0, 10195.0, 23243.0, 63816.0, 246990.0, 541859.0, 91721.0, 31158.0, 12656.0, 6129.0, 3238.0, 1808.0, 1108.0, 704.0, 502.0, 326.0, 228.0, 150.0, 124.0, 81.0, 60.0, 47.0, 40.0, 23.0, 11.0, 19.0, 3.0, 5.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11273193359375, -0.10886478424072266, -0.10499763488769531, -0.10113048553466797, -0.09726333618164062, -0.09339618682861328, -0.08952903747558594, -0.0856618881225586, -0.08179473876953125, -0.0779275894165039, -0.07406044006347656, -0.07019329071044922, -0.06632614135742188, -0.06245899200439453, -0.05859184265136719, -0.054724693298339844, -0.0508575439453125, -0.046990394592285156, -0.04312324523925781, -0.03925609588623047, -0.035388946533203125, -0.03152179718017578, -0.027654647827148438, -0.023787498474121094, -0.01992034912109375, -0.016053199768066406, -0.012186050415039062, -0.008318901062011719, -0.004451751708984375, -0.0005846023559570312, 0.0032825469970703125, 0.007149696350097656, 0.011016845703125, 0.014883995056152344, 0.018751144409179688, 0.02261829376220703, 0.026485443115234375, 0.03035259246826172, 0.03421974182128906, 0.038086891174316406, 0.04195404052734375, 0.045821189880371094, 0.04968833923339844, 0.05355548858642578, 0.057422637939453125, 0.06128978729248047, 0.06515693664550781, 0.06902408599853516, 0.0728912353515625, 0.07675838470458984, 0.08062553405761719, 0.08449268341064453, 0.08835983276367188, 0.09222698211669922, 0.09609413146972656, 0.0999612808227539, 0.10382843017578125, 0.1076955795288086, 0.11156272888183594, 0.11542987823486328, 0.11929702758789062, 0.12316417694091797, 0.1270313262939453, 0.13089847564697266, 0.134765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 9.0, 11.0, 11.0, 17.0, 20.0, 32.0, 45.0, 73.0, 94.0, 190.0, 136.0, 103.0, 52.0, 51.0, 43.0, 20.0, 14.0, 13.0, 10.0, 10.0, 12.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.529424667358398e-05, -8.278340101242065e-05, -8.027255535125732e-05, -7.7761709690094e-05, -7.525086402893066e-05, -7.274001836776733e-05, -7.0229172706604e-05, -6.771832704544067e-05, -6.520748138427734e-05, -6.269663572311401e-05, -6.0185790061950684e-05, -5.7674944400787354e-05, -5.5164098739624023e-05, -5.265325307846069e-05, -5.014240741729736e-05, -4.763156175613403e-05, -4.51207160949707e-05, -4.260987043380737e-05, -4.009902477264404e-05, -3.758817911148071e-05, -3.507733345031738e-05, -3.256648778915405e-05, -3.0055642127990723e-05, -2.7544796466827393e-05, -2.5033950805664062e-05, -2.2523105144500732e-05, -2.0012259483337402e-05, -1.7501413822174072e-05, -1.4990568161010742e-05, -1.2479722499847412e-05, -9.968876838684082e-06, -7.458031177520752e-06, -4.947185516357422e-06, -2.436339855194092e-06, 7.450580596923828e-08, 2.5853514671325684e-06, 5.0961971282958984e-06, 7.6070427894592285e-06, 1.0117888450622559e-05, 1.2628734111785889e-05, 1.5139579772949219e-05, 1.765042543411255e-05, 2.016127109527588e-05, 2.267211675643921e-05, 2.518296241760254e-05, 2.769380807876587e-05, 3.02046537399292e-05, 3.271549940109253e-05, 3.522634506225586e-05, 3.773719072341919e-05, 4.024803638458252e-05, 4.275888204574585e-05, 4.526972770690918e-05, 4.778057336807251e-05, 5.029141902923584e-05, 5.280226469039917e-05, 5.53131103515625e-05, 5.782395601272583e-05, 6.033480167388916e-05, 6.284564733505249e-05, 6.535649299621582e-05, 6.786733865737915e-05, 7.037818431854248e-05, 7.288902997970581e-05, 7.539987564086914e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 2.0, 14.0, 13.0, 11.0, 27.0, 44.0, 57.0, 106.0, 173.0, 320.0, 641.0, 1242.0, 2863.0, 6517.0, 17226.0, 52782.0, 218116.0, 596286.0, 103663.0, 29890.0, 10481.0, 4245.0, 1819.0, 914.0, 474.0, 232.0, 132.0, 68.0, 45.0, 42.0, 17.0, 21.0, 10.0, 12.0, 7.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1600341796875, -0.15549468994140625, -0.1509552001953125, -0.14641571044921875, -0.141876220703125, -0.13733673095703125, -0.1327972412109375, -0.12825775146484375, -0.12371826171875, -0.11917877197265625, -0.1146392822265625, -0.11009979248046875, -0.105560302734375, -0.10102081298828125, -0.0964813232421875, -0.09194183349609375, -0.08740234375, -0.08286285400390625, -0.0783233642578125, -0.07378387451171875, -0.069244384765625, -0.06470489501953125, -0.0601654052734375, -0.05562591552734375, -0.05108642578125, -0.04654693603515625, -0.0420074462890625, -0.03746795654296875, -0.032928466796875, -0.02838897705078125, -0.0238494873046875, -0.01930999755859375, -0.0147705078125, -0.01023101806640625, -0.0056915283203125, -0.00115203857421875, 0.003387451171875, 0.00792694091796875, 0.0124664306640625, 0.01700592041015625, 0.02154541015625, 0.02608489990234375, 0.0306243896484375, 0.03516387939453125, 0.039703369140625, 0.04424285888671875, 0.0487823486328125, 0.05332183837890625, 0.057861328125, 0.06240081787109375, 0.0669403076171875, 0.07147979736328125, 0.076019287109375, 0.08055877685546875, 0.0850982666015625, 0.08963775634765625, 0.09417724609375, 0.09871673583984375, 0.1032562255859375, 0.10779571533203125, 0.112335205078125, 0.11687469482421875, 0.1214141845703125, 0.12595367431640625, 0.1304931640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 14.0, 10.0, 12.0, 9.0, 20.0, 23.0, 31.0, 46.0, 67.0, 59.0, 99.0, 118.0, 113.0, 83.0, 69.0, 47.0, 40.0, 29.0, 24.0, 14.0, 15.0, 15.0, 6.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.1509418487548828, -0.14587783813476562, -0.14081382751464844, -0.13574981689453125, -0.13068580627441406, -0.12562179565429688, -0.12055778503417969, -0.1154937744140625, -0.11042976379394531, -0.10536575317382812, -0.10030174255371094, -0.09523773193359375, -0.09017372131347656, -0.08510971069335938, -0.08004570007324219, -0.074981689453125, -0.06991767883300781, -0.06485366821289062, -0.05978965759277344, -0.05472564697265625, -0.04966163635253906, -0.044597625732421875, -0.03953361511230469, -0.0344696044921875, -0.029405593872070312, -0.024341583251953125, -0.019277572631835938, -0.01421356201171875, -0.009149551391601562, -0.004085540771484375, 0.0009784698486328125, 0.00604248046875, 0.011106491088867188, 0.016170501708984375, 0.021234512329101562, 0.02629852294921875, 0.03136253356933594, 0.036426544189453125, 0.04149055480957031, 0.0465545654296875, 0.05161857604980469, 0.056682586669921875, 0.06174659729003906, 0.06681060791015625, 0.07187461853027344, 0.07693862915039062, 0.08200263977050781, 0.087066650390625, 0.09213066101074219, 0.09719467163085938, 0.10225868225097656, 0.10732269287109375, 0.11238670349121094, 0.11745071411132812, 0.12251472473144531, 0.1275787353515625, 0.1326427459716797, 0.13770675659179688, 0.14277076721191406, 0.14783477783203125, 0.15289878845214844, 0.15796279907226562, 0.1630268096923828, 0.1680908203125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 13.0, 19.0, 46.0, 89.0, 117.0, 265.0, 168.0, 107.0, 65.0, 43.0, 21.0, 14.0, 13.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7375526428222656, -2.6309187412261963, -2.524285078048706, -2.4176511764526367, -2.3110172748565674, -2.204383373260498, -2.097749710083008, -1.9911158084869385, -1.8844820261001587, -1.777848243713379, -1.6712143421173096, -1.5645805597305298, -1.45794677734375, -1.3513128757476807, -1.2446790933609009, -1.138045310974121, -1.0314114093780518, -0.9247775673866272, -0.8181437253952026, -0.7115099430084229, -0.6048761010169983, -0.49824225902557373, -0.39160847663879395, -0.2849746346473694, -0.17834079265594482, -0.07170696556568146, 0.03492686152458191, 0.14156067371368408, 0.24819451570510864, 0.3548283576965332, 0.461462140083313, 0.5680959820747375, 0.6747298240661621, 0.7813636660575867, 0.8879975080490112, 0.994631290435791, 1.1012651920318604, 1.2078989744186401, 1.31453275680542, 1.4211666584014893, 1.527800440788269, 1.6344342231750488, 1.7410681247711182, 1.847701907157898, 1.9543356895446777, 2.060969591140747, 2.1676034927368164, 2.2742371559143066, 2.380871057510376, 2.4875049591064453, 2.5941386222839355, 2.700772523880005, 2.807406425476074, 2.9140400886535645, 3.020673990249634, 3.127307891845703, 3.2339415550231934, 3.3405754566192627, 3.447209119796753, 3.5538430213928223, 3.6604769229888916, 3.767110824584961, 3.873744487762451, 3.9803783893585205, 4.08701229095459]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 5.0, 14.0, 9.0, 10.0, 18.0, 16.0, 14.0, 21.0, 21.0, 18.0, 22.0, 26.0, 35.0, 33.0, 34.0, 51.0, 61.0, 70.0, 74.0, 56.0, 34.0, 37.0, 32.0, 26.0, 24.0, 28.0, 33.0, 17.0, 22.0, 22.0, 15.0, 12.0, 11.0, 13.0, 8.0, 3.0, 7.0, 1.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2538459300994873, -1.2100763320922852, -1.166306734085083, -1.1225371360778809, -1.0787675380706787, -1.0349980592727661, -0.991228461265564, -0.9474588632583618, -0.9036892652511597, -0.8599196672439575, -0.8161500692367554, -0.772380530834198, -0.7286109328269958, -0.6848413348197937, -0.6410717964172363, -0.5973021984100342, -0.553532600402832, -0.5097630023956299, -0.4659934341907501, -0.42222386598587036, -0.3784542679786682, -0.33468466997146606, -0.2909151017665863, -0.24714553356170654, -0.2033759355545044, -0.15960635244846344, -0.11583676934242249, -0.07206718623638153, -0.028297603130340576, 0.015471979975700378, 0.05924156308174133, 0.1030111312866211, 0.1467806100845337, 0.19055019319057465, 0.2343197762966156, 0.27808934450149536, 0.3218589425086975, 0.36562854051589966, 0.4093981087207794, 0.4531676769256592, 0.49693727493286133, 0.5407068729400635, 0.5844764709472656, 0.628246009349823, 0.6720156073570251, 0.7157852053642273, 0.7595547437667847, 0.8033243417739868, 0.847093939781189, 0.8908635377883911, 0.9346331357955933, 0.9784026741981506, 1.022172212600708, 1.0659418106079102, 1.1097114086151123, 1.1534810066223145, 1.1972506046295166, 1.2410202026367188, 1.284789800643921, 1.328559398651123, 1.3723289966583252, 1.4160984754562378, 1.45986807346344, 1.503637671470642, 1.5474072694778442]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 13.0, 19.0, 26.0, 21.0, 31.0, 57.0, 70.0, 113.0, 138.0, 191.0, 272.0, 409.0, 597.0, 963.0, 1511.0, 2377.0, 4111.0, 8094.0, 18621.0, 60593.0, 405781.0, 2748572.0, 797447.0, 96909.0, 24514.0, 10060.0, 4963.0, 2840.0, 1659.0, 1068.0, 669.0, 447.0, 315.0, 208.0, 181.0, 110.0, 82.0, 61.0, 47.0, 27.0, 31.0, 11.0, 15.0, 7.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0], "bins": [-0.140625, -0.13603591918945312, -0.13144683837890625, -0.12685775756835938, -0.1222686767578125, -0.11767959594726562, -0.11309051513671875, -0.10850143432617188, -0.103912353515625, -0.09932327270507812, -0.09473419189453125, -0.09014511108398438, -0.0855560302734375, -0.08096694946289062, -0.07637786865234375, -0.07178878784179688, -0.06719970703125, -0.06261062622070312, -0.05802154541015625, -0.053432464599609375, -0.0488433837890625, -0.044254302978515625, -0.03966522216796875, -0.035076141357421875, -0.030487060546875, -0.025897979736328125, -0.02130889892578125, -0.016719818115234375, -0.0121307373046875, -0.007541656494140625, -0.00295257568359375, 0.001636505126953125, 0.0062255859375, 0.010814666748046875, 0.01540374755859375, 0.019992828369140625, 0.0245819091796875, 0.029170989990234375, 0.03376007080078125, 0.038349151611328125, 0.042938232421875, 0.047527313232421875, 0.05211639404296875, 0.056705474853515625, 0.0612945556640625, 0.06588363647460938, 0.07047271728515625, 0.07506179809570312, 0.07965087890625, 0.08423995971679688, 0.08882904052734375, 0.09341812133789062, 0.0980072021484375, 0.10259628295898438, 0.10718536376953125, 0.11177444458007812, 0.116363525390625, 0.12095260620117188, 0.12554168701171875, 0.13013076782226562, 0.1347198486328125, 0.13930892944335938, 0.14389801025390625, 0.14848709106445312, 0.153076171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 8.0, 3.0, 8.0, 8.0, 6.0, 14.0, 11.0, 26.0, 23.0, 24.0, 21.0, 40.0, 33.0, 48.0, 43.0, 54.0, 51.0, 55.0, 46.0, 48.0, 60.0, 43.0, 50.0, 44.0, 48.0, 29.0, 33.0, 21.0, 17.0, 14.0, 12.0, 9.0, 9.0, 10.0, 6.0, 4.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09100341796875, -0.08842849731445312, -0.08585357666015625, -0.08327865600585938, -0.0807037353515625, -0.07812881469726562, -0.07555389404296875, -0.07297897338867188, -0.070404052734375, -0.06782913208007812, -0.06525421142578125, -0.06267929077148438, -0.0601043701171875, -0.057529449462890625, -0.05495452880859375, -0.052379608154296875, -0.0498046875, -0.047229766845703125, -0.04465484619140625, -0.042079925537109375, -0.0395050048828125, -0.036930084228515625, -0.03435516357421875, -0.031780242919921875, -0.029205322265625, -0.026630401611328125, -0.02405548095703125, -0.021480560302734375, -0.0189056396484375, -0.016330718994140625, -0.01375579833984375, -0.011180877685546875, -0.00860595703125, -0.006031036376953125, -0.00345611572265625, -0.000881195068359375, 0.0016937255859375, 0.004268646240234375, 0.00684356689453125, 0.009418487548828125, 0.011993408203125, 0.014568328857421875, 0.01714324951171875, 0.019718170166015625, 0.0222930908203125, 0.024868011474609375, 0.02744293212890625, 0.030017852783203125, 0.0325927734375, 0.035167694091796875, 0.03774261474609375, 0.040317535400390625, 0.0428924560546875, 0.045467376708984375, 0.04804229736328125, 0.050617218017578125, 0.053192138671875, 0.055767059326171875, 0.05834197998046875, 0.060916900634765625, 0.0634918212890625, 0.06606674194335938, 0.06864166259765625, 0.07121658325195312, 0.07379150390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 4.0, 10.0, 3.0, 10.0, 14.0, 17.0, 26.0, 33.0, 51.0, 57.0, 95.0, 107.0, 175.0, 278.0, 664.0, 2159.0, 12609.0, 672672.0, 3479718.0, 20752.0, 2953.0, 802.0, 383.0, 204.0, 133.0, 75.0, 59.0, 46.0, 39.0, 26.0, 17.0, 16.0, 13.0, 12.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.80126953125, -0.7784423828125, -0.755615234375, -0.7327880859375, -0.7099609375, -0.6871337890625, -0.664306640625, -0.6414794921875, -0.61865234375, -0.5958251953125, -0.572998046875, -0.5501708984375, -0.52734375, -0.5045166015625, -0.481689453125, -0.4588623046875, -0.43603515625, -0.4132080078125, -0.390380859375, -0.3675537109375, -0.3447265625, -0.3218994140625, -0.299072265625, -0.2762451171875, -0.25341796875, -0.2305908203125, -0.207763671875, -0.1849365234375, -0.162109375, -0.1392822265625, -0.116455078125, -0.0936279296875, -0.07080078125, -0.0479736328125, -0.025146484375, -0.0023193359375, 0.0205078125, 0.0433349609375, 0.066162109375, 0.0889892578125, 0.11181640625, 0.1346435546875, 0.157470703125, 0.1802978515625, 0.203125, 0.2259521484375, 0.248779296875, 0.2716064453125, 0.29443359375, 0.3172607421875, 0.340087890625, 0.3629150390625, 0.3857421875, 0.4085693359375, 0.431396484375, 0.4542236328125, 0.47705078125, 0.4998779296875, 0.522705078125, 0.5455322265625, 0.568359375, 0.5911865234375, 0.614013671875, 0.6368408203125, 0.65966796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 16.0, 22.0, 28.0, 49.0, 109.0, 295.0, 1103.0, 1575.0, 506.0, 180.0, 69.0, 38.0, 23.0, 23.0, 11.0, 6.0, 1.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58154296875, -0.565032958984375, -0.54852294921875, -0.532012939453125, -0.5155029296875, -0.498992919921875, -0.48248291015625, -0.465972900390625, -0.449462890625, -0.432952880859375, -0.41644287109375, -0.399932861328125, -0.3834228515625, -0.366912841796875, -0.35040283203125, -0.333892822265625, -0.3173828125, -0.300872802734375, -0.28436279296875, -0.267852783203125, -0.2513427734375, -0.234832763671875, -0.21832275390625, -0.201812744140625, -0.185302734375, -0.168792724609375, -0.15228271484375, -0.135772705078125, -0.1192626953125, -0.102752685546875, -0.08624267578125, -0.069732666015625, -0.05322265625, -0.036712646484375, -0.02020263671875, -0.003692626953125, 0.0128173828125, 0.029327392578125, 0.04583740234375, 0.062347412109375, 0.078857421875, 0.095367431640625, 0.11187744140625, 0.128387451171875, 0.1448974609375, 0.161407470703125, 0.17791748046875, 0.194427490234375, 0.2109375, 0.227447509765625, 0.24395751953125, 0.260467529296875, 0.2769775390625, 0.293487548828125, 0.30999755859375, 0.326507568359375, 0.343017578125, 0.359527587890625, 0.37603759765625, 0.392547607421875, 0.4090576171875, 0.425567626953125, 0.44207763671875, 0.458587646484375, 0.47509765625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 9.0, 14.0, 19.0, 20.0, 70.0, 111.0, 193.0, 216.0, 147.0, 74.0, 47.0, 28.0, 24.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.669887542724609, -4.550622463226318, -4.4313578605651855, -4.3120927810668945, -4.1928277015686035, -4.073563098907471, -3.9542980194091797, -3.8350331783294678, -3.715768337249756, -3.596503496170044, -3.477238416671753, -3.357973575592041, -3.238708734512329, -3.119443893432617, -3.000178813934326, -2.8809139728546143, -2.7616488933563232, -2.6423840522766113, -2.5231189727783203, -2.4038541316986084, -2.2845892906188965, -2.1653242111206055, -2.0460593700408936, -1.9267945289611816, -1.8075295686721802, -1.6882646083831787, -1.5689997673034668, -1.4497348070144653, -1.3304698467254639, -1.211205005645752, -1.0919400453567505, -0.9726751446723938, -0.8534104824066162, -0.7341455817222595, -0.6148806810379028, -0.49561572074890137, -0.3763508200645447, -0.257085919380188, -0.13782095909118652, -0.018556058406829834, 0.10070884227752686, 0.21997375786304474, 0.3392386734485626, 0.4585036039352417, 0.5777685046195984, 0.6970334053039551, 0.8162983655929565, 0.9355632662773132, 1.05482816696167, 1.1740931272506714, 1.2933579683303833, 1.4126229286193848, 1.5318877696990967, 1.6511527299880981, 1.7704176902770996, 1.8896825313568115, 2.0089473724365234, 2.1282122135162354, 2.2474772930145264, 2.3667421340942383, 2.48600697517395, 2.605271816253662, 2.724536895751953, 2.843801736831665, 2.963066816329956]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 8.0, 11.0, 22.0, 23.0, 25.0, 29.0, 42.0, 34.0, 50.0, 56.0, 63.0, 62.0, 71.0, 72.0, 62.0, 72.0, 53.0, 53.0, 50.0, 24.0, 33.0, 18.0, 19.0, 10.0, 7.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1675922870635986, -1.113559603691101, -1.059527039527893, -1.0054943561553955, -0.9514617919921875, -0.8974291086196899, -0.8433965444564819, -0.7893638610839844, -0.7353312969207764, -0.6812986731529236, -0.6272660493850708, -0.573233425617218, -0.5192008018493652, -0.46516814827919006, -0.4111355245113373, -0.3571029007434845, -0.3030702471733093, -0.24903762340545654, -0.19500499963760376, -0.14097236096858978, -0.086939737200737, -0.03290709853172302, 0.02112552523612976, 0.07515814900398254, 0.12919077277183533, 0.1832233965396881, 0.2372560203075409, 0.29128867387771606, 0.34532129764556885, 0.39935392141342163, 0.4533865451812744, 0.5074191689491272, 0.56145179271698, 0.6154844164848328, 0.6695170402526855, 0.7235496640205383, 0.7775822877883911, 0.8316149711608887, 0.8856475353240967, 0.9396802186965942, 0.9937127828598022, 1.0477454662322998, 1.1017780303955078, 1.1558107137680054, 1.2098432779312134, 1.263875961303711, 1.317908525466919, 1.3719412088394165, 1.425973892211914, 1.4800065755844116, 1.5340391397476196, 1.5880718231201172, 1.6421043872833252, 1.6961370706558228, 1.7501696348190308, 1.8042023181915283, 1.8582348823547363, 1.9122675657272339, 1.966300129890442, 2.0203328132629395, 2.0743653774261475, 2.1283979415893555, 2.1824307441711426, 2.2364633083343506, 2.2904958724975586]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 13.0, 29.0, 28.0, 65.0, 63.0, 101.0, 186.0, 244.0, 400.0, 693.0, 1083.0, 1919.0, 3321.0, 5794.0, 11421.0, 22678.0, 46795.0, 102533.0, 221731.0, 299569.0, 175500.0, 78899.0, 36812.0, 17843.0, 9172.0, 4868.0, 2698.0, 1622.0, 892.0, 583.0, 357.0, 213.0, 137.0, 92.0, 70.0, 39.0, 36.0, 14.0, 12.0, 11.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1531982421875, -0.14898204803466797, -0.14476585388183594, -0.1405496597290039, -0.13633346557617188, -0.13211727142333984, -0.1279010772705078, -0.12368488311767578, -0.11946868896484375, -0.11525249481201172, -0.11103630065917969, -0.10682010650634766, -0.10260391235351562, -0.0983877182006836, -0.09417152404785156, -0.08995532989501953, -0.0857391357421875, -0.08152294158935547, -0.07730674743652344, -0.0730905532836914, -0.06887435913085938, -0.06465816497802734, -0.06044197082519531, -0.05622577667236328, -0.05200958251953125, -0.04779338836669922, -0.04357719421386719, -0.039361000061035156, -0.035144805908203125, -0.030928611755371094, -0.026712417602539062, -0.02249622344970703, -0.018280029296875, -0.014063835144042969, -0.009847640991210938, -0.005631446838378906, -0.001415252685546875, 0.0028009414672851562, 0.0070171356201171875, 0.011233329772949219, 0.01544952392578125, 0.01966571807861328, 0.023881912231445312, 0.028098106384277344, 0.032314300537109375, 0.036530494689941406, 0.04074668884277344, 0.04496288299560547, 0.0491790771484375, 0.05339527130126953, 0.05761146545410156, 0.061827659606933594, 0.06604385375976562, 0.07026004791259766, 0.07447624206542969, 0.07869243621826172, 0.08290863037109375, 0.08712482452392578, 0.09134101867675781, 0.09555721282958984, 0.09977340698242188, 0.1039896011352539, 0.10820579528808594, 0.11242198944091797, 0.11663818359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 7.0, 8.0, 5.0, 11.0, 14.0, 13.0, 15.0, 27.0, 23.0, 31.0, 26.0, 38.0, 35.0, 61.0, 46.0, 45.0, 47.0, 48.0, 49.0, 62.0, 45.0, 51.0, 45.0, 37.0, 30.0, 39.0, 25.0, 22.0, 19.0, 15.0, 3.0, 16.0, 9.0, 9.0, 3.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08953857421875, -0.08631229400634766, -0.08308601379394531, -0.07985973358154297, -0.07663345336914062, -0.07340717315673828, -0.07018089294433594, -0.0669546127319336, -0.06372833251953125, -0.060502052307128906, -0.05727577209472656, -0.05404949188232422, -0.050823211669921875, -0.04759693145751953, -0.04437065124511719, -0.041144371032714844, -0.0379180908203125, -0.034691810607910156, -0.03146553039550781, -0.02823925018310547, -0.025012969970703125, -0.02178668975830078, -0.018560409545898438, -0.015334129333496094, -0.01210784912109375, -0.008881568908691406, -0.0056552886962890625, -0.0024290084838867188, 0.000797271728515625, 0.004023551940917969, 0.0072498321533203125, 0.010476112365722656, 0.013702392578125, 0.016928672790527344, 0.020154953002929688, 0.02338123321533203, 0.026607513427734375, 0.02983379364013672, 0.03306007385253906, 0.036286354064941406, 0.03951263427734375, 0.042738914489746094, 0.04596519470214844, 0.04919147491455078, 0.052417755126953125, 0.05564403533935547, 0.05887031555175781, 0.062096595764160156, 0.0653228759765625, 0.06854915618896484, 0.07177543640136719, 0.07500171661376953, 0.07822799682617188, 0.08145427703857422, 0.08468055725097656, 0.0879068374633789, 0.09113311767578125, 0.0943593978881836, 0.09758567810058594, 0.10081195831298828, 0.10403823852539062, 0.10726451873779297, 0.11049079895019531, 0.11371707916259766, 0.116943359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 3.0, 28.0, 12.0, 18.0, 29.0, 65.0, 77.0, 133.0, 186.0, 340.0, 584.0, 1356.0, 4369.0, 22364.0, 252370.0, 711610.0, 44519.0, 6787.0, 1844.0, 754.0, 397.0, 231.0, 139.0, 80.0, 79.0, 43.0, 36.0, 21.0, 18.0, 15.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.55810546875, -0.5417671203613281, -0.5254287719726562, -0.5090904235839844, -0.4927520751953125, -0.4764137268066406, -0.46007537841796875, -0.4437370300292969, -0.427398681640625, -0.4110603332519531, -0.39472198486328125, -0.3783836364746094, -0.3620452880859375, -0.3457069396972656, -0.32936859130859375, -0.3130302429199219, -0.29669189453125, -0.2803535461425781, -0.26401519775390625, -0.24767684936523438, -0.2313385009765625, -0.21500015258789062, -0.19866180419921875, -0.18232345581054688, -0.165985107421875, -0.14964675903320312, -0.13330841064453125, -0.11697006225585938, -0.1006317138671875, -0.08429336547851562, -0.06795501708984375, -0.051616668701171875, -0.0352783203125, -0.018939971923828125, -0.00260162353515625, 0.013736724853515625, 0.0300750732421875, 0.046413421630859375, 0.06275177001953125, 0.07909011840820312, 0.095428466796875, 0.11176681518554688, 0.12810516357421875, 0.14444351196289062, 0.1607818603515625, 0.17712020874023438, 0.19345855712890625, 0.20979690551757812, 0.22613525390625, 0.24247360229492188, 0.25881195068359375, 0.2751502990722656, 0.2914886474609375, 0.3078269958496094, 0.32416534423828125, 0.3405036926269531, 0.356842041015625, 0.3731803894042969, 0.38951873779296875, 0.4058570861816406, 0.4221954345703125, 0.4385337829589844, 0.45487213134765625, 0.4712104797363281, 0.487548828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 9.0, 11.0, 16.0, 18.0, 12.0, 20.0, 30.0, 36.0, 42.0, 34.0, 43.0, 57.0, 45.0, 73.0, 53.0, 54.0, 50.0, 52.0, 46.0, 32.0, 43.0, 34.0, 26.0, 21.0, 24.0, 36.0, 16.0, 9.0, 8.0, 7.0, 4.0, 8.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.478759765625, -0.4642448425292969, -0.44972991943359375, -0.4352149963378906, -0.4207000732421875, -0.4061851501464844, -0.39167022705078125, -0.3771553039550781, -0.362640380859375, -0.3481254577636719, -0.33361053466796875, -0.3190956115722656, -0.3045806884765625, -0.2900657653808594, -0.27555084228515625, -0.2610359191894531, -0.24652099609375, -0.23200607299804688, -0.21749114990234375, -0.20297622680664062, -0.1884613037109375, -0.17394638061523438, -0.15943145751953125, -0.14491653442382812, -0.130401611328125, -0.11588668823242188, -0.10137176513671875, -0.08685684204101562, -0.0723419189453125, -0.057826995849609375, -0.04331207275390625, -0.028797149658203125, -0.0142822265625, 0.000232696533203125, 0.01474761962890625, 0.029262542724609375, 0.0437774658203125, 0.058292388916015625, 0.07280731201171875, 0.08732223510742188, 0.101837158203125, 0.11635208129882812, 0.13086700439453125, 0.14538192749023438, 0.1598968505859375, 0.17441177368164062, 0.18892669677734375, 0.20344161987304688, 0.21795654296875, 0.23247146606445312, 0.24698638916015625, 0.2615013122558594, 0.2760162353515625, 0.2905311584472656, 0.30504608154296875, 0.3195610046386719, 0.334075927734375, 0.3485908508300781, 0.36310577392578125, 0.3776206970214844, 0.3921356201171875, 0.4066505432128906, 0.42116546630859375, 0.4356803894042969, 0.4501953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 8.0, 4.0, 14.0, 18.0, 20.0, 43.0, 49.0, 65.0, 129.0, 198.0, 423.0, 986.0, 2569.0, 7651.0, 29562.0, 192845.0, 734687.0, 59529.0, 13081.0, 3928.0, 1457.0, 609.0, 267.0, 151.0, 86.0, 49.0, 34.0, 21.0, 17.0, 8.0, 11.0, 12.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.277587890625, -0.2694740295410156, -0.26136016845703125, -0.2532463073730469, -0.2451324462890625, -0.23701858520507812, -0.22890472412109375, -0.22079086303710938, -0.212677001953125, -0.20456314086914062, -0.19644927978515625, -0.18833541870117188, -0.1802215576171875, -0.17210769653320312, -0.16399383544921875, -0.15587997436523438, -0.14776611328125, -0.13965225219726562, -0.13153839111328125, -0.12342453002929688, -0.1153106689453125, -0.10719680786132812, -0.09908294677734375, -0.09096908569335938, -0.082855224609375, -0.07474136352539062, -0.06662750244140625, -0.058513641357421875, -0.0503997802734375, -0.042285919189453125, -0.03417205810546875, -0.026058197021484375, -0.0179443359375, -0.009830474853515625, -0.00171661376953125, 0.006397247314453125, 0.0145111083984375, 0.022624969482421875, 0.03073883056640625, 0.038852691650390625, 0.046966552734375, 0.055080413818359375, 0.06319427490234375, 0.07130813598632812, 0.0794219970703125, 0.08753585815429688, 0.09564971923828125, 0.10376358032226562, 0.11187744140625, 0.11999130249023438, 0.12810516357421875, 0.13621902465820312, 0.1443328857421875, 0.15244674682617188, 0.16056060791015625, 0.16867446899414062, 0.176788330078125, 0.18490219116210938, 0.19301605224609375, 0.20112991333007812, 0.2092437744140625, 0.21735763549804688, 0.22547149658203125, 0.23358535766601562, 0.24169921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 6.0, 3.0, 9.0, 11.0, 11.0, 15.0, 37.0, 49.0, 81.0, 144.0, 216.0, 148.0, 79.0, 59.0, 27.0, 20.0, 22.0, 11.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00011152029037475586, -0.00010798312723636627, -0.00010444596409797668, -0.0001009088009595871, -9.737163782119751e-05, -9.383447468280792e-05, -9.029731154441833e-05, -8.676014840602875e-05, -8.322298526763916e-05, -7.968582212924957e-05, -7.614865899085999e-05, -7.26114958524704e-05, -6.907433271408081e-05, -6.553716957569122e-05, -6.200000643730164e-05, -5.846284329891205e-05, -5.492568016052246e-05, -5.1388517022132874e-05, -4.7851353883743286e-05, -4.43141907453537e-05, -4.077702760696411e-05, -3.7239864468574524e-05, -3.3702701330184937e-05, -3.016553819179535e-05, -2.6628375053405762e-05, -2.3091211915016174e-05, -1.9554048776626587e-05, -1.6016885638237e-05, -1.2479722499847412e-05, -8.942559361457825e-06, -5.405396223068237e-06, -1.86823308467865e-06, 1.6689300537109375e-06, 5.206093192100525e-06, 8.743256330490112e-06, 1.22804194688797e-05, 1.5817582607269287e-05, 1.9354745745658875e-05, 2.2891908884048462e-05, 2.642907202243805e-05, 2.9966235160827637e-05, 3.3503398299217224e-05, 3.704056143760681e-05, 4.05777245759964e-05, 4.4114887714385986e-05, 4.7652050852775574e-05, 5.118921399116516e-05, 5.472637712955475e-05, 5.8263540267944336e-05, 6.180070340633392e-05, 6.533786654472351e-05, 6.88750296831131e-05, 7.241219282150269e-05, 7.594935595989227e-05, 7.948651909828186e-05, 8.302368223667145e-05, 8.656084537506104e-05, 9.009800851345062e-05, 9.363517165184021e-05, 9.71723347902298e-05, 0.00010070949792861938, 0.00010424666106700897, 0.00010778382420539856, 0.00011132098734378815, 0.00011485815048217773]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 11.0, 17.0, 13.0, 23.0, 31.0, 33.0, 64.0, 85.0, 124.0, 293.0, 557.0, 1243.0, 2935.0, 8023.0, 24596.0, 103818.0, 731502.0, 130705.0, 29196.0, 9176.0, 3309.0, 1329.0, 673.0, 311.0, 154.0, 100.0, 59.0, 43.0, 26.0, 23.0, 16.0, 18.0, 8.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1988525390625, -0.1925525665283203, -0.18625259399414062, -0.17995262145996094, -0.17365264892578125, -0.16735267639160156, -0.16105270385742188, -0.1547527313232422, -0.1484527587890625, -0.1421527862548828, -0.13585281372070312, -0.12955284118652344, -0.12325286865234375, -0.11695289611816406, -0.11065292358398438, -0.10435295104980469, -0.098052978515625, -0.09175300598144531, -0.08545303344726562, -0.07915306091308594, -0.07285308837890625, -0.06655311584472656, -0.060253143310546875, -0.05395317077636719, -0.0476531982421875, -0.04135322570800781, -0.035053253173828125, -0.028753280639648438, -0.02245330810546875, -0.016153335571289062, -0.009853363037109375, -0.0035533905029296875, 0.00274658203125, 0.009046554565429688, 0.015346527099609375, 0.021646499633789062, 0.02794647216796875, 0.03424644470214844, 0.040546417236328125, 0.04684638977050781, 0.0531463623046875, 0.05944633483886719, 0.06574630737304688, 0.07204627990722656, 0.07834625244140625, 0.08464622497558594, 0.09094619750976562, 0.09724617004394531, 0.103546142578125, 0.10984611511230469, 0.11614608764648438, 0.12244606018066406, 0.12874603271484375, 0.13504600524902344, 0.14134597778320312, 0.1476459503173828, 0.1539459228515625, 0.1602458953857422, 0.16654586791992188, 0.17284584045410156, 0.17914581298828125, 0.18544578552246094, 0.19174575805664062, 0.1980457305908203, 0.204345703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 5.0, 7.0, 11.0, 6.0, 12.0, 14.0, 12.0, 22.0, 22.0, 21.0, 31.0, 44.0, 50.0, 75.0, 118.0, 104.0, 94.0, 78.0, 51.0, 31.0, 32.0, 18.0, 25.0, 16.0, 15.0, 15.0, 12.0, 7.0, 7.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1434326171875, -0.1390094757080078, -0.13458633422851562, -0.13016319274902344, -0.12574005126953125, -0.12131690979003906, -0.11689376831054688, -0.11247062683105469, -0.1080474853515625, -0.10362434387207031, -0.09920120239257812, -0.09477806091308594, -0.09035491943359375, -0.08593177795410156, -0.08150863647460938, -0.07708549499511719, -0.072662353515625, -0.06823921203613281, -0.06381607055664062, -0.05939292907714844, -0.05496978759765625, -0.05054664611816406, -0.046123504638671875, -0.04170036315917969, -0.0372772216796875, -0.03285408020019531, -0.028430938720703125, -0.024007797241210938, -0.01958465576171875, -0.015161514282226562, -0.010738372802734375, -0.0063152313232421875, -0.00189208984375, 0.0025310516357421875, 0.006954193115234375, 0.011377334594726562, 0.01580047607421875, 0.020223617553710938, 0.024646759033203125, 0.029069900512695312, 0.0334930419921875, 0.03791618347167969, 0.042339324951171875, 0.04676246643066406, 0.05118560791015625, 0.05560874938964844, 0.060031890869140625, 0.06445503234863281, 0.068878173828125, 0.07330131530761719, 0.07772445678710938, 0.08214759826660156, 0.08657073974609375, 0.09099388122558594, 0.09541702270507812, 0.09984016418457031, 0.1042633056640625, 0.10868644714355469, 0.11310958862304688, 0.11753273010253906, 0.12195587158203125, 0.12637901306152344, 0.13080215454101562, 0.1352252960205078, 0.1396484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 12.0, 74.0, 275.0, 428.0, 135.0, 43.0, 24.0, 1.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8018062114715576, -2.5485482215881348, -2.295290470123291, -2.042032480239868, -1.7887744903564453, -1.5355165004730225, -1.2822586297988892, -1.0290007591247559, -0.775742769241333, -0.5224848389625549, -0.26922690868377686, -0.01596897840499878, 0.2372889518737793, 0.49054694175720215, 0.7438048124313354, 0.9970626831054688, 1.2503206729888916, 1.5035786628723145, 1.7568365335464478, 2.010094404220581, 2.263352394104004, 2.5166103839874268, 2.7698683738708496, 3.0231261253356934, 3.276384115219116, 3.529642105102539, 3.782899856567383, 4.036158084869385, 4.2894158363342285, 4.5426740646362305, 4.795931816101074, 5.049189567565918, 5.302448272705078, 5.555706024169922, 5.808964252471924, 6.062222003936768, 6.3154802322387695, 6.568737983703613, 6.821995735168457, 7.075253486633301, 7.328511714935303, 7.5817694664001465, 7.835027694702148, 8.088285446166992, 8.341543197631836, 8.59480094909668, 8.84805965423584, 9.101317405700684, 9.354575157165527, 9.607832908630371, 9.861090660095215, 10.114349365234375, 10.367607116699219, 10.620864868164062, 10.874122619628906, 11.12738037109375, 11.380638122558594, 11.633895874023438, 11.887153625488281, 12.140412330627441, 12.393670082092285, 12.646927833557129, 12.900185585021973, 13.153443336486816, 13.406702041625977]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 1.0, 6.0, 9.0, 8.0, 9.0, 14.0, 30.0, 26.0, 22.0, 25.0, 35.0, 53.0, 44.0, 40.0, 100.0, 114.0, 112.0, 45.0, 44.0, 46.0, 45.0, 27.0, 29.0, 29.0, 22.0, 16.0, 20.0, 11.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0957438945770264, -2.0195343494415283, -1.9433245658874512, -1.8671149015426636, -1.790905237197876, -1.714695692062378, -1.6384860277175903, -1.5622763633728027, -1.4860666990280151, -1.4098570346832275, -1.33364737033844, -1.2574377059936523, -1.1812281608581543, -1.1050183773040771, -1.028808832168579, -0.9525991678237915, -0.8763895034790039, -0.8001798391342163, -0.7239701747894287, -0.6477605700492859, -0.5715509057044983, -0.4953412413597107, -0.4191316068172455, -0.3429219722747803, -0.2667123079299927, -0.19050265848636627, -0.11429300904273987, -0.038083359599113464, 0.03812628984451294, 0.11433595418930054, 0.19054558873176575, 0.26675522327423096, 0.34296464920043945, 0.41917431354522705, 0.49538394808769226, 0.5715935826301575, 0.6478032469749451, 0.7240129113197327, 0.8002225160598755, 0.8764321804046631, 0.9526418447494507, 1.0288515090942383, 1.1050611734390259, 1.1812708377838135, 1.2574803829193115, 1.3336901664733887, 1.4098997116088867, 1.4861093759536743, 1.562319040298462, 1.6385287046432495, 1.714738368988037, 1.7909480333328247, 1.8671576976776123, 1.9433672428131104, 2.0195770263671875, 2.0957865715026855, 2.1719961166381836, 2.2482056617736816, 2.324415445327759, 2.400624990463257, 2.476834774017334, 2.553044319152832, 2.629254102706909, 2.7054636478424072, 2.7816734313964844]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 12.0, 7.0, 10.0, 20.0, 30.0, 54.0, 64.0, 107.0, 157.0, 280.0, 519.0, 983.0, 2240.0, 5065.0, 15062.0, 66325.0, 848387.0, 2936853.0, 267473.0, 34009.0, 9568.0, 3584.0, 1615.0, 787.0, 414.0, 236.0, 129.0, 83.0, 61.0, 32.0, 21.0, 34.0, 12.0, 9.0, 11.0, 2.0, 0.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2451171875, -0.23797035217285156, -0.23082351684570312, -0.2236766815185547, -0.21652984619140625, -0.2093830108642578, -0.20223617553710938, -0.19508934020996094, -0.1879425048828125, -0.18079566955566406, -0.17364883422851562, -0.1665019989013672, -0.15935516357421875, -0.1522083282470703, -0.14506149291992188, -0.13791465759277344, -0.130767822265625, -0.12362098693847656, -0.11647415161132812, -0.10932731628417969, -0.10218048095703125, -0.09503364562988281, -0.08788681030273438, -0.08073997497558594, -0.0735931396484375, -0.06644630432128906, -0.059299468994140625, -0.05215263366699219, -0.04500579833984375, -0.03785896301269531, -0.030712127685546875, -0.023565292358398438, -0.01641845703125, -0.009271621704101562, -0.002124786376953125, 0.0050220489501953125, 0.01216888427734375, 0.019315719604492188, 0.026462554931640625, 0.03360939025878906, 0.0407562255859375, 0.04790306091308594, 0.055049896240234375, 0.06219673156738281, 0.06934356689453125, 0.07649040222167969, 0.08363723754882812, 0.09078407287597656, 0.097930908203125, 0.10507774353027344, 0.11222457885742188, 0.11937141418457031, 0.12651824951171875, 0.1336650848388672, 0.14081192016601562, 0.14795875549316406, 0.1551055908203125, 0.16225242614746094, 0.16939926147460938, 0.1765460968017578, 0.18369293212890625, 0.1908397674560547, 0.19798660278320312, 0.20513343811035156, 0.2122802734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 7.0, 10.0, 6.0, 5.0, 10.0, 13.0, 15.0, 21.0, 17.0, 23.0, 24.0, 37.0, 39.0, 44.0, 41.0, 50.0, 47.0, 46.0, 33.0, 53.0, 44.0, 42.0, 39.0, 53.0, 33.0, 40.0, 19.0, 29.0, 25.0, 19.0, 20.0, 21.0, 14.0, 13.0, 10.0, 13.0, 8.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08544921875, -0.08260726928710938, -0.07976531982421875, -0.07692337036132812, -0.0740814208984375, -0.07123947143554688, -0.06839752197265625, -0.06555557250976562, -0.062713623046875, -0.059871673583984375, -0.05702972412109375, -0.054187774658203125, -0.0513458251953125, -0.048503875732421875, -0.04566192626953125, -0.042819976806640625, -0.03997802734375, -0.037136077880859375, -0.03429412841796875, -0.031452178955078125, -0.0286102294921875, -0.025768280029296875, -0.02292633056640625, -0.020084381103515625, -0.017242431640625, -0.014400482177734375, -0.01155853271484375, -0.008716583251953125, -0.0058746337890625, -0.003032684326171875, -0.00019073486328125, 0.002651214599609375, 0.0054931640625, 0.008335113525390625, 0.01117706298828125, 0.014019012451171875, 0.0168609619140625, 0.019702911376953125, 0.02254486083984375, 0.025386810302734375, 0.028228759765625, 0.031070709228515625, 0.03391265869140625, 0.036754608154296875, 0.0395965576171875, 0.042438507080078125, 0.04528045654296875, 0.048122406005859375, 0.05096435546875, 0.053806304931640625, 0.05664825439453125, 0.059490203857421875, 0.0623321533203125, 0.06517410278320312, 0.06801605224609375, 0.07085800170898438, 0.073699951171875, 0.07654190063476562, 0.07938385009765625, 0.08222579956054688, 0.0850677490234375, 0.08790969848632812, 0.09075164794921875, 0.09359359741210938, 0.096435546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 4.0, 2.0, 7.0, 8.0, 5.0, 20.0, 22.0, 27.0, 36.0, 45.0, 51.0, 72.0, 80.0, 108.0, 163.0, 257.0, 443.0, 971.0, 3392.0, 26400.0, 3642148.0, 503717.0, 12265.0, 2141.0, 752.0, 355.0, 202.0, 136.0, 125.0, 86.0, 58.0, 63.0, 31.0, 29.0, 26.0, 16.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.56329345703125, -0.5396728515625, -0.51605224609375, -0.492431640625, -0.46881103515625, -0.4451904296875, -0.42156982421875, -0.39794921875, -0.37432861328125, -0.3507080078125, -0.32708740234375, -0.303466796875, -0.27984619140625, -0.2562255859375, -0.23260498046875, -0.208984375, -0.18536376953125, -0.1617431640625, -0.13812255859375, -0.114501953125, -0.09088134765625, -0.0672607421875, -0.04364013671875, -0.02001953125, 0.00360107421875, 0.0272216796875, 0.05084228515625, 0.074462890625, 0.09808349609375, 0.1217041015625, 0.14532470703125, 0.1689453125, 0.19256591796875, 0.2161865234375, 0.23980712890625, 0.263427734375, 0.28704833984375, 0.3106689453125, 0.33428955078125, 0.35791015625, 0.38153076171875, 0.4051513671875, 0.42877197265625, 0.452392578125, 0.47601318359375, 0.4996337890625, 0.52325439453125, 0.546875, 0.57049560546875, 0.5941162109375, 0.61773681640625, 0.641357421875, 0.66497802734375, 0.6885986328125, 0.71221923828125, 0.73583984375, 0.75946044921875, 0.7830810546875, 0.80670166015625, 0.830322265625, 0.85394287109375, 0.8775634765625, 0.90118408203125, 0.9248046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 9.0, 8.0, 22.0, 18.0, 28.0, 37.0, 65.0, 89.0, 168.0, 351.0, 686.0, 968.0, 729.0, 382.0, 175.0, 97.0, 76.0, 44.0, 22.0, 23.0, 14.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40234375, -0.3907012939453125, -0.379058837890625, -0.3674163818359375, -0.35577392578125, -0.3441314697265625, -0.332489013671875, -0.3208465576171875, -0.3092041015625, -0.2975616455078125, -0.285919189453125, -0.2742767333984375, -0.26263427734375, -0.2509918212890625, -0.239349365234375, -0.2277069091796875, -0.216064453125, -0.2044219970703125, -0.192779541015625, -0.1811370849609375, -0.16949462890625, -0.1578521728515625, -0.146209716796875, -0.1345672607421875, -0.1229248046875, -0.1112823486328125, -0.099639892578125, -0.0879974365234375, -0.07635498046875, -0.0647125244140625, -0.053070068359375, -0.0414276123046875, -0.02978515625, -0.0181427001953125, -0.006500244140625, 0.0051422119140625, 0.01678466796875, 0.0284271240234375, 0.040069580078125, 0.0517120361328125, 0.0633544921875, 0.0749969482421875, 0.086639404296875, 0.0982818603515625, 0.10992431640625, 0.1215667724609375, 0.133209228515625, 0.1448516845703125, 0.156494140625, 0.1681365966796875, 0.179779052734375, 0.1914215087890625, 0.20306396484375, 0.2147064208984375, 0.226348876953125, 0.2379913330078125, 0.2496337890625, 0.2612762451171875, 0.272918701171875, 0.2845611572265625, 0.29620361328125, 0.3078460693359375, 0.319488525390625, 0.3311309814453125, 0.3427734375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 3.0, 3.0, 8.0, 8.0, 6.0, 8.0, 23.0, 34.0, 35.0, 42.0, 74.0, 110.0, 148.0, 142.0, 114.0, 82.0, 54.0, 37.0, 20.0, 14.0, 9.0, 4.0, 2.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2938127517700195, -3.191105604171753, -3.0883984565734863, -2.9856910705566406, -2.882983922958374, -2.7802767753601074, -2.6775693893432617, -2.574862241744995, -2.4721550941467285, -2.369447946548462, -2.2667407989501953, -2.1640334129333496, -2.061326265335083, -1.9586191177368164, -1.8559118509292603, -1.753204584121704, -1.6504974365234375, -1.547790288925171, -1.4450830221176147, -1.3423757553100586, -1.239668607711792, -1.1369614601135254, -1.0342541933059692, -0.9315469861030579, -0.8288397789001465, -0.7261325716972351, -0.6234253644943237, -0.5207181572914124, -0.418010950088501, -0.3153037428855896, -0.21259653568267822, -0.10988932847976685, -0.007182121276855469, 0.09552508592605591, 0.19823229312896729, 0.30093950033187866, 0.40364670753479004, 0.5063539147377014, 0.6090611219406128, 0.7117683291435242, 0.8144755363464355, 0.9171827435493469, 1.0198899507522583, 1.1225972175598145, 1.225304365158081, 1.3280115127563477, 1.4307187795639038, 1.53342604637146, 1.6361331939697266, 1.7388403415679932, 1.8415476083755493, 1.9442548751831055, 2.046962022781372, 2.1496691703796387, 2.2523765563964844, 2.355083703994751, 2.4577908515930176, 2.560497999191284, 2.663205146789551, 2.7659125328063965, 2.868619680404663, 2.9713268280029297, 3.0740342140197754, 3.176741361618042, 3.2794485092163086]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 5.0, 6.0, 4.0, 7.0, 13.0, 16.0, 6.0, 8.0, 16.0, 11.0, 12.0, 11.0, 20.0, 20.0, 24.0, 34.0, 30.0, 41.0, 34.0, 47.0, 38.0, 51.0, 39.0, 46.0, 56.0, 39.0, 40.0, 31.0, 38.0, 28.0, 26.0, 24.0, 33.0, 26.0, 12.0, 17.0, 13.0, 11.0, 11.0, 12.0, 8.0, 7.0, 10.0, 6.0, 2.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2753994464874268, -1.2358005046844482, -1.1962014436721802, -1.1566025018692017, -1.1170034408569336, -1.077404499053955, -1.0378055572509766, -0.9982064962387085, -0.95860755443573, -0.9190085530281067, -0.8794095516204834, -0.8398106098175049, -0.8002116084098816, -0.7606126070022583, -0.721013605594635, -0.6814146041870117, -0.6418156027793884, -0.6022166013717651, -0.5626175999641418, -0.5230185985565186, -0.48341965675354004, -0.44382065534591675, -0.40422165393829346, -0.36462268233299255, -0.32502368092536926, -0.28542467951774597, -0.24582570791244507, -0.20622670650482178, -0.16662771999835968, -0.12702873349189758, -0.08742973208427429, -0.04783076047897339, -0.008231759071350098, 0.0313672311604023, 0.0709662213921547, 0.11056521534919739, 0.15016420185565948, 0.18976318836212158, 0.22936218976974487, 0.2689611613750458, 0.30856016278266907, 0.34815916419029236, 0.38775813579559326, 0.42735713720321655, 0.46695613861083984, 0.5065550804138184, 0.5461541414260864, 0.5857530832290649, 0.6253520846366882, 0.6649510860443115, 0.7045500874519348, 0.7441490888595581, 0.7837480306625366, 0.8233470320701599, 0.8629460334777832, 0.9025449752807617, 0.9421440362930298, 0.9817430377006531, 1.0213420391082764, 1.0609409809112549, 1.100540041923523, 1.1401389837265015, 1.1797380447387695, 1.219336986541748, 1.2589359283447266]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 14.0, 14.0, 23.0, 36.0, 63.0, 85.0, 119.0, 200.0, 388.0, 590.0, 981.0, 1806.0, 3353.0, 6384.0, 13173.0, 28979.0, 72210.0, 203977.0, 400501.0, 192656.0, 68785.0, 28190.0, 12468.0, 6318.0, 3038.0, 1721.0, 957.0, 544.0, 366.0, 217.0, 138.0, 78.0, 68.0, 27.0, 24.0, 14.0, 14.0, 5.0, 11.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.2527046203613281, -0.24515533447265625, -0.23760604858398438, -0.2300567626953125, -0.22250747680664062, -0.21495819091796875, -0.20740890502929688, -0.199859619140625, -0.19231033325195312, -0.18476104736328125, -0.17721176147460938, -0.1696624755859375, -0.16211318969726562, -0.15456390380859375, -0.14701461791992188, -0.13946533203125, -0.13191604614257812, -0.12436676025390625, -0.11681747436523438, -0.1092681884765625, -0.10171890258789062, -0.09416961669921875, -0.08662033081054688, -0.079071044921875, -0.07152175903320312, -0.06397247314453125, -0.056423187255859375, -0.0488739013671875, -0.041324615478515625, -0.03377532958984375, -0.026226043701171875, -0.0186767578125, -0.011127471923828125, -0.00357818603515625, 0.003971099853515625, 0.0115203857421875, 0.019069671630859375, 0.02661895751953125, 0.034168243408203125, 0.041717529296875, 0.049266815185546875, 0.05681610107421875, 0.06436538696289062, 0.0719146728515625, 0.07946395874023438, 0.08701324462890625, 0.09456253051757812, 0.10211181640625, 0.10966110229492188, 0.11721038818359375, 0.12475967407226562, 0.1323089599609375, 0.13985824584960938, 0.14740753173828125, 0.15495681762695312, 0.162506103515625, 0.17005538940429688, 0.17760467529296875, 0.18515396118164062, 0.1927032470703125, 0.20025253295898438, 0.20780181884765625, 0.21535110473632812, 0.222900390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 7.0, 10.0, 6.0, 15.0, 24.0, 8.0, 19.0, 27.0, 21.0, 36.0, 43.0, 52.0, 35.0, 48.0, 41.0, 62.0, 43.0, 57.0, 38.0, 53.0, 44.0, 30.0, 42.0, 26.0, 32.0, 33.0, 21.0, 14.0, 24.0, 16.0, 16.0, 9.0, 8.0, 6.0, 5.0, 1.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10931396484375, -0.1057586669921875, -0.102203369140625, -0.0986480712890625, -0.0950927734375, -0.0915374755859375, -0.087982177734375, -0.0844268798828125, -0.08087158203125, -0.0773162841796875, -0.073760986328125, -0.0702056884765625, -0.066650390625, -0.0630950927734375, -0.059539794921875, -0.0559844970703125, -0.05242919921875, -0.0488739013671875, -0.045318603515625, -0.0417633056640625, -0.0382080078125, -0.0346527099609375, -0.031097412109375, -0.0275421142578125, -0.02398681640625, -0.0204315185546875, -0.016876220703125, -0.0133209228515625, -0.009765625, -0.0062103271484375, -0.002655029296875, 0.0009002685546875, 0.00445556640625, 0.0080108642578125, 0.011566162109375, 0.0151214599609375, 0.0186767578125, 0.0222320556640625, 0.025787353515625, 0.0293426513671875, 0.03289794921875, 0.0364532470703125, 0.040008544921875, 0.0435638427734375, 0.047119140625, 0.0506744384765625, 0.054229736328125, 0.0577850341796875, 0.06134033203125, 0.0648956298828125, 0.068450927734375, 0.0720062255859375, 0.0755615234375, 0.0791168212890625, 0.082672119140625, 0.0862274169921875, 0.08978271484375, 0.0933380126953125, 0.096893310546875, 0.1004486083984375, 0.10400390625, 0.1075592041015625, 0.111114501953125, 0.1146697998046875, 0.11822509765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 12.0, 12.0, 28.0, 29.0, 50.0, 72.0, 97.0, 174.0, 340.0, 725.0, 1615.0, 5325.0, 33512.0, 791607.0, 194290.0, 15124.0, 3246.0, 1067.0, 523.0, 280.0, 134.0, 92.0, 65.0, 27.0, 32.0, 12.0, 17.0, 10.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8671875, -0.8429718017578125, -0.818756103515625, -0.7945404052734375, -0.77032470703125, -0.7461090087890625, -0.721893310546875, -0.6976776123046875, -0.6734619140625, -0.6492462158203125, -0.625030517578125, -0.6008148193359375, -0.57659912109375, -0.5523834228515625, -0.528167724609375, -0.5039520263671875, -0.479736328125, -0.4555206298828125, -0.431304931640625, -0.4070892333984375, -0.38287353515625, -0.3586578369140625, -0.334442138671875, -0.3102264404296875, -0.2860107421875, -0.2617950439453125, -0.237579345703125, -0.2133636474609375, -0.18914794921875, -0.1649322509765625, -0.140716552734375, -0.1165008544921875, -0.09228515625, -0.0680694580078125, -0.043853759765625, -0.0196380615234375, 0.00457763671875, 0.0287933349609375, 0.053009033203125, 0.0772247314453125, 0.1014404296875, 0.1256561279296875, 0.149871826171875, 0.1740875244140625, 0.19830322265625, 0.2225189208984375, 0.246734619140625, 0.2709503173828125, 0.295166015625, 0.3193817138671875, 0.343597412109375, 0.3678131103515625, 0.39202880859375, 0.4162445068359375, 0.440460205078125, 0.4646759033203125, 0.4888916015625, 0.5131072998046875, 0.537322998046875, 0.5615386962890625, 0.58575439453125, 0.6099700927734375, 0.634185791015625, 0.6584014892578125, 0.6826171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 15.0, 23.0, 19.0, 30.0, 29.0, 35.0, 47.0, 48.0, 60.0, 70.0, 85.0, 69.0, 72.0, 76.0, 67.0, 54.0, 31.0, 42.0, 32.0, 24.0, 13.0, 9.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.794921875, -0.7742385864257812, -0.7535552978515625, -0.7328720092773438, -0.712188720703125, -0.6915054321289062, -0.6708221435546875, -0.6501388549804688, -0.62945556640625, -0.6087722778320312, -0.5880889892578125, -0.5674057006835938, -0.546722412109375, -0.5260391235351562, -0.5053558349609375, -0.48467254638671875, -0.4639892578125, -0.44330596923828125, -0.4226226806640625, -0.40193939208984375, -0.381256103515625, -0.36057281494140625, -0.3398895263671875, -0.31920623779296875, -0.29852294921875, -0.27783966064453125, -0.2571563720703125, -0.23647308349609375, -0.215789794921875, -0.19510650634765625, -0.1744232177734375, -0.15373992919921875, -0.133056640625, -0.11237335205078125, -0.0916900634765625, -0.07100677490234375, -0.050323486328125, -0.02964019775390625, -0.0089569091796875, 0.01172637939453125, 0.03240966796875, 0.05309295654296875, 0.0737762451171875, 0.09445953369140625, 0.115142822265625, 0.13582611083984375, 0.1565093994140625, 0.17719268798828125, 0.1978759765625, 0.21855926513671875, 0.2392425537109375, 0.25992584228515625, 0.280609130859375, 0.30129241943359375, 0.3219757080078125, 0.34265899658203125, 0.36334228515625, 0.38402557373046875, 0.4047088623046875, 0.42539215087890625, 0.446075439453125, 0.46675872802734375, 0.4874420166015625, 0.5081253051757812, 0.52880859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 9.0, 8.0, 17.0, 7.0, 22.0, 31.0, 39.0, 36.0, 55.0, 72.0, 112.0, 187.0, 299.0, 442.0, 849.0, 1437.0, 2979.0, 6515.0, 16995.0, 56019.0, 626408.0, 262626.0, 46911.0, 14460.0, 5869.0, 2709.0, 1379.0, 742.0, 447.0, 298.0, 169.0, 117.0, 66.0, 56.0, 39.0, 33.0, 18.0, 15.0, 8.0, 8.0, 11.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.2000732421875, -0.1939983367919922, -0.18792343139648438, -0.18184852600097656, -0.17577362060546875, -0.16969871520996094, -0.16362380981445312, -0.1575489044189453, -0.1514739990234375, -0.1453990936279297, -0.13932418823242188, -0.13324928283691406, -0.12717437744140625, -0.12109947204589844, -0.11502456665039062, -0.10894966125488281, -0.102874755859375, -0.09679985046386719, -0.09072494506835938, -0.08465003967285156, -0.07857513427734375, -0.07250022888183594, -0.06642532348632812, -0.06035041809082031, -0.0542755126953125, -0.04820060729980469, -0.042125701904296875, -0.03605079650878906, -0.02997589111328125, -0.023900985717773438, -0.017826080322265625, -0.011751174926757812, -0.00567626953125, 0.0003986358642578125, 0.006473541259765625, 0.012548446655273438, 0.01862335205078125, 0.024698257446289062, 0.030773162841796875, 0.03684806823730469, 0.0429229736328125, 0.04899787902832031, 0.055072784423828125, 0.06114768981933594, 0.06722259521484375, 0.07329750061035156, 0.07937240600585938, 0.08544731140136719, 0.091522216796875, 0.09759712219238281, 0.10367202758789062, 0.10974693298339844, 0.11582183837890625, 0.12189674377441406, 0.12797164916992188, 0.1340465545654297, 0.1401214599609375, 0.1461963653564453, 0.15227127075195312, 0.15834617614746094, 0.16442108154296875, 0.17049598693847656, 0.17657089233398438, 0.1826457977294922, 0.188720703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 3.0, 12.0, 19.0, 16.0, 21.0, 22.0, 39.0, 61.0, 77.0, 131.0, 179.0, 122.0, 89.0, 60.0, 37.0, 27.0, 20.0, 11.0, 9.0, 8.0, 7.0, 2.0, 7.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013065338134765625, -0.00012673065066337585, -0.00012280791997909546, -0.00011888518929481506, -0.00011496245861053467, -0.00011103972792625427, -0.00010711699724197388, -0.00010319426655769348, -9.927153587341309e-05, -9.534880518913269e-05, -9.14260745048523e-05, -8.75033438205719e-05, -8.35806131362915e-05, -7.965788245201111e-05, -7.573515176773071e-05, -7.181242108345032e-05, -6.788969039916992e-05, -6.396695971488953e-05, -6.004422903060913e-05, -5.6121498346328735e-05, -5.219876766204834e-05, -4.8276036977767944e-05, -4.435330629348755e-05, -4.043057560920715e-05, -3.650784492492676e-05, -3.258511424064636e-05, -2.8662383556365967e-05, -2.473965287208557e-05, -2.0816922187805176e-05, -1.689419150352478e-05, -1.2971460819244385e-05, -9.04873013496399e-06, -5.125999450683594e-06, -1.2032687664031982e-06, 2.7194619178771973e-06, 6.642192602157593e-06, 1.0564923286437988e-05, 1.4487653970718384e-05, 1.841038465499878e-05, 2.2333115339279175e-05, 2.625584602355957e-05, 3.0178576707839966e-05, 3.410130739212036e-05, 3.802403807640076e-05, 4.194676876068115e-05, 4.586949944496155e-05, 4.979223012924194e-05, 5.371496081352234e-05, 5.7637691497802734e-05, 6.156042218208313e-05, 6.548315286636353e-05, 6.940588355064392e-05, 7.332861423492432e-05, 7.725134491920471e-05, 8.117407560348511e-05, 8.50968062877655e-05, 8.90195369720459e-05, 9.29422676563263e-05, 9.686499834060669e-05, 0.00010078772902488708, 0.00010471045970916748, 0.00010863319039344788, 0.00011255592107772827, 0.00011647865176200867, 0.00012040138244628906]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 9.0, 9.0, 11.0, 10.0, 23.0, 35.0, 44.0, 77.0, 112.0, 107.0, 216.0, 397.0, 767.0, 1717.0, 4504.0, 15374.0, 76243.0, 782251.0, 133798.0, 22540.0, 5836.0, 2221.0, 947.0, 480.0, 275.0, 168.0, 103.0, 82.0, 53.0, 36.0, 30.0, 26.0, 17.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2396240234375, -0.23204994201660156, -0.22447586059570312, -0.2169017791748047, -0.20932769775390625, -0.2017536163330078, -0.19417953491210938, -0.18660545349121094, -0.1790313720703125, -0.17145729064941406, -0.16388320922851562, -0.1563091278076172, -0.14873504638671875, -0.1411609649658203, -0.13358688354492188, -0.12601280212402344, -0.118438720703125, -0.11086463928222656, -0.10329055786132812, -0.09571647644042969, -0.08814239501953125, -0.08056831359863281, -0.07299423217773438, -0.06542015075683594, -0.0578460693359375, -0.05027198791503906, -0.042697906494140625, -0.03512382507324219, -0.02754974365234375, -0.019975662231445312, -0.012401580810546875, -0.0048274993896484375, 0.00274658203125, 0.010320663452148438, 0.017894744873046875, 0.025468826293945312, 0.03304290771484375, 0.04061698913574219, 0.048191070556640625, 0.05576515197753906, 0.0633392333984375, 0.07091331481933594, 0.07848739624023438, 0.08606147766113281, 0.09363555908203125, 0.10120964050292969, 0.10878372192382812, 0.11635780334472656, 0.123931884765625, 0.13150596618652344, 0.13908004760742188, 0.1466541290283203, 0.15422821044921875, 0.1618022918701172, 0.16937637329101562, 0.17695045471191406, 0.1845245361328125, 0.19209861755371094, 0.19967269897460938, 0.2072467803955078, 0.21482086181640625, 0.2223949432373047, 0.22996902465820312, 0.23754310607910156, 0.2451171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 7.0, 10.0, 7.0, 20.0, 16.0, 25.0, 41.0, 32.0, 55.0, 78.0, 83.0, 129.0, 105.0, 81.0, 49.0, 50.0, 35.0, 38.0, 28.0, 23.0, 14.0, 9.0, 7.0, 13.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15747833251953125, -0.1523590087890625, -0.14723968505859375, -0.142120361328125, -0.13700103759765625, -0.1318817138671875, -0.12676239013671875, -0.12164306640625, -0.11652374267578125, -0.1114044189453125, -0.10628509521484375, -0.101165771484375, -0.09604644775390625, -0.0909271240234375, -0.08580780029296875, -0.0806884765625, -0.07556915283203125, -0.0704498291015625, -0.06533050537109375, -0.060211181640625, -0.05509185791015625, -0.0499725341796875, -0.04485321044921875, -0.03973388671875, -0.03461456298828125, -0.0294952392578125, -0.02437591552734375, -0.019256591796875, -0.01413726806640625, -0.0090179443359375, -0.00389862060546875, 0.001220703125, 0.00634002685546875, 0.0114593505859375, 0.01657867431640625, 0.021697998046875, 0.02681732177734375, 0.0319366455078125, 0.03705596923828125, 0.04217529296875, 0.04729461669921875, 0.0524139404296875, 0.05753326416015625, 0.062652587890625, 0.06777191162109375, 0.0728912353515625, 0.07801055908203125, 0.0831298828125, 0.08824920654296875, 0.0933685302734375, 0.09848785400390625, 0.103607177734375, 0.10872650146484375, 0.1138458251953125, 0.11896514892578125, 0.12408447265625, 0.12920379638671875, 0.1343231201171875, 0.13944244384765625, 0.144561767578125, 0.14968109130859375, 0.1548004150390625, 0.15991973876953125, 0.1650390625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 16.0, 32.0, 52.0, 118.0, 242.0, 307.0, 97.0, 70.0, 27.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.929653644561768, -5.750265598297119, -5.570877552032471, -5.391489028930664, -5.212100982666016, -5.032712936401367, -4.853324890136719, -4.67393684387207, -4.494548797607422, -4.315160751342773, -4.135772705078125, -3.9563844203948975, -3.776996374130249, -3.5976080894470215, -3.418220043182373, -3.2388319969177246, -3.059443712234497, -2.8800556659698486, -2.700667381286621, -2.5212793350219727, -2.341891288757324, -2.162503242492676, -1.9831149578094482, -1.8037269115447998, -1.6243387460708618, -1.4449505805969238, -1.2655625343322754, -1.0861743688583374, -0.9067862629890442, -0.727398157119751, -0.548009991645813, -0.36862194538116455, -0.18923377990722656, -0.009845659136772156, 0.16954246163368225, 0.34893059730529785, 0.5283187031745911, 0.7077068090438843, 0.8870949745178223, 1.0664830207824707, 1.2458711862564087, 1.4252593517303467, 1.6046473979949951, 1.784035563468933, 1.963423728942871, 2.1428117752075195, 2.322199821472168, 2.5015878677368164, 2.680976152420044, 2.8603641986846924, 3.03975248336792, 3.2191405296325684, 3.398528575897217, 3.5779166221618652, 3.7573049068450928, 3.936692953109741, 4.116081237792969, 4.295469284057617, 4.474857330322266, 4.654245376586914, 4.833633899688721, 5.013021945953369, 5.192409992218018, 5.371798038482666, 5.5511860847473145]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 9.0, 8.0, 10.0, 9.0, 22.0, 30.0, 26.0, 33.0, 30.0, 37.0, 37.0, 34.0, 76.0, 160.0, 132.0, 57.0, 42.0, 31.0, 33.0, 26.0, 30.0, 23.0, 19.0, 22.0, 9.0, 7.0, 9.0, 10.0, 4.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.215944290161133, -2.1441547870635986, -2.0723655223846436, -2.0005760192871094, -1.9287867546081543, -1.8569972515106201, -1.7852078676223755, -1.7134184837341309, -1.6416290998458862, -1.5698397159576416, -1.498050332069397, -1.4262609481811523, -1.3544714450836182, -1.282682180404663, -1.210892677307129, -1.1391032934188843, -1.0673139095306396, -0.995524525642395, -0.9237351417541504, -0.851945698261261, -0.7801563143730164, -0.7083669304847717, -0.6365774869918823, -0.5647881031036377, -0.49299871921539307, -0.42120933532714844, -0.3494199216365814, -0.2776305079460144, -0.20584112405776978, -0.13405174016952515, -0.06226232647895813, 0.009527087211608887, 0.08131623268127441, 0.15310563147068024, 0.22489503026008606, 0.2966844439506531, 0.3684738278388977, 0.44026321172714233, 0.5120526552200317, 0.5838420391082764, 0.655631422996521, 0.7274208068847656, 0.7992101907730103, 0.8709996342658997, 0.9427890181541443, 1.0145783424377441, 1.0863678455352783, 1.158157229423523, 1.2299466133117676, 1.3017359972000122, 1.3735253810882568, 1.4453147649765015, 1.517104148864746, 1.5888936519622803, 1.660683035850525, 1.7324724197387695, 1.8042618036270142, 1.8760511875152588, 1.9478405714035034, 2.019629955291748, 2.0914194583892822, 2.1632087230682373, 2.2349982261657715, 2.3067874908447266, 2.3785769939422607]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 6.0, 8.0, 6.0, 8.0, 14.0, 24.0, 40.0, 57.0, 98.0, 138.0, 240.0, 366.0, 650.0, 1189.0, 2209.0, 4478.0, 9603.0, 23663.0, 73939.0, 405851.0, 2491321.0, 982681.0, 135332.0, 36057.0, 13831.0, 5985.0, 2908.0, 1436.0, 824.0, 483.0, 328.0, 179.0, 103.0, 90.0, 49.0, 33.0, 19.0, 16.0, 9.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31640625, -0.3075447082519531, -0.29868316650390625, -0.2898216247558594, -0.2809600830078125, -0.2720985412597656, -0.26323699951171875, -0.2543754577636719, -0.245513916015625, -0.23665237426757812, -0.22779083251953125, -0.21892929077148438, -0.2100677490234375, -0.20120620727539062, -0.19234466552734375, -0.18348312377929688, -0.17462158203125, -0.16576004028320312, -0.15689849853515625, -0.14803695678710938, -0.1391754150390625, -0.13031387329101562, -0.12145233154296875, -0.11259078979492188, -0.103729248046875, -0.09486770629882812, -0.08600616455078125, -0.07714462280273438, -0.0682830810546875, -0.059421539306640625, -0.05055999755859375, -0.041698455810546875, -0.0328369140625, -0.023975372314453125, -0.01511383056640625, -0.006252288818359375, 0.0026092529296875, 0.011470794677734375, 0.02033233642578125, 0.029193878173828125, 0.038055419921875, 0.046916961669921875, 0.05577850341796875, 0.06464004516601562, 0.0735015869140625, 0.08236312866210938, 0.09122467041015625, 0.10008621215820312, 0.10894775390625, 0.11780929565429688, 0.12667083740234375, 0.13553237915039062, 0.1443939208984375, 0.15325546264648438, 0.16211700439453125, 0.17097854614257812, 0.179840087890625, 0.18870162963867188, 0.19756317138671875, 0.20642471313476562, 0.2152862548828125, 0.22414779663085938, 0.23300933837890625, 0.24187088012695312, 0.250732421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 10.0, 12.0, 18.0, 13.0, 23.0, 24.0, 27.0, 33.0, 37.0, 43.0, 41.0, 40.0, 49.0, 56.0, 65.0, 53.0, 48.0, 42.0, 34.0, 53.0, 32.0, 39.0, 33.0, 38.0, 25.0, 14.0, 16.0, 12.0, 14.0, 10.0, 11.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093994140625, -0.09064769744873047, -0.08730125427246094, -0.0839548110961914, -0.08060836791992188, -0.07726192474365234, -0.07391548156738281, -0.07056903839111328, -0.06722259521484375, -0.06387615203857422, -0.06052970886230469, -0.057183265686035156, -0.053836822509765625, -0.050490379333496094, -0.04714393615722656, -0.04379749298095703, -0.0404510498046875, -0.03710460662841797, -0.03375816345214844, -0.030411720275878906, -0.027065277099609375, -0.023718833923339844, -0.020372390747070312, -0.01702594757080078, -0.01367950439453125, -0.010333061218261719, -0.0069866180419921875, -0.0036401748657226562, -0.000293731689453125, 0.0030527114868164062, 0.0063991546630859375, 0.009745597839355469, 0.013092041015625, 0.01643848419189453, 0.019784927368164062, 0.023131370544433594, 0.026477813720703125, 0.029824256896972656, 0.03317070007324219, 0.03651714324951172, 0.03986358642578125, 0.04321002960205078, 0.04655647277832031, 0.049902915954589844, 0.053249359130859375, 0.056595802307128906, 0.05994224548339844, 0.06328868865966797, 0.0666351318359375, 0.06998157501220703, 0.07332801818847656, 0.0766744613647461, 0.08002090454101562, 0.08336734771728516, 0.08671379089355469, 0.09006023406982422, 0.09340667724609375, 0.09675312042236328, 0.10009956359863281, 0.10344600677490234, 0.10679244995117188, 0.1101388931274414, 0.11348533630371094, 0.11683177947998047, 0.12017822265625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 21.0, 28.0, 29.0, 56.0, 108.0, 157.0, 343.0, 850.0, 2890.0, 55104.0, 4112161.0, 19310.0, 1869.0, 657.0, 302.0, 143.0, 79.0, 58.0, 21.0, 29.0, 15.0, 9.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8349609375, -1.7703094482421875, -1.705657958984375, -1.6410064697265625, -1.57635498046875, -1.5117034912109375, -1.447052001953125, -1.3824005126953125, -1.3177490234375, -1.2530975341796875, -1.188446044921875, -1.1237945556640625, -1.05914306640625, -0.9944915771484375, -0.929840087890625, -0.8651885986328125, -0.800537109375, -0.7358856201171875, -0.671234130859375, -0.6065826416015625, -0.54193115234375, -0.4772796630859375, -0.412628173828125, -0.3479766845703125, -0.2833251953125, -0.2186737060546875, -0.154022216796875, -0.0893707275390625, -0.02471923828125, 0.0399322509765625, 0.104583740234375, 0.1692352294921875, 0.23388671875, 0.2985382080078125, 0.363189697265625, 0.4278411865234375, 0.49249267578125, 0.5571441650390625, 0.621795654296875, 0.6864471435546875, 0.7510986328125, 0.8157501220703125, 0.880401611328125, 0.9450531005859375, 1.00970458984375, 1.0743560791015625, 1.139007568359375, 1.2036590576171875, 1.268310546875, 1.3329620361328125, 1.397613525390625, 1.4622650146484375, 1.52691650390625, 1.5915679931640625, 1.656219482421875, 1.7208709716796875, 1.7855224609375, 1.8501739501953125, 1.914825439453125, 1.9794769287109375, 2.04412841796875, 2.1087799072265625, 2.173431396484375, 2.2380828857421875, 2.302734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 19.0, 16.0, 23.0, 45.0, 76.0, 150.0, 333.0, 888.0, 1345.0, 652.0, 252.0, 140.0, 48.0, 35.0, 20.0, 18.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2260208129882812, -1.1912994384765625, -1.1565780639648438, -1.121856689453125, -1.0871353149414062, -1.0524139404296875, -1.0176925659179688, -0.98297119140625, -0.9482498168945312, -0.9135284423828125, -0.8788070678710938, -0.844085693359375, -0.8093643188476562, -0.7746429443359375, -0.7399215698242188, -0.7052001953125, -0.6704788208007812, -0.6357574462890625, -0.6010360717773438, -0.566314697265625, -0.5315933227539062, -0.4968719482421875, -0.46215057373046875, -0.42742919921875, -0.39270782470703125, -0.3579864501953125, -0.32326507568359375, -0.288543701171875, -0.25382232666015625, -0.2191009521484375, -0.18437957763671875, -0.149658203125, -0.11493682861328125, -0.0802154541015625, -0.04549407958984375, -0.010772705078125, 0.02394866943359375, 0.0586700439453125, 0.09339141845703125, 0.12811279296875, 0.16283416748046875, 0.1975555419921875, 0.23227691650390625, 0.266998291015625, 0.30171966552734375, 0.3364410400390625, 0.37116241455078125, 0.4058837890625, 0.44060516357421875, 0.4753265380859375, 0.5100479125976562, 0.544769287109375, 0.5794906616210938, 0.6142120361328125, 0.6489334106445312, 0.68365478515625, 0.7183761596679688, 0.7530975341796875, 0.7878189086914062, 0.822540283203125, 0.8572616577148438, 0.8919830322265625, 0.9267044067382812, 0.96142578125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 5.0, 11.0, 12.0, 31.0, 46.0, 104.0, 154.0, 210.0, 157.0, 107.0, 71.0, 36.0, 11.0, 15.0, 5.0, 4.0, 3.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.268807411193848, -10.009757995605469, -9.75070858001709, -9.491660118103027, -9.232610702514648, -8.97356128692627, -8.71451187133789, -8.455463409423828, -8.19641399383545, -7.93736457824707, -7.67831563949585, -7.419266223907471, -7.16021728515625, -6.901167869567871, -6.642118453979492, -6.3830695152282715, -6.124020099639893, -5.864970684051514, -5.605921745300293, -5.346872329711914, -5.087823390960693, -4.8287739753723145, -4.569725036621094, -4.310675621032715, -4.051626205444336, -3.792577028274536, -3.5335278511047363, -3.2744784355163574, -3.0154294967651367, -2.756380081176758, -2.497330904006958, -2.238281726837158, -1.9792327880859375, -1.7201836109161377, -1.461134433746338, -1.2020851373672485, -0.9430359601974487, -0.6839867830276489, -0.42493748664855957, -0.16588830947875977, 0.09316086769104004, 0.35221007466316223, 0.6112592816352844, 0.870308518409729, 1.1293576955795288, 1.3884068727493286, 1.647456169128418, 1.9065053462982178, 2.1655545234680176, 2.4246037006378174, 2.683652877807617, 2.942702293395996, 3.201751232147217, 3.4608006477355957, 3.7198498249053955, 3.9788990020751953, 4.237948417663574, 4.496997833251953, 4.756046772003174, 5.015096187591553, 5.274145126342773, 5.533194541931152, 5.792243957519531, 6.051292896270752, 6.310341835021973]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 9.0, 3.0, 18.0, 17.0, 16.0, 18.0, 11.0, 25.0, 16.0, 23.0, 32.0, 31.0, 35.0, 32.0, 28.0, 31.0, 41.0, 37.0, 44.0, 48.0, 38.0, 38.0, 51.0, 38.0, 33.0, 34.0, 34.0, 26.0, 17.0, 19.0, 25.0, 15.0, 18.0, 10.0, 11.0, 8.0, 13.0, 9.0, 5.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.7060012817382812, -2.62267804145813, -2.5393550395965576, -2.4560317993164062, -2.372708797454834, -2.2893855571746826, -2.2060623168945312, -2.122739315032959, -2.0394160747528076, -1.9560929536819458, -1.872769832611084, -1.7894465923309326, -1.7061234712600708, -1.622800350189209, -1.5394771099090576, -1.4561539888381958, -1.372830867767334, -1.2895077466964722, -1.2061846256256104, -1.122861385345459, -1.0395382642745972, -0.9562151432037354, -0.8728919625282288, -0.7895687818527222, -0.7062456607818604, -0.6229225397109985, -0.5395993590354919, -0.45627620816230774, -0.37295305728912354, -0.28962990641593933, -0.20630675554275513, -0.12298357486724854, -0.03966069221496582, 0.043662458658218384, 0.1269856095314026, 0.2103087604045868, 0.293631911277771, 0.3769550621509552, 0.4602782130241394, 0.543601393699646, 0.6269245147705078, 0.7102476358413696, 0.7935708165168762, 0.8768939971923828, 0.9602171182632446, 1.0435402393341064, 1.1268634796142578, 1.2101866006851196, 1.2935097217559814, 1.3768328428268433, 1.460155963897705, 1.5434792041778564, 1.6268023252487183, 1.71012544631958, 1.7934486865997314, 1.8767718076705933, 1.960094928741455, 2.0434181690216064, 2.1267411708831787, 2.21006441116333, 2.2933874130249023, 2.3767106533050537, 2.460033893585205, 2.5433568954467773, 2.6266801357269287]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 13.0, 14.0, 21.0, 15.0, 42.0, 50.0, 86.0, 129.0, 187.0, 290.0, 461.0, 730.0, 1208.0, 2055.0, 3941.0, 7502.0, 15962.0, 39178.0, 119987.0, 530996.0, 220783.0, 60192.0, 22731.0, 10081.0, 5085.0, 2721.0, 1574.0, 923.0, 509.0, 352.0, 236.0, 162.0, 101.0, 72.0, 53.0, 38.0, 19.0, 12.0, 14.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.342529296875, -0.33319854736328125, -0.3238677978515625, -0.31453704833984375, -0.305206298828125, -0.29587554931640625, -0.2865447998046875, -0.27721405029296875, -0.26788330078125, -0.25855255126953125, -0.2492218017578125, -0.23989105224609375, -0.230560302734375, -0.22122955322265625, -0.2118988037109375, -0.20256805419921875, -0.1932373046875, -0.18390655517578125, -0.1745758056640625, -0.16524505615234375, -0.155914306640625, -0.14658355712890625, -0.1372528076171875, -0.12792205810546875, -0.11859130859375, -0.10926055908203125, -0.0999298095703125, -0.09059906005859375, -0.081268310546875, -0.07193756103515625, -0.0626068115234375, -0.05327606201171875, -0.0439453125, -0.03461456298828125, -0.0252838134765625, -0.01595306396484375, -0.006622314453125, 0.00270843505859375, 0.0120391845703125, 0.02136993408203125, 0.03070068359375, 0.04003143310546875, 0.0493621826171875, 0.05869293212890625, 0.068023681640625, 0.07735443115234375, 0.0866851806640625, 0.09601593017578125, 0.1053466796875, 0.11467742919921875, 0.1240081787109375, 0.13333892822265625, 0.142669677734375, 0.15200042724609375, 0.1613311767578125, 0.17066192626953125, 0.17999267578125, 0.18932342529296875, 0.1986541748046875, 0.20798492431640625, 0.217315673828125, 0.22664642333984375, 0.2359771728515625, 0.24530792236328125, 0.254638671875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 4.0, 11.0, 12.0, 5.0, 19.0, 18.0, 21.0, 21.0, 25.0, 25.0, 35.0, 51.0, 54.0, 44.0, 68.0, 53.0, 54.0, 59.0, 47.0, 47.0, 44.0, 43.0, 31.0, 31.0, 26.0, 24.0, 27.0, 13.0, 18.0, 13.0, 11.0, 11.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.2120361328125, -0.20607566833496094, -0.20011520385742188, -0.1941547393798828, -0.18819427490234375, -0.1822338104248047, -0.17627334594726562, -0.17031288146972656, -0.1643524169921875, -0.15839195251464844, -0.15243148803710938, -0.1464710235595703, -0.14051055908203125, -0.1345500946044922, -0.12858963012695312, -0.12262916564941406, -0.116668701171875, -0.11070823669433594, -0.10474777221679688, -0.09878730773925781, -0.09282684326171875, -0.08686637878417969, -0.08090591430664062, -0.07494544982910156, -0.0689849853515625, -0.06302452087402344, -0.057064056396484375, -0.05110359191894531, -0.04514312744140625, -0.03918266296386719, -0.033222198486328125, -0.027261734008789062, -0.02130126953125, -0.015340805053710938, -0.009380340576171875, -0.0034198760986328125, 0.00254058837890625, 0.008501052856445312, 0.014461517333984375, 0.020421981811523438, 0.0263824462890625, 0.03234291076660156, 0.038303375244140625, 0.04426383972167969, 0.05022430419921875, 0.05618476867675781, 0.062145233154296875, 0.06810569763183594, 0.074066162109375, 0.08002662658691406, 0.08598709106445312, 0.09194755554199219, 0.09790802001953125, 0.10386848449707031, 0.10982894897460938, 0.11578941345214844, 0.1217498779296875, 0.12771034240722656, 0.13367080688476562, 0.1396312713623047, 0.14559173583984375, 0.1515522003173828, 0.15751266479492188, 0.16347312927246094, 0.16943359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 5.0, 8.0, 9.0, 10.0, 21.0, 23.0, 50.0, 61.0, 95.0, 171.0, 291.0, 700.0, 1656.0, 6759.0, 77194.0, 929132.0, 26415.0, 3686.0, 1096.0, 472.0, 260.0, 146.0, 96.0, 61.0, 44.0, 26.0, 17.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.04296875, -1.0177230834960938, -0.9924774169921875, -0.9672317504882812, -0.941986083984375, -0.9167404174804688, -0.8914947509765625, -0.8662490844726562, -0.84100341796875, -0.8157577514648438, -0.7905120849609375, -0.7652664184570312, -0.740020751953125, -0.7147750854492188, -0.6895294189453125, -0.6642837524414062, -0.6390380859375, -0.6137924194335938, -0.5885467529296875, -0.5633010864257812, -0.538055419921875, -0.5128097534179688, -0.4875640869140625, -0.46231842041015625, -0.43707275390625, -0.41182708740234375, -0.3865814208984375, -0.36133575439453125, -0.336090087890625, -0.31084442138671875, -0.2855987548828125, -0.26035308837890625, -0.235107421875, -0.20986175537109375, -0.1846160888671875, -0.15937042236328125, -0.134124755859375, -0.10887908935546875, -0.0836334228515625, -0.05838775634765625, -0.03314208984375, -0.00789642333984375, 0.0173492431640625, 0.04259490966796875, 0.067840576171875, 0.09308624267578125, 0.1183319091796875, 0.14357757568359375, 0.1688232421875, 0.19406890869140625, 0.2193145751953125, 0.24456024169921875, 0.269805908203125, 0.29505157470703125, 0.3202972412109375, 0.34554290771484375, 0.37078857421875, 0.39603424072265625, 0.4212799072265625, 0.44652557373046875, 0.471771240234375, 0.49701690673828125, 0.5222625732421875, 0.5475082397460938, 0.57275390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 2.0, 5.0, 8.0, 8.0, 7.0, 15.0, 8.0, 16.0, 14.0, 23.0, 21.0, 28.0, 41.0, 26.0, 62.0, 90.0, 91.0, 93.0, 75.0, 52.0, 50.0, 45.0, 39.0, 32.0, 28.0, 24.0, 18.0, 12.0, 7.0, 11.0, 11.0, 7.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0], "bins": [-1.0595703125, -1.0318145751953125, -1.004058837890625, -0.9763031005859375, -0.94854736328125, -0.9207916259765625, -0.893035888671875, -0.8652801513671875, -0.8375244140625, -0.8097686767578125, -0.782012939453125, -0.7542572021484375, -0.72650146484375, -0.6987457275390625, -0.670989990234375, -0.6432342529296875, -0.615478515625, -0.5877227783203125, -0.559967041015625, -0.5322113037109375, -0.50445556640625, -0.4766998291015625, -0.448944091796875, -0.4211883544921875, -0.3934326171875, -0.3656768798828125, -0.337921142578125, -0.3101654052734375, -0.28240966796875, -0.2546539306640625, -0.226898193359375, -0.1991424560546875, -0.17138671875, -0.1436309814453125, -0.115875244140625, -0.0881195068359375, -0.06036376953125, -0.0326080322265625, -0.004852294921875, 0.0229034423828125, 0.0506591796875, 0.0784149169921875, 0.106170654296875, 0.1339263916015625, 0.16168212890625, 0.1894378662109375, 0.217193603515625, 0.2449493408203125, 0.272705078125, 0.3004608154296875, 0.328216552734375, 0.3559722900390625, 0.38372802734375, 0.4114837646484375, 0.439239501953125, 0.4669952392578125, 0.4947509765625, 0.5225067138671875, 0.550262451171875, 0.5780181884765625, 0.60577392578125, 0.6335296630859375, 0.661285400390625, 0.6890411376953125, 0.716796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 12.0, 16.0, 16.0, 24.0, 27.0, 53.0, 73.0, 134.0, 190.0, 379.0, 777.0, 1785.0, 5782.0, 27469.0, 874010.0, 118342.0, 13480.0, 3447.0, 1274.0, 545.0, 267.0, 136.0, 92.0, 59.0, 40.0, 21.0, 20.0, 19.0, 3.0, 9.0, 8.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1888427734375, -0.18308448791503906, -0.17732620239257812, -0.1715679168701172, -0.16580963134765625, -0.1600513458251953, -0.15429306030273438, -0.14853477478027344, -0.1427764892578125, -0.13701820373535156, -0.13125991821289062, -0.1255016326904297, -0.11974334716796875, -0.11398506164550781, -0.10822677612304688, -0.10246849060058594, -0.096710205078125, -0.09095191955566406, -0.08519363403320312, -0.07943534851074219, -0.07367706298828125, -0.06791877746582031, -0.062160491943359375, -0.05640220642089844, -0.0506439208984375, -0.04488563537597656, -0.039127349853515625, -0.03336906433105469, -0.02761077880859375, -0.021852493286132812, -0.016094207763671875, -0.010335922241210938, -0.00457763671875, 0.0011806488037109375, 0.006938934326171875, 0.012697219848632812, 0.01845550537109375, 0.024213790893554688, 0.029972076416015625, 0.03573036193847656, 0.0414886474609375, 0.04724693298339844, 0.053005218505859375, 0.05876350402832031, 0.06452178955078125, 0.07028007507324219, 0.07603836059570312, 0.08179664611816406, 0.087554931640625, 0.09331321716308594, 0.09907150268554688, 0.10482978820800781, 0.11058807373046875, 0.11634635925292969, 0.12210464477539062, 0.12786293029785156, 0.1336212158203125, 0.13937950134277344, 0.14513778686523438, 0.1508960723876953, 0.15665435791015625, 0.1624126434326172, 0.16817092895507812, 0.17392921447753906, 0.1796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 5.0, 6.0, 6.0, 9.0, 14.0, 19.0, 26.0, 23.0, 66.0, 117.0, 243.0, 185.0, 105.0, 54.0, 19.0, 18.0, 26.0, 16.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010758638381958008, -0.00010372977703809738, -9.987317025661469e-05, -9.601656347513199e-05, -9.215995669364929e-05, -8.83033499121666e-05, -8.44467431306839e-05, -8.05901363492012e-05, -7.67335295677185e-05, -7.287692278623581e-05, -6.902031600475311e-05, -6.516370922327042e-05, -6.130710244178772e-05, -5.745049566030502e-05, -5.359388887882233e-05, -4.973728209733963e-05, -4.5880675315856934e-05, -4.202406853437424e-05, -3.816746175289154e-05, -3.4310854971408844e-05, -3.0454248189926147e-05, -2.659764140844345e-05, -2.2741034626960754e-05, -1.8884427845478058e-05, -1.5027821063995361e-05, -1.1171214282512665e-05, -7.314607501029968e-06, -3.4580007195472717e-06, 3.986060619354248e-07, 4.255212843418121e-06, 8.111819624900818e-06, 1.1968426406383514e-05, 1.582503318786621e-05, 1.9681639969348907e-05, 2.3538246750831604e-05, 2.73948535323143e-05, 3.1251460313797e-05, 3.5108067095279694e-05, 3.896467387676239e-05, 4.282128065824509e-05, 4.667788743972778e-05, 5.053449422121048e-05, 5.4391101002693176e-05, 5.824770778417587e-05, 6.210431456565857e-05, 6.596092134714127e-05, 6.981752812862396e-05, 7.367413491010666e-05, 7.753074169158936e-05, 8.138734847307205e-05, 8.524395525455475e-05, 8.910056203603745e-05, 9.295716881752014e-05, 9.681377559900284e-05, 0.00010067038238048553, 0.00010452698916196823, 0.00010838359594345093, 0.00011224020272493362, 0.00011609680950641632, 0.00011995341628789902, 0.00012381002306938171, 0.0001276666298508644, 0.0001315232366323471, 0.0001353798434138298, 0.0001392364501953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 14.0, 21.0, 43.0, 50.0, 75.0, 164.0, 332.0, 651.0, 1367.0, 2797.0, 7102.0, 22917.0, 180086.0, 785593.0, 31646.0, 9074.0, 3538.0, 1544.0, 713.0, 374.0, 198.0, 101.0, 53.0, 30.0, 20.0, 8.0, 11.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1795654296875, -0.17485427856445312, -0.17014312744140625, -0.16543197631835938, -0.1607208251953125, -0.15600967407226562, -0.15129852294921875, -0.14658737182617188, -0.141876220703125, -0.13716506958007812, -0.13245391845703125, -0.12774276733398438, -0.1230316162109375, -0.11832046508789062, -0.11360931396484375, -0.10889816284179688, -0.10418701171875, -0.09947586059570312, -0.09476470947265625, -0.09005355834960938, -0.0853424072265625, -0.08063125610351562, -0.07592010498046875, -0.07120895385742188, -0.066497802734375, -0.061786651611328125, -0.05707550048828125, -0.052364349365234375, -0.0476531982421875, -0.042942047119140625, -0.03823089599609375, -0.033519744873046875, -0.02880859375, -0.024097442626953125, -0.01938629150390625, -0.014675140380859375, -0.0099639892578125, -0.005252838134765625, -0.00054168701171875, 0.004169464111328125, 0.008880615234375, 0.013591766357421875, 0.01830291748046875, 0.023014068603515625, 0.0277252197265625, 0.032436370849609375, 0.03714752197265625, 0.041858673095703125, 0.04656982421875, 0.051280975341796875, 0.05599212646484375, 0.060703277587890625, 0.0654144287109375, 0.07012557983398438, 0.07483673095703125, 0.07954788208007812, 0.084259033203125, 0.08897018432617188, 0.09368133544921875, 0.09839248657226562, 0.1031036376953125, 0.10781478881835938, 0.11252593994140625, 0.11723709106445312, 0.1219482421875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 12.0, 4.0, 16.0, 30.0, 35.0, 41.0, 78.0, 149.0, 176.0, 165.0, 108.0, 58.0, 40.0, 32.0, 16.0, 16.0, 11.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2376708984375, -0.23200035095214844, -0.22632980346679688, -0.2206592559814453, -0.21498870849609375, -0.2093181610107422, -0.20364761352539062, -0.19797706604003906, -0.1923065185546875, -0.18663597106933594, -0.18096542358398438, -0.1752948760986328, -0.16962432861328125, -0.1639537811279297, -0.15828323364257812, -0.15261268615722656, -0.146942138671875, -0.14127159118652344, -0.13560104370117188, -0.1299304962158203, -0.12425994873046875, -0.11858940124511719, -0.11291885375976562, -0.10724830627441406, -0.1015777587890625, -0.09590721130371094, -0.09023666381835938, -0.08456611633300781, -0.07889556884765625, -0.07322502136230469, -0.06755447387695312, -0.06188392639160156, -0.05621337890625, -0.05054283142089844, -0.044872283935546875, -0.03920173645019531, -0.03353118896484375, -0.027860641479492188, -0.022190093994140625, -0.016519546508789062, -0.0108489990234375, -0.0051784515380859375, 0.000492095947265625, 0.0061626434326171875, 0.01183319091796875, 0.017503738403320312, 0.023174285888671875, 0.028844833374023438, 0.034515380859375, 0.04018592834472656, 0.045856475830078125, 0.05152702331542969, 0.05719757080078125, 0.06286811828613281, 0.06853866577148438, 0.07420921325683594, 0.0798797607421875, 0.08555030822753906, 0.09122085571289062, 0.09689140319824219, 0.10256195068359375, 0.10823249816894531, 0.11390304565429688, 0.11957359313964844, 0.125244140625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 11.0, 20.0, 42.0, 76.0, 141.0, 513.0, 98.0, 44.0, 18.0, 12.0, 11.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.130375862121582, -4.976040840148926, -4.821706295013428, -4.66737174987793, -4.513036727905273, -4.358701705932617, -4.204367160797119, -4.050032615661621, -3.895697593688965, -3.7413628101348877, -3.5870280265808105, -3.4326932430267334, -3.2783584594726562, -3.124023675918579, -2.969688892364502, -2.815354108810425, -2.6610193252563477, -2.5066845417022705, -2.3523497581481934, -2.198014974594116, -2.043680191040039, -1.889345407485962, -1.7350106239318848, -1.5806758403778076, -1.4263410568237305, -1.2720062732696533, -1.1176714897155762, -0.963336706161499, -0.8090019226074219, -0.6546671390533447, -0.5003323554992676, -0.34599757194519043, -0.19166278839111328, -0.03732800483703613, 0.11700677871704102, 0.27134156227111816, 0.4256763458251953, 0.5800111293792725, 0.7343459129333496, 0.8886806964874268, 1.043015480041504, 1.197350263595581, 1.3516850471496582, 1.5060198307037354, 1.6603546142578125, 1.8146893978118896, 1.9690241813659668, 2.123358964920044, 2.277693748474121, 2.4320285320281982, 2.5863633155822754, 2.7406980991363525, 2.8950328826904297, 3.049367666244507, 3.203702449798584, 3.358037233352661, 3.5123720169067383, 3.6667068004608154, 3.8210415840148926, 3.9753763675689697, 4.129711151123047, 4.284046173095703, 4.438380718231201, 4.592715263366699, 4.7470502853393555]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 12.0, 6.0, 6.0, 12.0, 11.0, 15.0, 22.0, 16.0, 11.0, 20.0, 19.0, 16.0, 24.0, 30.0, 41.0, 177.0, 315.0, 36.0, 26.0, 27.0, 25.0, 19.0, 22.0, 19.0, 13.0, 15.0, 14.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0], "bins": [-3.386681079864502, -3.3045144081115723, -3.2223479747772217, -3.140181303024292, -3.0580148696899414, -2.9758481979370117, -2.893681764602661, -2.8115150928497314, -2.729348659515381, -2.647181987762451, -2.5650155544281006, -2.482848882675171, -2.4006824493408203, -2.3185157775878906, -2.23634934425354, -2.1541826725006104, -2.0720162391662598, -1.9898496866226196, -1.9076831340789795, -1.8255165815353394, -1.7433500289916992, -1.661183476448059, -1.579016923904419, -1.4968502521514893, -1.4146835803985596, -1.3325170278549194, -1.2503504753112793, -1.1681839227676392, -1.086017370223999, -1.0038508176803589, -0.921684205532074, -0.8395176529884338, -0.7573510408401489, -0.6751844882965088, -0.5930179357528687, -0.5108513832092285, -0.428684800863266, -0.34651824831962585, -0.26435166597366333, -0.1821851134300232, -0.10001856088638306, -0.017852000892162323, 0.06431455910205841, 0.14648112654685974, 0.22864767909049988, 0.31081423163414, 0.39298081398010254, 0.4751473665237427, 0.5573139190673828, 0.639480471611023, 0.7216470241546631, 0.8038135766983032, 0.8859801292419434, 0.9681466817855835, 1.0503132343292236, 1.1324799060821533, 1.214646339416504, 1.296812891960144, 1.3789794445037842, 1.4611459970474243, 1.5433125495910645, 1.6254791021347046, 1.7076456546783447, 1.7898123264312744, 1.8719788789749146]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 9.0, 16.0, 15.0, 23.0, 36.0, 43.0, 60.0, 76.0, 253.0, 180.0, 88.0, 50.0, 37.0, 30.0, 25.0, 13.0, 4.0, 10.0, 13.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.308349609375, -0.298370361328125, -0.28839111328125, -0.278411865234375, -0.2684326171875, -0.258453369140625, -0.24847412109375, -0.238494873046875, -0.228515625, -0.218536376953125, -0.20855712890625, -0.198577880859375, -0.1885986328125, -0.178619384765625, -0.16864013671875, -0.158660888671875, -0.148681640625, -0.138702392578125, -0.12872314453125, -0.118743896484375, -0.1087646484375, -0.098785400390625, -0.08880615234375, -0.078826904296875, -0.06884765625, -0.058868408203125, -0.04888916015625, -0.038909912109375, -0.0289306640625, -0.018951416015625, -0.00897216796875, 0.001007080078125, 0.010986328125, 0.020965576171875, 0.03094482421875, 0.040924072265625, 0.0509033203125, 0.060882568359375, 0.07086181640625, 0.080841064453125, 0.0908203125, 0.100799560546875, 0.11077880859375, 0.120758056640625, 0.1307373046875, 0.140716552734375, 0.15069580078125, 0.160675048828125, 0.170654296875, 0.180633544921875, 0.19061279296875, 0.200592041015625, 0.2105712890625, 0.220550537109375, 0.23052978515625, 0.240509033203125, 0.25048828125, 0.260467529296875, 0.27044677734375, 0.280426025390625, 0.2904052734375, 0.300384521484375, 0.31036376953125, 0.320343017578125, 0.330322265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 12.0, 6.0, 18.0, 23.0, 28.0, 42.0, 60.0, 114.0, 166.0, 316.0, 633.0, 1475.0, 4267.0, 25872.0, 8331700.0, 17649.0, 3532.0, 1331.0, 572.0, 250.0, 166.0, 107.0, 58.0, 50.0, 17.0, 32.0, 19.0, 12.0, 5.0, 3.0, 2.0, 6.0, 1.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0], "bins": [-1.7317419052124023, -1.6708252429962158, -1.6099085807800293, -1.5489919185638428, -1.4880752563476562, -1.4271585941314697, -1.3662419319152832, -1.3053252696990967, -1.2444086074829102, -1.1834919452667236, -1.122575283050537, -1.0616586208343506, -1.000741958618164, -0.9398252964019775, -0.878908634185791, -0.8179919719696045, -0.7570752501487732, -0.6961585879325867, -0.6352419257164001, -0.5743252635002136, -0.5134086012840271, -0.4524919092655182, -0.39157524704933167, -0.33065858483314514, -0.2697419226169586, -0.2088252604007721, -0.14790859818458557, -0.08699192106723785, -0.02607525885105133, 0.03484141826629639, 0.09575808048248291, 0.15667474269866943, 0.21759140491485596, 0.2785080671310425, 0.339424729347229, 0.4003413915634155, 0.46125805377960205, 0.5221747159957886, 0.5830913782119751, 0.6440080404281616, 0.7049247026443481, 0.7658413648605347, 0.8267580270767212, 0.8876746892929077, 0.9485913515090942, 1.0095080137252808, 1.0704246759414673, 1.1313413381576538, 1.1922581195831299, 1.2531747817993164, 1.314091444015503, 1.3750081062316895, 1.435924768447876, 1.4968414306640625, 1.557758092880249, 1.6186747550964355, 1.679591417312622, 1.7405080795288086, 1.8014247417449951, 1.8623414039611816, 1.9232580661773682, 1.9841747283935547, 2.045091390609741, 2.1060080528259277, 2.1669247150421143]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 1.0, 3.0, 2.0, 8.0, 5.0, 6.0, 7.0, 10.0, 5.0, 4.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8577942848205566, -2.7734146118164062, -2.689034938812256, -2.6046550273895264, -2.520275354385376, -2.4358956813812256, -2.351515769958496, -2.2671360969543457, -2.1827564239501953, -2.098376750946045, -2.0139970779418945, -1.929617166519165, -1.8452374935150146, -1.7608578205108643, -1.6764780282974243, -1.5920982360839844, -1.507718563079834, -1.4233388900756836, -1.3389590978622437, -1.2545793056488037, -1.1701996326446533, -1.085819959640503, -1.001440167427063, -0.9170604348182678, -0.8326807022094727, -0.7483009696006775, -0.6639212369918823, -0.5795415043830872, -0.495161771774292, -0.4107820391654968, -0.32640230655670166, -0.2420225739479065, -0.15764260292053223, -0.07326287031173706, 0.011116862297058105, 0.09549659490585327, 0.17987632751464844, 0.2642560601234436, 0.34863579273223877, 0.43301552534103394, 0.5173952579498291, 0.6017749905586243, 0.6861547231674194, 0.7705344557762146, 0.8549141883850098, 0.9392939209938049, 1.0236736536026, 1.10805344581604, 1.1924331188201904, 1.2768127918243408, 1.3611925840377808, 1.4455723762512207, 1.529952049255371, 1.6143317222595215, 1.6987115144729614, 1.7830913066864014, 1.8674709796905518, 1.9518506526947021, 2.0362305641174316, 2.120610237121582, 2.2049899101257324, 2.289369583129883, 2.373749256134033, 2.4581291675567627, 2.542508840560913]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 12.0, 7.0, 16.0, 25.0, 44.0, 47.0, 82.0, 141.0, 219.0, 312.0, 593.0, 963.0, 1855.0, 3721.0, 8386.0, 22768.0, 74462.0, 219653.0, 130399.0, 37076.0, 12770.0, 5188.0, 2429.0, 1273.0, 751.0, 409.0, 245.0, 138.0, 106.0, 65.0, 38.0, 32.0, 13.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7314453125, -1.6666412353515625, -1.601837158203125, -1.5370330810546875, -1.47222900390625, -1.4074249267578125, -1.342620849609375, -1.2778167724609375, -1.2130126953125, -1.1482086181640625, -1.083404541015625, -1.0186004638671875, -0.95379638671875, -0.8889923095703125, -0.824188232421875, -0.7593841552734375, -0.694580078125, -0.6297760009765625, -0.564971923828125, -0.5001678466796875, -0.43536376953125, -0.3705596923828125, -0.305755615234375, -0.2409515380859375, -0.1761474609375, -0.1113433837890625, -0.046539306640625, 0.0182647705078125, 0.08306884765625, 0.1478729248046875, 0.212677001953125, 0.2774810791015625, 0.34228515625, 0.4070892333984375, 0.471893310546875, 0.5366973876953125, 0.60150146484375, 0.6663055419921875, 0.731109619140625, 0.7959136962890625, 0.8607177734375, 0.9255218505859375, 0.990325927734375, 1.0551300048828125, 1.11993408203125, 1.1847381591796875, 1.249542236328125, 1.3143463134765625, 1.379150390625, 1.4439544677734375, 1.508758544921875, 1.5735626220703125, 1.63836669921875, 1.7031707763671875, 1.767974853515625, 1.8327789306640625, 1.8975830078125, 1.9623870849609375, 2.027191162109375, 2.0919952392578125, 2.15679931640625, 2.2216033935546875, 2.286407470703125, 2.3512115478515625, 2.416015625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 10.0, 5.0, 10.0, 21.0, 26.0, 41.0, 56.0, 70.0, 103.0, 107.0, 116.0, 106.0, 85.0, 50.0, 48.0, 35.0, 35.0, 21.0, 13.0, 13.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.23921775817871094, -0.22904586791992188, -0.2188739776611328, -0.20870208740234375, -0.1985301971435547, -0.18835830688476562, -0.17818641662597656, -0.1680145263671875, -0.15784263610839844, -0.14767074584960938, -0.1374988555908203, -0.12732696533203125, -0.11715507507324219, -0.10698318481445312, -0.09681129455566406, -0.086639404296875, -0.07646751403808594, -0.06629562377929688, -0.05612373352050781, -0.04595184326171875, -0.03577995300292969, -0.025608062744140625, -0.015436172485351562, -0.0052642822265625, 0.0049076080322265625, 0.015079498291015625, 0.025251388549804688, 0.03542327880859375, 0.04559516906738281, 0.055767059326171875, 0.06593894958496094, 0.07611083984375, 0.08628273010253906, 0.09645462036132812, 0.10662651062011719, 0.11679840087890625, 0.1269702911376953, 0.13714218139648438, 0.14731407165527344, 0.1574859619140625, 0.16765785217285156, 0.17782974243164062, 0.1880016326904297, 0.19817352294921875, 0.2083454132080078, 0.21851730346679688, 0.22868919372558594, 0.238861083984375, 0.24903297424316406, 0.2592048645019531, 0.2693767547607422, 0.27954864501953125, 0.2897205352783203, 0.2998924255371094, 0.31006431579589844, 0.3202362060546875, 0.33040809631347656, 0.3405799865722656, 0.3507518768310547, 0.36092376708984375, 0.3710956573486328, 0.3812675476074219, 0.39143943786621094, 0.401611328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 4.0, 9.0, 10.0, 15.0, 16.0, 29.0, 64.0, 113.0, 86.0, 45.0, 37.0, 15.0, 17.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1321091651916504, -3.0421223640441895, -2.9521355628967285, -2.8621485233306885, -2.7721617221832275, -2.6821749210357666, -2.5921881198883057, -2.5022010803222656, -2.4122142791748047, -2.3222274780273438, -2.232240676879883, -2.1422536373138428, -2.052266836166382, -1.962280035018921, -1.87229323387146, -1.7823063135147095, -1.6923195123672485, -1.6023327112197876, -1.512345790863037, -1.4223589897155762, -1.3323720693588257, -1.2423852682113647, -1.1523983478546143, -1.0624115467071533, -0.9724246859550476, -0.8824378252029419, -0.7924509644508362, -0.7024641036987305, -0.6124773025512695, -0.522490382194519, -0.4325035810470581, -0.3425167202949524, -0.2525298595428467, -0.16254299879074097, -0.07255615293979645, 0.01743069291114807, 0.10741755366325378, 0.1974044144153595, 0.2873912453651428, 0.37737810611724854, 0.46736496686935425, 0.55735182762146, 0.6473386883735657, 0.7373255491256714, 0.8273123502731323, 0.9172992706298828, 1.0072860717773438, 1.0972728729248047, 1.1872597932815552, 1.2772465944290161, 1.3672335147857666, 1.4572203159332275, 1.547207236289978, 1.637194037437439, 1.7271809577941895, 1.8171677589416504, 1.9071545600891113, 1.9971413612365723, 2.087128162384033, 2.1771152019500732, 2.267102003097534, 2.357088804244995, 2.447075605392456, 2.537062644958496, 2.627049446105957]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 19.0, 35.0, 50.0, 80.0, 77.0, 78.0, 36.0, 22.0, 13.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.452475905418396, -1.411645531654358, -1.3708150386810303, -1.3299846649169922, -1.289154291152954, -1.248323917388916, -1.207493543624878, -1.1666630506515503, -1.1258326768875122, -1.0850023031234741, -1.0441718101501465, -1.0033414363861084, -0.9625110626220703, -0.9216806888580322, -0.8808502554893494, -0.8400198221206665, -0.7991894483566284, -0.7583590745925903, -0.7175286412239075, -0.6766982078552246, -0.6358678340911865, -0.5950374603271484, -0.5542070269584656, -0.5133765935897827, -0.47254621982574463, -0.43171581625938416, -0.3908854126930237, -0.3500550091266632, -0.30922460556030273, -0.26839420199394226, -0.2275637984275818, -0.1867333948612213, -0.1459031105041504, -0.10507270693778992, -0.06424230337142944, -0.02341189980506897, 0.017418503761291504, 0.05824890732765198, 0.09907931089401245, 0.13990971446037292, 0.1807401180267334, 0.22157052159309387, 0.26240092515945435, 0.3032313287258148, 0.3440617322921753, 0.38489213585853577, 0.42572253942489624, 0.4665529429912567, 0.5073833465576172, 0.5482137203216553, 0.5890441536903381, 0.629874587059021, 0.6707049608230591, 0.7115353345870972, 0.75236576795578, 0.7931962013244629, 0.834026575088501, 0.8748569488525391, 0.9156873822212219, 0.9565178155899048, 0.9973481893539429, 1.038178563117981, 1.0790090560913086, 1.1198394298553467, 1.1606698036193848]}, "_wandb": {"runtime": 3640}}